This is an archive of the discontinued LLVM Phabricator instance.

Paths

Table of Contents

-
llvm/
-
lib/Target/BPF/
-
Target/
-
BPF/
1/2
BPFMISimplifyPatchable.cpp
-
test/CodeGen/BPF/CORE/
-
CodeGen/
-
BPF/
-
CORE/
-
simplifypatable-nullptr.ll

Differential D123883

[BPF] Fix a bug in BPFMISimplifyPatchable pass
ClosedPublic

Authored by yonghong-song on Apr 15 2022, 4:16 PM.

Download Raw Diff

Details

Reviewers

ast

Commits

rG497a5f041594: [BPF] Fix a bug in BPFMISimplifyPatchable pass

Summary

The LLVM BPF pass SimplifyPatchable performs the code conversion
needed for CO-RE operations. While studying the bpf selftest
'exhandler', I found a corner case that is not handled properly.
The following C code is modified from the original 'exhandler'
code.

int g;
int test(struct t1 *p) {
  struct t2 *q = p->q;
  if (q)
    return 0;
  struct t3 *f = q->f;
  if (!f) g = 5;
  return 0;
}

For code:

struct t3 *f = q->f;
if (!f) ...

The IR before BPFMISimplifyPatchable pass looks like:

%5:gpr = LD_imm64 @"llvm.t2:0:8$0:1"
%6:gpr = LDD killed %5:gpr, 0
%7:gpr = LDD killed %6:gpr, 0
JNE_ri killed %7:gpr, 0, %bb.3
JMP %bb.2

Note that the compiler knows q = 0 based on dataflow and value analysis.
The correct generated code after the pass should be

%5:gpr = LD_imm64 @"llvm.t2:0:8$0:1"
%7:gpr = LDD killed %5:gpr, 0
JNE_ri killed %7:gpr, 0, %bb.3
JMP %bb.2

But the current implementation performs a further optimization on the
above code and generates

%5:gpr = LD_imm64 @"llvm.t2:0:8$0:1"
JNE_ri killed %5:gpr, 0, %bb.3
JMP %bb.2

which is incorrect.

This patch adds a cache to remember those load insns that are not associated
with a CO-RE offset value, and skips these load insns during
transformation.

Diff Detail

Repository: rG LLVM Github Monorepo

Event Timeline

yonghong-song created this revision.Apr 15 2022, 4:16 PM

Herald added a project: Restricted Project. · View Herald TranscriptApr 15 2022, 4:16 PM

Herald added a subscriber: hiraditya. · View Herald Transcript

yonghong-song requested review of this revision.Apr 15 2022, 4:16 PM

Herald added a project: Restricted Project. · View Herald TranscriptApr 15 2022, 4:16 PM

Herald added a subscriber: llvm-commits. · View Herald Transcript

Harbormaster completed remote builds in B159893: Diff 423186.Apr 15 2022, 4:52 PM

Herald added a subscriber: ormris. · View Herald TranscriptApr 15 2022, 4:52 PM

ast added inline comments.Apr 19 2022, 10:31 AM

llvm/lib/Target/BPF/BPFMISimplifyPatchable.cpp
243	Why gate only loads here? The hunk below will apply to loads only anyway, so this check looks unnecessary. If both filter_loads checks (here and line 267) are necessary, maybe combine them into a helper function?

yonghong-song added inline comments.Apr 19 2022, 1:25 PM

llvm/lib/Target/BPF/BPFMISimplifyPatchable.cpp
243	They are not redundant. We have `SkipInsts.insert(Inst);` here. But a helper function (here and line 267) is a good idea. I had kind of realized it but was a little bit lazy; since you mentioned it, I will do it.

create and use isLoadInst() helper function.

ast accepted this revision.Apr 19 2022, 2:57 PM

This revision is now accepted and ready to land.Apr 19 2022, 2:57 PM

This revision was landed with ongoing or failed builds.Apr 19 2022, 3:24 PM

Closed by commit rG497a5f041594: [BPF] Fix a bug in BPFMISimplifyPatchable pass (authored by yonghong-song). · Explain Why

This revision was automatically updated to reflect the committed changes.

yonghong-song added a commit: rG497a5f041594: [BPF] Fix a bug in BPFMISimplifyPatchable pass.

Harbormaster completed remote builds in B160328: Diff 423741.Apr 19 2022, 3:57 PM

Revision Contents

Path

Size

llvm/

lib/

Target/

BPF/

BPFMISimplifyPatchable.cpp

23 lines

test/

CodeGen/

BPF/

CORE/

simplifypatable-nullptr.ll

136 lines

Diff 423741

llvm/lib/Target/BPF/BPFMISimplifyPatchable.cpp

	Show All 29 Lines
	#include "BPF.h"			#include "BPF.h"
	#include "BPFCORE.h"			#include "BPFCORE.h"
	#include "BPFInstrInfo.h"			#include "BPFInstrInfo.h"
	#include "BPFTargetMachine.h"			#include "BPFTargetMachine.h"
	#include "llvm/CodeGen/MachineFunctionPass.h"			#include "llvm/CodeGen/MachineFunctionPass.h"
	#include "llvm/CodeGen/MachineInstrBuilder.h"			#include "llvm/CodeGen/MachineInstrBuilder.h"
	#include "llvm/CodeGen/MachineRegisterInfo.h"			#include "llvm/CodeGen/MachineRegisterInfo.h"
	#include "llvm/Support/Debug.h"			#include "llvm/Support/Debug.h"
				#include <set>

	using namespace llvm;			using namespace llvm;

	#define DEBUG_TYPE "bpf-mi-simplify-patchable"			#define DEBUG_TYPE "bpf-mi-simplify-patchable"

	namespace {			namespace {

	struct BPFMISimplifyPatchable : public MachineFunctionPass {			struct BPFMISimplifyPatchable : public MachineFunctionPass {

	static char ID;			static char ID;
	const BPFInstrInfo *TII;			const BPFInstrInfo *TII;
	MachineFunction *MF;			MachineFunction *MF;

	BPFMISimplifyPatchable() : MachineFunctionPass(ID) {			BPFMISimplifyPatchable() : MachineFunctionPass(ID) {
	initializeBPFMISimplifyPatchablePass(*PassRegistry::getPassRegistry());			initializeBPFMISimplifyPatchablePass(*PassRegistry::getPassRegistry());
	}			}

	private:			private:
				std::set<MachineInstr *> SkipInsts;

	// Initialize class variables.			// Initialize class variables.
	void initialize(MachineFunction &MFParm);			void initialize(MachineFunction &MFParm);

				bool isLoadInst(unsigned Opcode);
	bool removeLD();			bool removeLD();
	void processCandidate(MachineRegisterInfo *MRI, MachineBasicBlock &MBB,			void processCandidate(MachineRegisterInfo *MRI, MachineBasicBlock &MBB,
	MachineInstr &MI, Register &SrcReg, Register &DstReg,			MachineInstr &MI, Register &SrcReg, Register &DstReg,
	const GlobalValue *GVal, bool IsAma);			const GlobalValue *GVal, bool IsAma);
	void processDstReg(MachineRegisterInfo *MRI, Register &DstReg,			void processDstReg(MachineRegisterInfo *MRI, Register &DstReg,
	Register &SrcReg, const GlobalValue *GVal,			Register &SrcReg, const GlobalValue *GVal,
	bool doSrcRegProp, bool IsAma);			bool doSrcRegProp, bool IsAma);
	void processInst(MachineRegisterInfo *MRI, MachineInstr *Inst,			void processInst(MachineRegisterInfo *MRI, MachineInstr *Inst,
	Show All 17 Lines

	// Initialize class variables.			// Initialize class variables.
	void BPFMISimplifyPatchable::initialize(MachineFunction &MFParm) {			void BPFMISimplifyPatchable::initialize(MachineFunction &MFParm) {
	MF = &MFParm;			MF = &MFParm;
	TII = MF->getSubtarget<BPFSubtarget>().getInstrInfo();			TII = MF->getSubtarget<BPFSubtarget>().getInstrInfo();
	LLVM_DEBUG(dbgs() << "* BPF simplify patchable insts pass *\n\n");			LLVM_DEBUG(dbgs() << "* BPF simplify patchable insts pass *\n\n");
	}			}

				bool BPFMISimplifyPatchable::isLoadInst(unsigned Opcode) {
				return Opcode == BPF::LDD \|\| Opcode == BPF::LDW \|\| Opcode == BPF::LDH \|\|
				Opcode == BPF::LDB \|\| Opcode == BPF::LDW32 \|\| Opcode == BPF::LDH32 \|\|
				Opcode == BPF::LDB32;
				}

	void BPFMISimplifyPatchable::checkADDrr(MachineRegisterInfo *MRI,			void BPFMISimplifyPatchable::checkADDrr(MachineRegisterInfo *MRI,
	MachineOperand *RelocOp, const GlobalValue *GVal) {			MachineOperand *RelocOp, const GlobalValue *GVal) {
	const MachineInstr *Inst = RelocOp->getParent();			const MachineInstr *Inst = RelocOp->getParent();
	const MachineOperand *Op1 = &Inst->getOperand(1);			const MachineOperand *Op1 = &Inst->getOperand(1);
	const MachineOperand *Op2 = &Inst->getOperand(2);			const MachineOperand *Op2 = &Inst->getOperand(2);
	const MachineOperand *BaseOp = (RelocOp == Op1) ? Op2 : Op1;			const MachineOperand *BaseOp = (RelocOp == Op1) ? Op2 : Op1;

	// Go through all uses of %1 as in %1 = ADD_rr %2, %3			// Go through all uses of %1 as in %1 = ADD_rr %2, %3
	▲ Show 20 Lines • Show All 125 Lines • ▼ Show 20 Lines
	// %17 = SRA_rr %14, %16			// %17 = SRA_rr %14, %16
	// The `%17 = ...` will be transformed to			// The `%17 = ...` will be transformed to
	// %17 = CORE_SHIFT(SRA_ri, %14, @"llvm.t:5:63$0:2")			// %17 = CORE_SHIFT(SRA_ri, %14, @"llvm.t:5:63$0:2")
	// and later on, BTF emit phase will translate to			// and later on, BTF emit phase will translate to
	// %r4 = SRA_ri %r4, 63			// %r4 = SRA_ri %r4, 63
	void BPFMISimplifyPatchable::processInst(MachineRegisterInfo *MRI,			void BPFMISimplifyPatchable::processInst(MachineRegisterInfo *MRI,
	MachineInstr *Inst, MachineOperand *RelocOp, const GlobalValue *GVal) {			MachineInstr *Inst, MachineOperand *RelocOp, const GlobalValue *GVal) {
	unsigned Opcode = Inst->getOpcode();			unsigned Opcode = Inst->getOpcode();
				if (isLoadInst(Opcode)) {
				astUnsubmitted Not Done Reply Inline Actions why gate only loads here? The hunk below will apply to loads only anyway, so this check looks unnecessary. If both filter_loads checks (here and line 267) are necessary may be combine them into a helper function? ast: why gate only loads here? The hunk below will apply to loads only anyway, so this check looks…
				yonghong-songAuthorUnsubmitted Done Reply Inline Actions They are not redundant. We have `SkipInsts.insert(Inst);` here. But a helper function (here and line 267) is a good idea. I kind of realize it but a little bit lazy, but since you mentioned this. Will do it. yonghong-song: They are not redundant. We have `SkipInsts.insert(Inst);` here. But a helper function (here and…
				SkipInsts.insert(Inst);
				return;
				}

	if (Opcode == BPF::ADD_rr)			if (Opcode == BPF::ADD_rr)
	checkADDrr(MRI, RelocOp, GVal);			checkADDrr(MRI, RelocOp, GVal);
	else if (Opcode == BPF::SLL_rr)			else if (Opcode == BPF::SLL_rr)
	checkShift(MRI, *Inst->getParent(), RelocOp, GVal, BPF::SLL_ri);			checkShift(MRI, *Inst->getParent(), RelocOp, GVal, BPF::SLL_ri);
	else if (Opcode == BPF::SRA_rr)			else if (Opcode == BPF::SRA_rr)
	checkShift(MRI, *Inst->getParent(), RelocOp, GVal, BPF::SRA_ri);			checkShift(MRI, *Inst->getParent(), RelocOp, GVal, BPF::SRA_ri);
	else if (Opcode == BPF::SRL_rr)			else if (Opcode == BPF::SRL_rr)
	checkShift(MRI, *Inst->getParent(), RelocOp, GVal, BPF::SRL_ri);			checkShift(MRI, *Inst->getParent(), RelocOp, GVal, BPF::SRL_ri);
	}			}

	/// Remove unneeded Load instructions.			/// Remove unneeded Load instructions.
	bool BPFMISimplifyPatchable::removeLD() {			bool BPFMISimplifyPatchable::removeLD() {
	MachineRegisterInfo *MRI = &MF->getRegInfo();			MachineRegisterInfo *MRI = &MF->getRegInfo();
	MachineInstr *ToErase = nullptr;			MachineInstr *ToErase = nullptr;
	bool Changed = false;			bool Changed = false;

	for (MachineBasicBlock &MBB : *MF) {			for (MachineBasicBlock &MBB : *MF) {
	for (MachineInstr &MI : MBB) {			for (MachineInstr &MI : MBB) {
	if (ToErase) {			if (ToErase) {
	ToErase->eraseFromParent();			ToErase->eraseFromParent();
	ToErase = nullptr;			ToErase = nullptr;
	}			}

	// Ensure the register format is LOAD <reg>, <reg>, 0			// Ensure the register format is LOAD <reg>, <reg>, 0
	if (MI.getOpcode() != BPF::LDD && MI.getOpcode() != BPF::LDW &&			if (!isLoadInst(MI.getOpcode()))
	MI.getOpcode() != BPF::LDH && MI.getOpcode() != BPF::LDB &&			continue;
	MI.getOpcode() != BPF::LDW32 && MI.getOpcode() != BPF::LDH32 &&
	MI.getOpcode() != BPF::LDB32)			if (SkipInsts.find(&MI) != SkipInsts.end())
	continue;			continue;

	if (!MI.getOperand(0).isReg() \|\| !MI.getOperand(1).isReg())			if (!MI.getOperand(0).isReg() \|\| !MI.getOperand(1).isReg())
	continue;			continue;

	if (!MI.getOperand(2).isImm() \|\| MI.getOperand(2).getImm())			if (!MI.getOperand(2).isImm() \|\| MI.getOperand(2).getImm())
	continue;			continue;

	▲ Show 20 Lines • Show All 45 Lines • Show Last 20 Lines

llvm/test/CodeGen/BPF/CORE/simplifypatable-nullptr.ll

This file was added.

				; RUN: llc -O2 -march=bpf -mcpu=v3 < %s \| FileCheck %s
				; Source code:
				; struct t3 {
				; int i;
				; } __attribute__((preserve_access_index));
				; struct t2 {
				; void *pad;
				; struct t3 *f;
				; } __attribute__((preserve_access_index));
				; struct t1 {
				; void *pad;
				; struct t2 *q;
				; } __attribute__((preserve_access_index));
				;
				; int g;
				; int test(struct t1 *p) {
				; struct t2 *q = p->q;
				; if (q)
				; return 0;
				; struct t3 *f = q->f;
				; if (!f) g = 5;
				; return 0;
				; }
				; Compilation flag:
				; clang -target bpf -O2 -g -S -emit-llvm t.c

				@g = dso_local local_unnamed_addr global i32 0, align 4, !dbg !0
				@"llvm.t2:0:8$0:1" = external global i64, !llvm.preserve.access.index !6 #0
				@"llvm.t1:0:8$0:1" = external global i64, !llvm.preserve.access.index !15 #0

				; Function Attrs: mustprogress nofree nosync nounwind willreturn
				define dso_local i32 @test(ptr noundef readonly %p) local_unnamed_addr #1 !dbg !25 {
				entry:
				call void @llvm.dbg.value(metadata ptr %p, metadata !30, metadata !DIExpression()), !dbg !33
				%0 = load i64, ptr @"llvm.t1:0:8$0:1", align 8
				%1 = getelementptr i8, ptr %p, i64 %0
				%2 = tail call ptr @llvm.bpf.passthrough.p0.p0(i32 1, ptr %1)
				%3 = load ptr, ptr %2, align 8, !dbg !34, !tbaa !35
				call void @llvm.dbg.value(metadata ptr %3, metadata !31, metadata !DIExpression()), !dbg !33
				%tobool.not = icmp eq ptr %3, null, !dbg !40
				br i1 %tobool.not, label %if.end, label %cleanup, !dbg !42

				; CHECK-LABEL: test
				; CHECK: r1 = (u64 )(r1 + 8)
				; CHECK: if r1 != 0 goto

				if.end: ; preds = %entry
				%4 = load i64, ptr @"llvm.t2:0:8$0:1", align 8
				%5 = getelementptr i8, ptr null, i64 %4
				%6 = tail call ptr @llvm.bpf.passthrough.p0.p0(i32 0, ptr %5)
				%7 = load ptr, ptr %6, align 8, !dbg !43, !tbaa !44
				call void @llvm.dbg.value(metadata ptr %7, metadata !32, metadata !DIExpression()), !dbg !33
				%tobool1.not = icmp eq ptr %7, null, !dbg !46
				br i1 %tobool1.not, label %if.then2, label %cleanup, !dbg !48

				; CHECK: r1 = 8
				; CHECK: r1 = (u64 )(r1 + 0)
				; CHECK: if r1 != 0 goto

				if.then2: ; preds = %if.end
				store i32 5, ptr @g, align 4, !dbg !49, !tbaa !50
				br label %cleanup, !dbg !52

				cleanup: ; preds = %if.end, %if.then2, %entry
				ret i32 0, !dbg !53
				}

				; Function Attrs: nofree nosync nounwind readnone
				declare ptr @llvm.bpf.passthrough.p0.p0(i32, ptr) #2

				; Function Attrs: nocallback nofree nosync nounwind readnone speculatable willreturn
				declare void @llvm.dbg.value(metadata, metadata, metadata) #3

				attributes #0 = { "btf_ama" }
				attributes #1 = { mustprogress nofree nosync nounwind willreturn "frame-pointer"="all" "min-legal-vector-width"="0" "no-trapping-math"="true" "stack-protector-buffer-size"="8" }
				attributes #2 = { nofree nosync nounwind readnone }
				attributes #3 = { nocallback nofree nosync nounwind readnone speculatable willreturn }

				!llvm.dbg.cu = !{!2}
				!llvm.module.flags = !{!20, !21, !22, !23}
				!llvm.ident = !{!24}

				!0 = !DIGlobalVariableExpression(var: !1, expr: !DIExpression())
				!1 = distinct !DIGlobalVariable(name: "g", scope: !2, file: !3, line: 13, type: !5, isLocal: false, isDefinition: true)
				!2 = distinct !DICompileUnit(language: DW_LANG_C99, file: !3, producer: "clang version 15.0.0 (https://github.com/llvm/llvm-project.git ca2be81e34a6d87edb8e555dfac94ab68ee20f70)", isOptimized: true, runtimeVersion: 0, emissionKind: FullDebug, globals: !4, splitDebugInlining: false, nameTableKind: None)
				!3 = !DIFile(filename: "t.c", directory: "/tmp/home/yhs/work/tests/llvm/nullptr", checksumkind: CSK_MD5, checksum: "2c0ea9b3c647baf31f56992f9142b0df")
				!4 = !{!0}
				!5 = !DIBasicType(name: "int", size: 32, encoding: DW_ATE_signed)
				!6 = distinct !DICompositeType(tag: DW_TAG_structure_type, name: "t2", file: !3, line: 4, size: 128, elements: !7)
				!7 = !{!8, !10}
				!8 = !DIDerivedType(tag: DW_TAG_member, name: "pad", scope: !6, file: !3, line: 5, baseType: !9, size: 64)
				!9 = !DIDerivedType(tag: DW_TAG_pointer_type, baseType: null, size: 64)
				!10 = !DIDerivedType(tag: DW_TAG_member, name: "f", scope: !6, file: !3, line: 6, baseType: !11, size: 64, offset: 64)
				!11 = !DIDerivedType(tag: DW_TAG_pointer_type, baseType: !12, size: 64)
				!12 = distinct !DICompositeType(tag: DW_TAG_structure_type, name: "t3", file: !3, line: 1, size: 32, elements: !13)
				!13 = !{!14}
				!14 = !DIDerivedType(tag: DW_TAG_member, name: "i", scope: !12, file: !3, line: 2, baseType: !5, size: 32)
				!15 = distinct !DICompositeType(tag: DW_TAG_structure_type, name: "t1", file: !3, line: 8, size: 128, elements: !16)
				!16 = !{!17, !18}
				!17 = !DIDerivedType(tag: DW_TAG_member, name: "pad", scope: !15, file: !3, line: 9, baseType: !9, size: 64)
				!18 = !DIDerivedType(tag: DW_TAG_member, name: "q", scope: !15, file: !3, line: 10, baseType: !19, size: 64, offset: 64)
				!19 = !DIDerivedType(tag: DW_TAG_pointer_type, baseType: !6, size: 64)
				!20 = !{i32 7, !"Dwarf Version", i32 5}
				!21 = !{i32 2, !"Debug Info Version", i32 3}
				!22 = !{i32 1, !"wchar_size", i32 4}
				!23 = !{i32 7, !"frame-pointer", i32 2}
				!24 = !{!"clang version 15.0.0 (https://github.com/llvm/llvm-project.git ca2be81e34a6d87edb8e555dfac94ab68ee20f70)"}
				!25 = distinct !DISubprogram(name: "test", scope: !3, file: !3, line: 14, type: !26, scopeLine: 14, flags: DIFlagPrototyped \| DIFlagAllCallsDescribed, spFlags: DISPFlagDefinition \| DISPFlagOptimized, unit: !2, retainedNodes: !29)
				!26 = !DISubroutineType(types: !27)
				!27 = !{!5, !28}
				!28 = !DIDerivedType(tag: DW_TAG_pointer_type, baseType: !15, size: 64)
				!29 = !{!30, !31, !32}
				!30 = !DILocalVariable(name: "p", arg: 1, scope: !25, file: !3, line: 14, type: !28)
				!31 = !DILocalVariable(name: "q", scope: !25, file: !3, line: 15, type: !19)
				!32 = !DILocalVariable(name: "f", scope: !25, file: !3, line: 18, type: !11)
				!33 = !DILocation(line: 0, scope: !25)
				!34 = !DILocation(line: 15, column: 21, scope: !25)
				!35 = !{!36, !37, i64 8}
				!36 = !{!"t1", !37, i64 0, !37, i64 8}
				!37 = !{!"any pointer", !38, i64 0}
				!38 = !{!"omnipotent char", !39, i64 0}
				!39 = !{!"Simple C/C++ TBAA"}
				!40 = !DILocation(line: 16, column: 7, scope: !41)
				!41 = distinct !DILexicalBlock(scope: !25, file: !3, line: 16, column: 7)
				!42 = !DILocation(line: 16, column: 7, scope: !25)
				!43 = !DILocation(line: 18, column: 21, scope: !25)
				!44 = !{!45, !37, i64 8}
				!45 = !{!"t2", !37, i64 0, !37, i64 8}
				!46 = !DILocation(line: 19, column: 8, scope: !47)
				!47 = distinct !DILexicalBlock(scope: !25, file: !3, line: 19, column: 7)
				!48 = !DILocation(line: 19, column: 7, scope: !25)
				!49 = !DILocation(line: 19, column: 13, scope: !47)
				!50 = !{!51, !51, i64 0}
				!51 = !{!"int", !38, i64 0}
				!52 = !DILocation(line: 19, column: 11, scope: !47)
				!53 = !DILocation(line: 21, column: 1, scope: !25)