diff --git a/llvm/include/llvm/IR/Attributes.td b/llvm/include/llvm/IR/Attributes.td --- a/llvm/include/llvm/IR/Attributes.td +++ b/llvm/include/llvm/IR/Attributes.td @@ -294,3 +294,4 @@ def : MergeRule<"adjustCallerStackProbeSize">; def : MergeRule<"adjustMinLegalVectorWidth">; def : MergeRule<"adjustNullPointerValidAttr">; +def : MergeRule<"setAND">; diff --git a/llvm/test/Transforms/Inline/inlined-mustprogress-loop-metadata.ll b/llvm/test/Transforms/Inline/inlined-mustprogress-loop-metadata.ll new file mode 100644 --- /dev/null +++ b/llvm/test/Transforms/Inline/inlined-mustprogress-loop-metadata.ll @@ -0,0 +1,528 @@ +; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --function-signature --check-attributes --force-update +; RUN: opt < %s -S -passes="inline" | FileCheck %s + +define void @callee(i32 %a, i32 %b) #0 { +entry: + br label %for.cond +for.cond: + %cmp = icmp slt i32 %a, %b + br i1 %cmp, label %for.body, label %for.end +for.body: + br label %for.cond, !llvm.loop !0 +for.end: + br label %while.body +while.body: + br label %while.body +} + +define void @caller(i32 %a, i32 %b) #1 { +; CHECK: Function Attrs: noinline +; CHECK-LABEL: define {{[^@]+}}@caller +; CHECK-SAME: (i32 [[A:%.*]], i32 [[B:%.*]]) [[ATTR1:#.*]] { +; CHECK-NEXT: entry: +; CHECK-NEXT: br label [[FOR_COND:%.*]] +; CHECK: for.cond: +; CHECK-NEXT: [[CMP:%.*]] = icmp slt i32 [[A]], [[B]] +; CHECK-NEXT: br i1 [[CMP]], label [[FOR_BODY:%.*]], label [[FOR_END:%.*]] +; CHECK: for.body: +; CHECK-NEXT: br label [[FOR_COND]] +; CHECK: for.end: +; CHECK-NEXT: br label [[FOR_COND_I:%.*]] +; CHECK: for.cond.i: + ; CHECK-NEXT: br label [[FOR_COND_I]], !llvm.loop [[LOOP0:![0-9]+]] +; CHECK: callee.exit: +; CHECK-NEXT: ret void +; +entry: + br label %for.cond +for.cond: + %cmp = icmp slt i32 %a, %b + br i1 %cmp, label %for.body, label %for.end +for.body: + br label %for.cond +for.end: + call void @callee(i32 0, i32 5) + ret void +} + +define void @callee_no_metadata(i32 %a, i32 %b) { +entry: + br label %for.cond +for.cond: + %cmp = icmp slt i32 %a, %b + br i1 %cmp, label %for.body, label %for.end +for.body: + br label %for.cond +for.end: + br label %while.body +while.body: + br label %while.body +} + +define void @caller_no_metadata(i32 %a, i32 %b) { +; CHECK-LABEL: define {{[^@]+}}@caller_no_metadata +; CHECK-SAME: (i32 [[A:%.*]], i32 [[B:%.*]]) { +; CHECK-NEXT: entry: +; CHECK-NEXT: br label [[FOR_COND:%.*]] +; CHECK: for.cond: +; CHECK-NEXT: [[CMP:%.*]] = icmp slt i32 [[A]], [[B]] +; CHECK-NEXT: br i1 [[CMP]], label [[FOR_BODY:%.*]], label [[FOR_END:%.*]] +; CHECK: for.body: +; CHECK-NEXT: br label [[FOR_COND]] +; CHECK: for.end: +; CHECK-NEXT: br label [[FOR_COND_I:%.*]] +; CHECK: for.cond.i: +; CHECK-NEXT: br label [[FOR_COND_I]] +; CHECK: callee_no_metadata.exit: +; CHECK-NEXT: ret void +; +entry: + br label %for.cond +for.cond: + %cmp = icmp slt i32 %a, %b + br i1 %cmp, label %for.body, label %for.end +for.body: + br label %for.cond +for.end: + call void @callee_no_metadata(i32 0, i32 5) + ret void +} + +define void @callee_mustprogress(i32 %a, i32 %b) #0 { +entry: + br label %for.cond +for.cond: + %cmp = icmp slt i32 %a, %b + br i1 %cmp, label %for.body, label %for.end +for.body: + br label %for.cond +for.end: + br label %while.body +while.body: + br label %while.body +} + +define void @caller_mustprogress(i32 %a, i32 %b) #0 { +; CHECK: Function Attrs: mustprogress +; CHECK-LABEL: define {{[^@]+}}@caller_mustprogress +; CHECK-SAME: (i32 [[A:%.*]], i32 [[B:%.*]]) [[ATTR0:#[0-9]+]] { +; CHECK-NEXT: entry: +; CHECK-NEXT: br label [[FOR_COND:%.*]] +; CHECK: for.cond: +; CHECK-NEXT: [[CMP:%.*]] = icmp slt i32 [[A]], [[B]] +; CHECK-NEXT: br i1 [[CMP]], label [[FOR_BODY:%.*]], label [[FOR_END:%.*]] +; CHECK: for.body: +; CHECK-NEXT: br label [[FOR_COND]] +; CHECK: for.end: +; CHECK-NEXT: br label [[FOR_COND_I:%.*]] +; CHECK: for.cond.i: +; CHECK-NEXT: br label [[FOR_COND_I]] +; CHECK: callee_mustprogress.exit: +; CHECK-NEXT: ret void +; +entry: + br label %for.cond +for.cond: + %cmp = icmp slt i32 %a, %b + br i1 %cmp, label %for.body, label %for.end +for.body: + br label %for.cond +for.end: + call void @callee_mustprogress(i32 0, i32 5) + ret void +} + +define void @caller_mustprogress_callee_no_metadata(i32 %a, i32 %b) #0 { +; CHECK-LABEL: define {{[^@]+}}@caller_mustprogress_callee_no_metadata +; CHECK-SAME: (i32 [[A:%.*]], i32 [[B:%.*]]) { +; CHECK-NEXT: entry: +; CHECK-NEXT: br label [[FOR_COND:%.*]] +; CHECK: for.cond: +; CHECK-NEXT: [[CMP:%.*]] = icmp slt i32 [[A]], [[B]] +; CHECK-NEXT: br i1 [[CMP]], label [[FOR_BODY:%.*]], label [[FOR_END:%.*]] +; CHECK: for.body: +; CHECK-NEXT: br label [[FOR_COND]] +; CHECK: for.end: +; CHECK-NEXT: br label [[FOR_COND_I:%.*]] +; CHECK: for.cond.i: +; CHECK-NEXT: br label [[FOR_COND_I]] +; CHECK: callee_no_metadata.exit: +; CHECK-NEXT: ret void +; +entry: + br label %for.cond +for.cond: + %cmp = icmp slt i32 %a, %b + br i1 %cmp, label %for.body, label %for.end +for.body: + br label %for.cond +for.end: + call void @callee_no_metadata(i32 0, i32 5) + ret void +} + +define void @callee_multiple(i32 %a, i32 %b) #0 { +entry: + %a.addr = alloca i32, align 4 + %b.addr = alloca i32, align 4 + %i = alloca i32, align 4 + store i32 %a, i32* %a.addr, align 4 + store i32 %b, i32* %b.addr, align 4 + br label %for.cond +for.cond: + %0 = load i32, i32* %a.addr, align 4 + %1 = load i32, i32* %b.addr, align 4 + %cmp = icmp slt i32 %0, %1 + br i1 %cmp, label %for.body, label %for.end +for.body: + br label %for.cond, !llvm.loop !2 +for.end: + store i32 0, i32* %i, align 4 + br label %for.cond1 +for.cond1: + %2 = load i32, i32* %i, align 4 + %cmp2 = icmp slt i32 %2, 10 + br i1 %cmp2, label %for.body3, label %for.end4 +for.body3: + br label %for.inc +for.inc: + %3 = load i32, i32* %i, align 4 + %inc = add nsw i32 %3, 1 + store i32 %inc, i32* %i, align 4 + br label %for.cond1, !llvm.loop !4 +for.end4: + br label %while.body +while.body: + br label %while.body +} + +define void @caller_multiple(i32 %a, i32 %b) #1 { +; CHECK: Function Attrs: noinline +; CHECK-LABEL: define {{[^@]+}}@caller_multiple +; CHECK-SAME: (i32 [[A:%.*]], i32 [[B:%.*]]) [[ATTR1]] { +; CHECK-NEXT: entry: +; CHECK-NEXT: [[A_ADDR_I:%.*]] = alloca i32, align 4 +; CHECK-NEXT: [[B_ADDR_I:%.*]] = alloca i32, align 4 +; CHECK-NEXT: [[I_I:%.*]] = alloca i32, align 4 +; CHECK-NEXT: [[A_ADDR:%.*]] = alloca i32, align 4 +; CHECK-NEXT: [[B_ADDR:%.*]] = alloca i32, align 4 +; CHECK-NEXT: [[I:%.*]] = alloca i32, align 4 +; CHECK-NEXT: store i32 [[A]], i32* [[A_ADDR]], align 4 +; CHECK-NEXT: store i32 [[B]], i32* [[B_ADDR]], align 4 +; CHECK-NEXT: br label [[FOR_COND:%.*]] +; CHECK: for.cond: +; CHECK-NEXT: [[TMP0:%.*]] = load i32, i32* [[A_ADDR]], align 4 +; CHECK-NEXT: [[TMP1:%.*]] = load i32, i32* [[B_ADDR]], align 4 +; CHECK-NEXT: [[CMP:%.*]] = icmp slt i32 [[TMP0]], [[TMP1]] +; CHECK-NEXT: br i1 [[CMP]], label [[FOR_BODY:%.*]], label [[FOR_END:%.*]] +; CHECK: for.body: +; CHECK-NEXT: br label [[FOR_COND]] +; CHECK: for.end: +; CHECK-NEXT: store i32 0, i32* [[I]], align 4 +; CHECK-NEXT: br label [[FOR_COND1:%.*]] +; CHECK: for.cond1: +; CHECK-NEXT: [[TMP2:%.*]] = load i32, i32* [[I]], align 4 +; CHECK-NEXT: [[CMP2:%.*]] = icmp slt i32 [[TMP2]], 10 +; CHECK-NEXT: br i1 [[CMP2]], label [[FOR_BODY3:%.*]], label [[FOR_END4:%.*]] +; CHECK: for.body3: +; CHECK-NEXT: br label [[FOR_INC:%.*]] +; CHECK: for.inc: +; CHECK-NEXT: [[TMP3:%.*]] = load i32, i32* [[I]], align 4 +; CHECK-NEXT: [[INC:%.*]] = add nsw i32 [[TMP3]], 1 +; CHECK-NEXT: store i32 [[INC]], i32* [[I]], align 4 +; CHECK-NEXT: br label [[FOR_COND1]] +; CHECK: for.end4: +; CHECK-NEXT: [[TMP4:%.*]] = bitcast i32* [[A_ADDR_I]] to i8* +; CHECK-NEXT: call void @llvm.lifetime.start.p0i8(i64 4, i8* [[TMP4]]) +; CHECK-NEXT: [[TMP5:%.*]] = bitcast i32* [[B_ADDR_I]] to i8* +; CHECK-NEXT: call void @llvm.lifetime.start.p0i8(i64 4, i8* [[TMP5]]) +; CHECK-NEXT: [[TMP6:%.*]] = bitcast i32* [[I_I]] to i8* +; CHECK-NEXT: call void @llvm.lifetime.start.p0i8(i64 4, i8* [[TMP6]]) +; CHECK-NEXT: store i32 0, i32* [[A_ADDR_I]], align 4 +; CHECK-NEXT: store i32 5, i32* [[B_ADDR_I]], align 4 +; CHECK-NEXT: br label [[FOR_COND_I:%.*]] +; CHECK: for.cond.i: +; CHECK-NEXT: [[TMP7:%.*]] = load i32, i32* [[A_ADDR_I]], align 4 +; CHECK-NEXT: [[TMP8:%.*]] = load i32, i32* [[B_ADDR_I]], align 4 +; CHECK-NEXT: [[CMP_I:%.*]] = icmp slt i32 [[TMP7]], [[TMP8]] +; CHECK-NEXT: br i1 [[CMP_I]], label [[FOR_BODY_I:%.*]], label [[FOR_END_I:%.*]] +; CHECK: for.body.i: + ; CHECK-NEXT: br label [[FOR_COND_I]], !llvm.loop [[LOOP2:![0-9]+]] +; CHECK: for.end.i: +; CHECK-NEXT: store i32 0, i32* [[I_I]], align 4 +; CHECK-NEXT: br label [[FOR_COND1_I:%.*]] +; CHECK: for.cond1.i: +; CHECK-NEXT: [[TMP9:%.*]] = load i32, i32* [[I_I]], align 4 +; CHECK-NEXT: [[CMP2_I:%.*]] = icmp slt i32 [[TMP9]], 10 +; CHECK-NEXT: br i1 [[CMP2_I]], label [[FOR_BODY3_I:%.*]], label [[FOR_END4_I:%.*]] +; CHECK: for.body3.i: +; CHECK-NEXT: [[TMP10:%.*]] = load i32, i32* [[I_I]], align 4 +; CHECK-NEXT: [[INC_I:%.*]] = add nsw i32 [[TMP10]], 1 +; CHECK-NEXT: store i32 [[INC_I]], i32* [[I_I]], align 4 +; CHECK-NEXT: br label [[FOR_COND1_I]], !llvm.loop [[LOOP3:![0-9]+]] +; CHECK: for.end4.i: +; CHECK-NEXT: br label [[WHILE_BODY_I:%.*]] +; CHECK: while.body.i: +; CHECK-NEXT: br label [[WHILE_BODY_I]] +; CHECK: callee_multiple.exit: +; CHECK-NEXT: ret void +; +entry: + %a.addr = alloca i32, align 4 + %b.addr = alloca i32, align 4 + %i = alloca i32, align 4 + store i32 %a, i32* %a.addr, align 4 + store i32 %b, i32* %b.addr, align 4 + br label %for.cond +for.cond: + %0 = load i32, i32* %a.addr, align 4 + %1 = load i32, i32* %b.addr, align 4 + %cmp = icmp slt i32 %0, %1 + br i1 %cmp, label %for.body, label %for.end +for.body: + br label %for.cond +for.end: + store i32 0, i32* %i, align 4 + br label %for.cond1 +for.cond1: + %2 = load i32, i32* %i, align 4 + %cmp2 = icmp slt i32 %2, 10 + br i1 %cmp2, label %for.body3, label %for.end4 +for.body3: + br label %for.inc +for.inc: + %3 = load i32, i32* %i, align 4 + %inc = add nsw i32 %3, 1 + store i32 %inc, i32* %i, align 4 + br label %for.cond1 +for.end4: + call void @callee_multiple(i32 0, i32 5) + ret void +} + +define void @callee_nested(i32 %a, i32 %b) #0 { +entry: + %a.addr = alloca i32, align 4 + %b.addr = alloca i32, align 4 + %i = alloca i32, align 4 + store i32 %a, i32* %a.addr, align 4 + store i32 %b, i32* %b.addr, align 4 + br label %for.cond +for.cond: + %0 = load i32, i32* %a.addr, align 4 + %1 = load i32, i32* %b.addr, align 4 + %cmp = icmp slt i32 %0, %1 + br i1 %cmp, label %for.body, label %for.end +for.body: + br label %for.cond, !llvm.loop !0 +for.end: + store i32 0, i32* %i, align 4 + br label %for.cond1 +for.cond1: + %2 = load i32, i32* %i, align 4 + %cmp2 = icmp slt i32 %2, 10 + br i1 %cmp2, label %for.body3, label %for.end8 +for.body3: + br label %for.cond4 +for.cond4: + %3 = load i32, i32* %b.addr, align 4 + %4 = load i32, i32* %a.addr, align 4 + %cmp5 = icmp slt i32 %3, %4 + br i1 %cmp5, label %for.body6, label %for.end7 +for.body6: + br label %for.cond4, !llvm.loop !2 +for.end7: + br label %for.inc +for.inc: + %5 = load i32, i32* %i, align 4 + %inc = add nsw i32 %5, 1 + store i32 %inc, i32* %i, align 4 + br label %for.cond1, !llvm.loop !3 +for.end8: + br label %while.body +while.body: + br label %while.body +} + +define void @caller_nested(i32 %a, i32 %b) #1 { +; CHECK: Function Attrs: noinline +; CHECK-LABEL: define {{[^@]+}}@caller_nested +; CHECK-SAME: (i32 [[A:%.*]], i32 [[B:%.*]]) [[ATTR1]] { +; CHECK-NEXT: entry: +; CHECK-NEXT: [[A_ADDR_I:%.*]] = alloca i32, align 4 +; CHECK-NEXT: [[B_ADDR_I:%.*]] = alloca i32, align 4 +; CHECK-NEXT: [[I_I:%.*]] = alloca i32, align 4 +; CHECK-NEXT: [[A_ADDR:%.*]] = alloca i32, align 4 +; CHECK-NEXT: [[B_ADDR:%.*]] = alloca i32, align 4 +; CHECK-NEXT: [[I:%.*]] = alloca i32, align 4 +; CHECK-NEXT: [[I9:%.*]] = alloca i32, align 4 +; CHECK-NEXT: store i32 [[A]], i32* [[A_ADDR]], align 4 +; CHECK-NEXT: store i32 [[B]], i32* [[B_ADDR]], align 4 +; CHECK-NEXT: br label [[FOR_COND:%.*]] +; CHECK: for.cond: +; CHECK-NEXT: [[TMP0:%.*]] = load i32, i32* [[A_ADDR]], align 4 +; CHECK-NEXT: [[TMP1:%.*]] = load i32, i32* [[B_ADDR]], align 4 +; CHECK-NEXT: [[CMP:%.*]] = icmp slt i32 [[TMP0]], [[TMP1]] +; CHECK-NEXT: br i1 [[CMP]], label [[FOR_BODY:%.*]], label [[FOR_END8:%.*]] +; CHECK: for.body: +; CHECK-NEXT: store i32 0, i32* [[I]], align 4 +; CHECK-NEXT: br label [[FOR_COND1:%.*]] +; CHECK: for.cond1: +; CHECK-NEXT: [[TMP2:%.*]] = load i32, i32* [[I]], align 4 +; CHECK-NEXT: [[CMP2:%.*]] = icmp slt i32 [[TMP2]], 10 +; CHECK-NEXT: br i1 [[CMP2]], label [[FOR_BODY3:%.*]], label [[FOR_END7:%.*]] +; CHECK: for.body3: +; CHECK-NEXT: br label [[FOR_COND4:%.*]] +; CHECK: for.cond4: +; CHECK-NEXT: [[TMP3:%.*]] = load i32, i32* [[B_ADDR]], align 4 +; CHECK-NEXT: [[TMP4:%.*]] = load i32, i32* [[A_ADDR]], align 4 +; CHECK-NEXT: [[CMP5:%.*]] = icmp slt i32 [[TMP3]], [[TMP4]] +; CHECK-NEXT: br i1 [[CMP5]], label [[FOR_BODY6:%.*]], label [[FOR_END:%.*]] +; CHECK: for.body6: +; CHECK-NEXT: br label [[FOR_COND4]] +; CHECK: for.end: +; CHECK-NEXT: br label [[FOR_INC:%.*]] +; CHECK: for.inc: +; CHECK-NEXT: [[TMP5:%.*]] = load i32, i32* [[I]], align 4 +; CHECK-NEXT: [[INC:%.*]] = add nsw i32 [[TMP5]], 1 +; CHECK-NEXT: store i32 [[INC]], i32* [[I]], align 4 +; CHECK-NEXT: br label [[FOR_COND1]] +; CHECK: for.end7: +; CHECK-NEXT: br label [[FOR_COND]] +; CHECK: for.end8: +; CHECK-NEXT: store i32 0, i32* [[I9]], align 4 +; CHECK-NEXT: br label [[FOR_COND10:%.*]] +; CHECK: for.cond10: +; CHECK-NEXT: [[TMP6:%.*]] = load i32, i32* [[I9]], align 4 +; CHECK-NEXT: [[CMP11:%.*]] = icmp slt i32 [[TMP6]], 10 +; CHECK-NEXT: br i1 [[CMP11]], label [[FOR_BODY12:%.*]], label [[FOR_END15:%.*]] +; CHECK: for.body12: +; CHECK-NEXT: br label [[FOR_INC13:%.*]] +; CHECK: for.inc13: +; CHECK-NEXT: [[TMP7:%.*]] = load i32, i32* [[I9]], align 4 +; CHECK-NEXT: [[INC14:%.*]] = add nsw i32 [[TMP7]], 1 +; CHECK-NEXT: store i32 [[INC14]], i32* [[I9]], align 4 +; CHECK-NEXT: br label [[FOR_COND10]] +; CHECK: for.end15: +; CHECK-NEXT: [[TMP8:%.*]] = bitcast i32* [[A_ADDR_I]] to i8* +; CHECK-NEXT: call void @llvm.lifetime.start.p0i8(i64 4, i8* [[TMP8]]) +; CHECK-NEXT: [[TMP9:%.*]] = bitcast i32* [[B_ADDR_I]] to i8* +; CHECK-NEXT: call void @llvm.lifetime.start.p0i8(i64 4, i8* [[TMP9]]) +; CHECK-NEXT: [[TMP10:%.*]] = bitcast i32* [[I_I]] to i8* +; CHECK-NEXT: call void @llvm.lifetime.start.p0i8(i64 4, i8* [[TMP10]]) +; CHECK-NEXT: store i32 0, i32* [[A_ADDR_I]], align 4 +; CHECK-NEXT: store i32 5, i32* [[B_ADDR_I]], align 4 +; CHECK-NEXT: br label [[FOR_COND_I:%.*]] +; CHECK: for.cond.i: +; CHECK-NEXT: [[TMP11:%.*]] = load i32, i32* [[A_ADDR_I]], align 4 +; CHECK-NEXT: [[TMP12:%.*]] = load i32, i32* [[B_ADDR_I]], align 4 +; CHECK-NEXT: [[CMP_I:%.*]] = icmp slt i32 [[TMP11]], [[TMP12]] +; CHECK-NEXT: br i1 [[CMP_I]], label [[FOR_BODY_I:%.*]], label [[FOR_END_I:%.*]] +; CHECK: for.body.i: +; CHECK-NEXT: br label [[FOR_COND_I]], !llvm.loop [[LOOP0]] +; CHECK: for.end.i: +; CHECK-NEXT: store i32 0, i32* [[I_I]], align 4 +; CHECK-NEXT: br label [[FOR_COND1_I:%.*]] +; CHECK: for.cond1.i: +; CHECK-NEXT: [[TMP13:%.*]] = load i32, i32* [[I_I]], align 4 +; CHECK-NEXT: [[CMP2_I:%.*]] = icmp slt i32 [[TMP13]], 10 +; CHECK-NEXT: br i1 [[CMP2_I]], label [[FOR_BODY3_I:%.*]], label [[FOR_END8_I:%.*]] +; CHECK: for.body3.i: +; CHECK-NEXT: br label [[FOR_COND4_I:%.*]] +; CHECK: for.cond4.i: +; CHECK-NEXT: [[TMP14:%.*]] = load i32, i32* [[B_ADDR_I]], align 4 +; CHECK-NEXT: [[TMP15:%.*]] = load i32, i32* [[A_ADDR_I]], align 4 +; CHECK-NEXT: [[CMP5_I:%.*]] = icmp slt i32 [[TMP14]], [[TMP15]] +; CHECK-NEXT: br i1 [[CMP5_I]], label [[FOR_BODY6_I:%.*]], label [[FOR_END7_I:%.*]] +; CHECK: for.body6.i: + ; CHECK-NEXT: br label [[FOR_COND4_I]], !llvm.loop [[LOOP2:![0-9]+]] +; CHECK: for.end7.i: +; CHECK-NEXT: [[TMP16:%.*]] = load i32, i32* [[I_I]], align 4 +; CHECK-NEXT: [[INC_I:%.*]] = add nsw i32 [[TMP16]], 1 +; CHECK-NEXT: store i32 [[INC_I]], i32* [[I_I]], align 4 +; CHECK-NEXT: br label [[FOR_COND1_I]], !llvm.loop [[LOOP4:![0-9]+]] +; CHECK: for.end8.i: +; CHECK-NEXT: br label [[WHILE_BODY_I:%.*]] +; CHECK: while.body.i: +; CHECK-NEXT: br label [[WHILE_BODY_I]] +; CHECK: callee_nested.exit: +; CHECK-NEXT: ret void +; +entry: + %a.addr = alloca i32, align 4 + %b.addr = alloca i32, align 4 + %i = alloca i32, align 4 + %i9 = alloca i32, align 4 + store i32 %a, i32* %a.addr, align 4 + store i32 %b, i32* %b.addr, align 4 + br label %for.cond +for.cond: + %0 = load i32, i32* %a.addr, align 4 + %1 = load i32, i32* %b.addr, align 4 + %cmp = icmp slt i32 %0, %1 + br i1 %cmp, label %for.body, label %for.end8 +for.body: + store i32 0, i32* %i, align 4 + br label %for.cond1 +for.cond1: + %2 = load i32, i32* %i, align 4 + %cmp2 = icmp slt i32 %2, 10 + br i1 %cmp2, label %for.body3, label %for.end7 +for.body3: + br label %for.cond4 +for.cond4: + %3 = load i32, i32* %b.addr, align 4 + %4 = load i32, i32* %a.addr, align 4 + %cmp5 = icmp slt i32 %3, %4 + br i1 %cmp5, label %for.body6, label %for.end +for.body6: + br label %for.cond4 +for.end: + br label %for.inc +for.inc: + %5 = load i32, i32* %i, align 4 + %inc = add nsw i32 %5, 1 + store i32 %inc, i32* %i, align 4 + br label %for.cond1 +for.end7: + br label %for.cond +for.end8: + store i32 0, i32* %i9, align 4 + br label %for.cond10 +for.cond10: + %6 = load i32, i32* %i9, align 4 + %cmp11 = icmp slt i32 %6, 10 + br i1 %cmp11, label %for.body12, label %for.end15 +for.body12: + br label %for.inc13 +for.inc13: + %7 = load i32, i32* %i9, align 4 + %inc14 = add nsw i32 %7, 1 + store i32 %inc14, i32* %i9, align 4 + br label %for.cond10 +for.end15: + call void @callee_nested(i32 0, i32 5) + ret void +} + +; CHECK: attributes [[ATTR0]] = { mustprogress } +; CHECK: attributes [[ATTR1]] = { noinline } + +; CHECK: [[LOOP0]] = distinct !{[[LOOP0]], [[GEN1:!.*]]} +; CHECK: [[GEN1]] = !{!"llvm.loop.mustprogress"} +; CHECK: [[LOOP2]] = distinct !{[[LOOP2]], [[GEN1:!.*]]} +; CHECK: [[LOOP3]] = distinct !{[[LOOP3]], [[GEN1:!.*]]} +; CHECK: [[LOOP4]] = distinct !{[[LOOP4]], [[GEN1:!.*]]} + +attributes #0 = { mustprogress } +attributes #1 = { noinline } +attributes #2 = { noinline mustprogress } + +!0 = distinct !{!0, !1} +!1 = !{!"llvm.loop.mustprogress"} +!2 = distinct !{!2, !1} +!3 = distinct !{!3, !1} +!4 = distinct !{!4, !1} +!5 = distinct !{!5, !1} +!6 = distinct !{!6, !1} +!7 = distinct !{!7, !1}