diff --git a/llvm/lib/CodeGen/SelectionDAG/DAGCombiner.cpp b/llvm/lib/CodeGen/SelectionDAG/DAGCombiner.cpp --- a/llvm/lib/CodeGen/SelectionDAG/DAGCombiner.cpp +++ b/llvm/lib/CodeGen/SelectionDAG/DAGCombiner.cpp @@ -6214,7 +6214,8 @@ // This can be a pure constant or a vector splat, in which case we treat the // vector as a scalar and use the splat value. APInt Constant = APInt::getZero(1); - if (const ConstantSDNode *C = isConstOrConstSplat(N1)) { + if (const ConstantSDNode *C = isConstOrConstSplat( + N1, /*AllowUndef=*/false, /*AllowTruncation=*/true)) { Constant = C->getAPIntValue(); } else if (BuildVectorSDNode *Vector = dyn_cast(N1)) { APInt SplatValue, SplatUndef; diff --git a/llvm/test/CodeGen/AArch64/sve-extload-icmp.ll b/llvm/test/CodeGen/AArch64/sve-extload-icmp.ll new file mode 100644 --- /dev/null +++ b/llvm/test/CodeGen/AArch64/sve-extload-icmp.ll @@ -0,0 +1,106 @@ +; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py +; RUN: llc < %s | FileCheck %s + +target triple = "aarch64-unknown-linux-gnu" + +define @extload_icmp_nxv8i8(ptr %in) #0 { +; CHECK-LABEL: extload_icmp_nxv8i8: +; CHECK: // %bb.0: +; CHECK-NEXT: ptrue p0.h +; CHECK-NEXT: ld1b { z0.h }, p0/z, [x0] +; CHECK-NEXT: cmpeq p0.h, p0/z, z0.h, #0 +; CHECK-NEXT: mov z0.h, p0/z, #1 // =0x1 +; CHECK-NEXT: ret + %ld = load , ptr %in + %cmp = icmp eq %ld, zeroinitializer + %ex = zext %cmp to + ret %ex +} + +define @extload_icmp_nxv16i8(ptr %in) #0 { +; CHECK-LABEL: extload_icmp_nxv16i8: +; CHECK: // %bb.0: +; CHECK-NEXT: ptrue p0.b +; CHECK-NEXT: ld1b { z0.b }, p0/z, [x0] +; CHECK-NEXT: cmpeq p0.b, p0/z, z0.b, #0 +; CHECK-NEXT: mov z0.b, p0/z, #1 // =0x1 +; CHECK-NEXT: ret + %ld = load , ptr %in + %cmp = icmp eq %ld, zeroinitializer + %ex = zext %cmp to + ret %ex +} + +define @extload_icmp_nxv4i16(ptr %in) #0 { +; CHECK-LABEL: extload_icmp_nxv4i16: +; CHECK: // %bb.0: +; CHECK-NEXT: ptrue p0.s +; CHECK-NEXT: ld1h { z0.s }, p0/z, [x0] +; CHECK-NEXT: cmpeq p0.s, p0/z, z0.s, #0 +; CHECK-NEXT: mov z0.s, p0/z, #1 // =0x1 +; CHECK-NEXT: ret + %ld = load , ptr %in + %cmp = icmp eq %ld, zeroinitializer + %ex = zext %cmp to + ret %ex +} + +define @extload_icmp_nxv8i16(ptr %in) #0 { +; CHECK-LABEL: extload_icmp_nxv8i16: +; CHECK: // %bb.0: +; CHECK-NEXT: ptrue p0.h +; CHECK-NEXT: ld1h { z0.h }, p0/z, [x0] +; CHECK-NEXT: cmpeq p0.h, p0/z, z0.h, #0 +; CHECK-NEXT: mov z0.h, p0/z, #1 // =0x1 +; CHECK-NEXT: ret + %ld = load , ptr %in + %cmp = icmp eq %ld, zeroinitializer + %ex = zext %cmp to + ret %ex +} + +define @extload_icmp_nxv2i32(ptr %in) #0 { +; CHECK-LABEL: extload_icmp_nxv2i32: +; CHECK: // %bb.0: +; CHECK-NEXT: ptrue p0.d +; CHECK-NEXT: ld1w { z0.d }, p0/z, [x0] +; CHECK-NEXT: cmpeq p0.d, p0/z, z0.d, #0 +; CHECK-NEXT: mov z0.d, p0/z, #1 // =0x1 +; CHECK-NEXT: ret + %ld = load , ptr %in + %cmp = icmp eq %ld, zeroinitializer + %ex = zext %cmp to + ret %ex +} + +define @extload_icmp_nxv4i32(ptr %in) #0 { +; CHECK-LABEL: extload_icmp_nxv4i32: +; CHECK: // %bb.0: +; CHECK-NEXT: ptrue p0.s +; CHECK-NEXT: ld1w { z0.s }, p0/z, [x0] +; CHECK-NEXT: cmpeq p0.s, p0/z, z0.s, #0 +; CHECK-NEXT: mov z0.s, p0/z, #1 // =0x1 +; CHECK-NEXT: ret + %ld = load , ptr %in + %cmp = icmp eq %ld, zeroinitializer + %ex = zext %cmp to + ret %ex +} + +define @extload_icmp_nxv2i64(ptr %in) #0 { +; CHECK-LABEL: extload_icmp_nxv2i64: +; CHECK: // %bb.0: +; CHECK-NEXT: ptrue p0.d +; CHECK-NEXT: ld1d { z0.d }, p0/z, [x0] +; CHECK-NEXT: cmpeq p0.d, p0/z, z0.d, #0 +; CHECK-NEXT: mov z0.d, p0/z, #1 // =0x1 +; CHECK-NEXT: ret + %ld = load , ptr %in + %cmp = icmp eq %ld, zeroinitializer + %ex = zext %cmp to + ret %ex +} + + + +attributes #0 = { "target-features"="+sve" }