diff --git a/llvm/lib/Target/X86/X86ISelLowering.cpp b/llvm/lib/Target/X86/X86ISelLowering.cpp --- a/llvm/lib/Target/X86/X86ISelLowering.cpp +++ b/llvm/lib/Target/X86/X86ISelLowering.cpp @@ -28757,8 +28757,7 @@ N->getMemOperand(), N->getAddressingMode(), N->getExtensionType(), N->isExpandingLoad()); // Emit a blend. - SDValue Select = DAG.getNode(ISD::VSELECT, dl, MaskVT, Mask, NewLoad, - PassThru); + SDValue Select = DAG.getNode(ISD::VSELECT, dl, VT, Mask, NewLoad, PassThru); return DAG.getMergeValues({ Select, NewLoad.getValue(1) }, dl); } @@ -28794,10 +28793,10 @@ PassThru, N->getMemoryVT(), N->getMemOperand(), N->getAddressingMode(), N->getExtensionType(), N->isExpandingLoad()); - SDValue Exract = DAG.getNode(ISD::EXTRACT_SUBVECTOR, dl, VT, - NewLoad.getValue(0), - DAG.getIntPtrConstant(0, dl)); - SDValue RetOps[] = {Exract, NewLoad.getValue(1)}; + SDValue Extract = + DAG.getNode(ISD::EXTRACT_SUBVECTOR, dl, VT, NewLoad.getValue(0), + DAG.getIntPtrConstant(0, dl)); + SDValue RetOps[] = {Extract, NewLoad.getValue(1)}; return DAG.getMergeValues(RetOps, dl); } diff --git a/llvm/test/CodeGen/X86/avx-bug-45563.ll b/llvm/test/CodeGen/X86/avx-bug-45563.ll new file mode 100644 --- /dev/null +++ b/llvm/test/CodeGen/X86/avx-bug-45563.ll @@ -0,0 +1,21 @@ +; RUN: llc < %s -debug-only=isel -O3 -mattr=avx 2>&1 | FileCheck %s + +; Bug 45563: +; The LowerMLOAD() method AVX masked load branch should +; use the operand vector type rather than the mask type. +; Given, for example: +; v4f64,ch = masked_load .. +; The select should be: +; v4f64 = vselect .. +; instead of: +; v4i64 = vselect .. + +define <16 x double> @bug45563(<16 x double>* %addr, <16 x double> %dst, <16 x i64> %e, <16 x i64> %f) { +; CHECK-LABEL: bug45563: +; CHECK: v4f64 = vselect + %mask = icmp slt <16 x i64> %e, %f + %res = call <16 x double> @llvm.masked.load.v16f64.p0v16f64(<16 x double>* %addr, i32 4, <16 x i1>%mask, <16 x double> %dst) + ret <16 x double> %res +} + +declare <16 x double> @llvm.masked.load.v16f64.p0v16f64(<16 x double>* %addr, i32 %align, <16 x i1> %mask, <16 x double> %dst)