diff --git a/llvm/lib/Target/VE/VEISelLowering.cpp b/llvm/lib/Target/VE/VEISelLowering.cpp --- a/llvm/lib/Target/VE/VEISelLowering.cpp +++ b/llvm/lib/Target/VE/VEISelLowering.cpp @@ -1428,11 +1428,10 @@ SDValue VETargetLowering::lowerLOAD(SDValue Op, SelectionDAG &DAG) const { LoadSDNode *LdNode = cast(Op.getNode()); - EVT MemVT = LdNode->getMemoryVT(); - // Dispatch to vector isel. - if (MemVT.isVector() && !isMaskType(MemVT)) + // If VPU is enabled, always expand non-mask vector loads to VVP + if (Subtarget->enableVPU() && MemVT.isVector() && !isMaskType(MemVT)) return lowerToVVP(Op, DAG); SDValue BasePtr = LdNode->getBasePtr(); @@ -1542,11 +1541,11 @@ SDValue VETargetLowering::lowerSTORE(SDValue Op, SelectionDAG &DAG) const { StoreSDNode *StNode = cast(Op.getNode()); assert(StNode && StNode->getOffset().isUndef() && "Unexpected node type"); - - // always expand non-mask vector loads to VVP EVT MemVT = StNode->getMemoryVT(); - if (MemVT.isVector() && !isMaskType(MemVT)) - return lowerToVVP(Op, DAG); + + // If VPU is enabled, always expand non-mask vector stores to VVP + if (Subtarget->enableVPU() && MemVT.isVector() && !isMaskType(MemVT)) + return lowerToVVP(Op, DAG); SDValue BasePtr = StNode->getBasePtr(); if (isa(BasePtr.getNode())) { diff --git a/llvm/test/CodeGen/VE/Vector/ticket-64420.ll b/llvm/test/CodeGen/VE/Vector/ticket-64420.ll new file mode 100644 --- /dev/null +++ b/llvm/test/CodeGen/VE/Vector/ticket-64420.ll @@ -0,0 +1,32 @@ +; RUN: llc < %s -mtriple=ve -mattr=-vpu | FileCheck --check-prefix=SCALAR %s + +; Check vector and scalar code generation for vector load instruction. +; For the case of scalar, generates 2 stores of 8 bytes length. + +; This is taken from a ticket below. +; https://github.com/llvm/llvm-project/issues/64420 + +; SCALAR-LABEL: func: +; SCALAR: # %bb.1: +; SCALAR-NEXT: st %s1, 8(, %s0) +; SCALAR-NEXT: st %s1, (, %s0) +; SCALAR-NEXT: b.l.t (, %s10) + +; ModuleID = 'bugpoint-reduced-simplified.bc' +source_filename = "test.c" +target datalayout = "e-m:e-i64:64-n32:64-S128-v64:64:64-v128:64:64-v256:64:64-v512:64:64-v1024:64:64-v2048:64:64-v4096:64:64-v8192:64:64-v16384:64:64" +target triple = "ve-unknown-linux-gnu" + +define dso_local void @func(ptr %_0) unnamed_addr #0 { +start: + br i1 poison, label %bb7, label %panic3 + +bb7: ; preds = %start + store <4 x i32> zeroinitializer, ptr %_0, align 4 + ret void + +panic3: ; preds = %start + unreachable +} + +attributes #0 = { "target-features"="+vpu" }