This is an archive of the discontinued LLVM Phabricator instance.

[RISCV] Custom lower ISD::VSCALE.
ClosedPublic

Authored by craig.topper on Jan 7 2021, 11:24 AM.

Download Raw Diff

Details

Reviewers

HsiangKai
evandro
frasercrmck
rogfer01

Commits

rGdfc1901d513e: [RISCV] Custom lower ISD::VSCALE.

Summary

This patch custom lowers ISD::VSCALE into a csrr vlenb followed
by a shift right by 3 followed by a multiply by the scale amount.

I've added computeKnownBits support to indicate that the csrr vlenb
always produces 3 trailing zero bits so the shift right is "exact".
This allows the shift and multiply sequence to be nicely optimized
into a single shift or removed completely when the scale amount is
a power of 2.

The non-power-of-2 case (multiplying by 24) still produces
suboptimal code. We could remove the right shift and use a
multiply by 3. Hopefully we can improve DAG combine to fix that
since it's not unique to this sequence.

This replaces D94144.

Diff Detail

Repository: rG LLVM Github Monorepo

Event Timeline

craig.topper created this revision.Jan 7 2021, 11:24 AM

Herald added subscribers: NickHung, luismarques, apazos and 24 others. · View Herald TranscriptJan 7 2021, 11:24 AM

craig.topper requested review of this revision.Jan 7 2021, 11:24 AM

Herald added a project: Restricted Project. · View Herald TranscriptJan 7 2021, 11:24 AM

Herald added a subscriber: MaskRay. · View Herald Transcript

craig.topper edited the summary of this revision. (Show Details)Jan 7 2021, 11:25 AM

Harbormaster completed remote builds in B84358: Diff 315190.Jan 7 2021, 12:26 PM

HsiangKai added inline comments.Jan 13 2021, 7:18 AM

llvm/lib/Target/RISCV/RISCVISelLowering.cpp
697	I think we need to add comments to explain why we need to shift right by 3 bits.
1901	In V specification v1.0, VLEN=128 at least. We could assume VLENB is at least 16 bytes.

-Add comments about why we shift by 3.
-Add FIXMEs for the 1.0 change to VLEN>=128.

Harbormaster completed remote builds in B85056: Diff 316462.Jan 13 2021, 11:54 AM

-Remove a FIXME. Just because the minimum VLEN might be defined as 128 doesn't mean we need to change our type mappings.
-Reword the description of why we divide by 8 to not talk about VLEN.

LGTM.

This revision is now accepted and ready to land.Jan 13 2021, 5:05 PM

This revision was landed with ongoing or failed builds.Jan 13 2021, 5:33 PM

Closed by commit rGdfc1901d513e: [RISCV] Custom lower ISD::VSCALE. (authored by craig.topper). · Explain Why

This revision was automatically updated to reflect the committed changes.

craig.topper added a commit: rGdfc1901d513e: [RISCV] Custom lower ISD::VSCALE..

Harbormaster completed remote builds in B85102: Diff 316537.Jan 13 2021, 5:33 PM

Revision Contents

Path

Size

llvm/

lib/

Target/

RISCV/

RISCVISelLowering.h

7 lines

RISCVISelLowering.cpp

39 lines

RISCVInstrInfoVPseudos.td

7 lines

RISCVMCInstLower.cpp

9 lines

test/

CodeGen/

RISCV/

rvv/

rvv-vscale.i32.ll

54 lines

rvv-vscale.i64.ll

54 lines

Diff 316540

llvm/lib/Target/RISCV/RISCVISelLowering.h

Show First 20 Lines • Show All 79 Lines • ▼ Show 20 Lines	enum NodeType : unsigned {
// Vector Extension		// Vector Extension
// VMV_X_S matches the semantics of vmv.x.s. The result is always XLenVT		// VMV_X_S matches the semantics of vmv.x.s. The result is always XLenVT
// sign extended from the vector element size. NOTE: The result size will		// sign extended from the vector element size. NOTE: The result size will
// never be less than the vector element size.		// never be less than the vector element size.
VMV_X_S,		VMV_X_S,
// Splats an i64 scalar to a vector type (with element type i64) where the		// Splats an i64 scalar to a vector type (with element type i64) where the
// scalar is a sign-extended i32.		// scalar is a sign-extended i32.
SPLAT_VECTOR_I64,		SPLAT_VECTOR_I64,
		// Read VLENB CSR
		READ_VLENB,
};		};
} // namespace RISCVISD		} // namespace RISCVISD

class RISCVTargetLowering : public TargetLowering {		class RISCVTargetLowering : public TargetLowering {
const RISCVSubtarget &Subtarget;		const RISCVSubtarget &Subtarget;

public:		public:
explicit RISCVTargetLowering(const TargetMachine &TM,		explicit RISCVTargetLowering(const TargetMachine &TM,
Show All 22 Lines	public:

// Provide custom lowering hooks for some operations.		// Provide custom lowering hooks for some operations.
SDValue LowerOperation(SDValue Op, SelectionDAG &DAG) const override;		SDValue LowerOperation(SDValue Op, SelectionDAG &DAG) const override;
void ReplaceNodeResults(SDNode *N, SmallVectorImpl<SDValue> &Results,		void ReplaceNodeResults(SDNode *N, SmallVectorImpl<SDValue> &Results,
SelectionDAG &DAG) const override;		SelectionDAG &DAG) const override;

SDValue PerformDAGCombine(SDNode *N, DAGCombinerInfo &DCI) const override;		SDValue PerformDAGCombine(SDNode *N, DAGCombinerInfo &DCI) const override;

		void computeKnownBitsForTargetNode(const SDValue Op,
		KnownBits &Known,
		const APInt &DemandedElts,
		const SelectionDAG &DAG,
		unsigned Depth) const override;
unsigned ComputeNumSignBitsForTargetNode(SDValue Op,		unsigned ComputeNumSignBitsForTargetNode(SDValue Op,
const APInt &DemandedElts,		const APInt &DemandedElts,
const SelectionDAG &DAG,		const SelectionDAG &DAG,
unsigned Depth) const override;		unsigned Depth) const override;

// This method returns the name of a target specific DAG node.		// This method returns the name of a target specific DAG node.
const char *getTargetNodeName(unsigned Opcode) const override;		const char *getTargetNodeName(unsigned Opcode) const override;

▲ Show 20 Lines • Show All 168 Lines • Show Last 20 Lines

llvm/lib/Target/RISCV/RISCVISelLowering.cpp

Show All 26 Lines
#include "llvm/CodeGen/MachineRegisterInfo.h"		#include "llvm/CodeGen/MachineRegisterInfo.h"
#include "llvm/CodeGen/TargetLoweringObjectFileImpl.h"		#include "llvm/CodeGen/TargetLoweringObjectFileImpl.h"
#include "llvm/CodeGen/ValueTypes.h"		#include "llvm/CodeGen/ValueTypes.h"
#include "llvm/IR/DiagnosticInfo.h"		#include "llvm/IR/DiagnosticInfo.h"
#include "llvm/IR/DiagnosticPrinter.h"		#include "llvm/IR/DiagnosticPrinter.h"
#include "llvm/IR/IntrinsicsRISCV.h"		#include "llvm/IR/IntrinsicsRISCV.h"
#include "llvm/Support/Debug.h"		#include "llvm/Support/Debug.h"
#include "llvm/Support/ErrorHandling.h"		#include "llvm/Support/ErrorHandling.h"
		#include "llvm/Support/KnownBits.h"
#include "llvm/Support/MathExtras.h"		#include "llvm/Support/MathExtras.h"
#include "llvm/Support/raw_ostream.h"		#include "llvm/Support/raw_ostream.h"

using namespace llvm;		using namespace llvm;

#define DEBUG_TYPE "riscv-lower"		#define DEBUG_TYPE "riscv-lower"

STATISTIC(NumTailCalls, "Number of tail calls");		STATISTIC(NumTailCalls, "Number of tail calls");
▲ Show 20 Lines • Show All 302 Lines • ▼ Show 20 Lines	if (Subtarget.hasStdExtA()) {
setMaxAtomicSizeInBitsSupported(0);		setMaxAtomicSizeInBitsSupported(0);
}		}

setBooleanContents(ZeroOrOneBooleanContent);		setBooleanContents(ZeroOrOneBooleanContent);

if (Subtarget.hasStdExtV()) {		if (Subtarget.hasStdExtV()) {
setBooleanVectorContents(ZeroOrOneBooleanContent);		setBooleanVectorContents(ZeroOrOneBooleanContent);

		setOperationAction(ISD::VSCALE, XLenVT, Custom);

// RVV intrinsics may have illegal operands.		// RVV intrinsics may have illegal operands.
// We also need to custom legalize vmv.x.s.		// We also need to custom legalize vmv.x.s.
setOperationAction(ISD::INTRINSIC_WO_CHAIN, MVT::i8, Custom);		setOperationAction(ISD::INTRINSIC_WO_CHAIN, MVT::i8, Custom);
setOperationAction(ISD::INTRINSIC_WO_CHAIN, MVT::i16, Custom);		setOperationAction(ISD::INTRINSIC_WO_CHAIN, MVT::i16, Custom);
setOperationAction(ISD::INTRINSIC_W_CHAIN, MVT::i8, Custom);		setOperationAction(ISD::INTRINSIC_W_CHAIN, MVT::i8, Custom);
setOperationAction(ISD::INTRINSIC_W_CHAIN, MVT::i16, Custom);		setOperationAction(ISD::INTRINSIC_W_CHAIN, MVT::i16, Custom);
setOperationAction(ISD::INTRINSIC_WO_CHAIN, MVT::i32, Custom);		setOperationAction(ISD::INTRINSIC_WO_CHAIN, MVT::i32, Custom);
setOperationAction(ISD::INTRINSIC_W_CHAIN, MVT::i32, Custom);		setOperationAction(ISD::INTRINSIC_W_CHAIN, MVT::i32, Custom);
▲ Show 20 Lines • Show All 320 Lines • ▼ Show 20 Lines	case ISD::BITREVERSE: {
// If this is BSWAP rather than BITREVERSE, clear the lower 3 bits.		// If this is BSWAP rather than BITREVERSE, clear the lower 3 bits.
if (Op.getOpcode() == ISD::BSWAP)		if (Op.getOpcode() == ISD::BSWAP)
Imm &= ~0x7U;		Imm &= ~0x7U;
return DAG.getNode(RISCVISD::GREVI, DL, VT, Op.getOperand(0),		return DAG.getNode(RISCVISD::GREVI, DL, VT, Op.getOperand(0),
DAG.getTargetConstant(Imm, DL, Subtarget.getXLenVT()));		DAG.getTargetConstant(Imm, DL, Subtarget.getXLenVT()));
}		}
case ISD::SPLAT_VECTOR:		case ISD::SPLAT_VECTOR:
return lowerSPLATVECTOR(Op, DAG);		return lowerSPLATVECTOR(Op, DAG);
		case ISD::VSCALE: {
		MVT VT = Op.getSimpleValueType();
		SDLoc DL(Op);
		SDValue VLENB = DAG.getNode(RISCVISD::READ_VLENB, DL, VT);
		// We define our scalable vector types for lmul=1 to use a 64 bit known
		// minimum size. e.g. <vscale x 2 x i32>. VLENB is in bytes so we calculate
		HsiangKaiUnsubmitted Not Done Reply Inline Actions I think we need add comments to explain why we need to shift right 3 bits. HsiangKai: I think we need add comments to explain why we need to shift right 3 bits.
		// vscale as VLENB / 8.
		SDValue VScale = DAG.getNode(ISD::SRL, DL, VT, VLENB,
		DAG.getConstant(3, DL, VT));
		return DAG.getNode(ISD::MUL, DL, VT, VScale, Op.getOperand(0));
		}
}		}
}		}

static SDValue getTargetNode(GlobalAddressSDNode *N, SDLoc DL, EVT Ty,		static SDValue getTargetNode(GlobalAddressSDNode *N, SDLoc DL, EVT Ty,
SelectionDAG &DAG, unsigned Flags) {		SelectionDAG &DAG, unsigned Flags) {
return DAG.getTargetGlobalAddress(N->getGlobal(), DL, Ty, 0, Flags);		return DAG.getTargetGlobalAddress(N->getGlobal(), DL, Ty, 0, Flags);
}		}

▲ Show 20 Lines • Show All 1,165 Lines • ▼ Show 20 Lines	if (C1 && C2) {
// combine should be prevented.		// combine should be prevented.
if (C1Cost < ShiftedC1Cost)		if (C1Cost < ShiftedC1Cost)
return false;		return false;
}		}
}		}
return true;		return true;
}		}

		void RISCVTargetLowering::computeKnownBitsForTargetNode(const SDValue Op,
		KnownBits &Known,
		const APInt &DemandedElts,
		const SelectionDAG &DAG,
		unsigned Depth) const {
		unsigned Opc = Op.getOpcode();
		assert((Opc >= ISD::BUILTIN_OP_END \|\|
		Opc == ISD::INTRINSIC_WO_CHAIN \|\|
		Opc == ISD::INTRINSIC_W_CHAIN \|\|
		Opc == ISD::INTRINSIC_VOID) &&
		"Should use MaskedValueIsZero if you don't know whether Op"
		" is a target node!");

		Known.resetAll();
		switch (Opc) {
		default: break;
		case RISCVISD::READ_VLENB:
		// We assume VLENB is at least 8 bytes.
		HsiangKaiUnsubmitted Not Done Reply Inline Actions In V specification v1.0, VLEN=128 at least. We could assume VLENB is at least 16 bytes. HsiangKai: In V specification v1.0, VLEN=128 at least. We could assume VLENB is at least 16 bytes.
		// FIXME: The 1.0 draft spec defines minimum VLEN as 128 bits.
		Known.Zero.setLowBits(3);
		break;
		}
		}

unsigned RISCVTargetLowering::ComputeNumSignBitsForTargetNode(		unsigned RISCVTargetLowering::ComputeNumSignBitsForTargetNode(
SDValue Op, const APInt &DemandedElts, const SelectionDAG &DAG,		SDValue Op, const APInt &DemandedElts, const SelectionDAG &DAG,
unsigned Depth) const {		unsigned Depth) const {
switch (Op.getOpcode()) {		switch (Op.getOpcode()) {
default:		default:
break;		break;
case RISCVISD::SLLW:		case RISCVISD::SLLW:
case RISCVISD::SRAW:		case RISCVISD::SRAW:
▲ Show 20 Lines • Show All 1,657 Lines • ▼ Show 20 Lines	#define NODE_NAME_CASE(NODE) \
NODE_NAME_CASE(FMV_X_ANYEXTW_RV64)		NODE_NAME_CASE(FMV_X_ANYEXTW_RV64)
NODE_NAME_CASE(READ_CYCLE_WIDE)		NODE_NAME_CASE(READ_CYCLE_WIDE)
NODE_NAME_CASE(GREVI)		NODE_NAME_CASE(GREVI)
NODE_NAME_CASE(GREVIW)		NODE_NAME_CASE(GREVIW)
NODE_NAME_CASE(GORCI)		NODE_NAME_CASE(GORCI)
NODE_NAME_CASE(GORCIW)		NODE_NAME_CASE(GORCIW)
NODE_NAME_CASE(VMV_X_S)		NODE_NAME_CASE(VMV_X_S)
NODE_NAME_CASE(SPLAT_VECTOR_I64)		NODE_NAME_CASE(SPLAT_VECTOR_I64)
		NODE_NAME_CASE(READ_VLENB)
}		}
// clang-format on		// clang-format on
return nullptr;		return nullptr;
#undef NODE_NAME_CASE		#undef NODE_NAME_CASE
}		}

/// getConstraintType - Given a constraint letter, return the type of		/// getConstraintType - Given a constraint letter, return the type of
/// constraint it is for this target.		/// constraint it is for this target.
▲ Show 20 Lines • Show All 449 Lines • Show Last 20 Lines

llvm/lib/Target/RISCV/RISCVInstrInfoVPseudos.td

	Show All 11 Lines
	///			///
	/// This file is included from RISCVInstrInfoV.td			/// This file is included from RISCVInstrInfoV.td
	///			///
	//===----------------------------------------------------------------------===//			//===----------------------------------------------------------------------===//

	def riscv_vmv_x_s : SDNode<"RISCVISD::VMV_X_S",			def riscv_vmv_x_s : SDNode<"RISCVISD::VMV_X_S",
	SDTypeProfile<1, 1, [SDTCisInt<0>, SDTCisVec<1>,			SDTypeProfile<1, 1, [SDTCisInt<0>, SDTCisVec<1>,
	SDTCisInt<1>]>>;			SDTCisInt<1>]>>;
				def riscv_read_vlenb : SDNode<"RISCVISD::READ_VLENB",
				SDTypeProfile<1, 0, [SDTCisVT<0, XLenVT>]>>;

	// X0 has special meaning for vsetvl/vsetvli.			// X0 has special meaning for vsetvl/vsetvli.
	// rd \| rs1 \| AVL value \| Effect on vl			// rd \| rs1 \| AVL value \| Effect on vl
	//--------------------------------------------------------------			//--------------------------------------------------------------
	// !X0 \| X0 \| VLMAX \| Set vl to VLMAX			// !X0 \| X0 \| VLMAX \| Set vl to VLMAX
	// X0 \| X0 \| Value in vl \| Keep current vl, just change vtype.			// X0 \| X0 \| Value in vl \| Keep current vl, just change vtype.
	def NoX0 : SDNodeXForm<undef,			def NoX0 : SDNodeXForm<undef,
	[{			[{
	▲ Show 20 Lines • Show All 2,364 Lines • ▼ Show 20 Lines
	//===----------------------------------------------------------------------===//			//===----------------------------------------------------------------------===//
	let hasSideEffects = 0, mayLoad = 0, mayStore = 0 in {			let hasSideEffects = 0, mayLoad = 0, mayStore = 0 in {
	def PseudoVMV1R_V : VPseudo<VMV1R_V, V_M1, (outs VR:$vd), (ins VR:$vs2)>;			def PseudoVMV1R_V : VPseudo<VMV1R_V, V_M1, (outs VR:$vd), (ins VR:$vs2)>;
	def PseudoVMV2R_V : VPseudo<VMV2R_V, V_M2, (outs VRM2:$vd), (ins VRM2:$vs2)>;			def PseudoVMV2R_V : VPseudo<VMV2R_V, V_M2, (outs VRM2:$vd), (ins VRM2:$vs2)>;
	def PseudoVMV4R_V : VPseudo<VMV4R_V, V_M4, (outs VRM4:$vd), (ins VRM4:$vs2)>;			def PseudoVMV4R_V : VPseudo<VMV4R_V, V_M4, (outs VRM4:$vd), (ins VRM4:$vs2)>;
	def PseudoVMV8R_V : VPseudo<VMV8R_V, V_M8, (outs VRM8:$vd), (ins VRM8:$vs2)>;			def PseudoVMV8R_V : VPseudo<VMV8R_V, V_M8, (outs VRM8:$vd), (ins VRM8:$vs2)>;
	}			}

				let hasSideEffects = 0, mayLoad = 0, mayStore = 0, isCodeGenOnly = 1 in {
				def PseudoReadVLENB : Pseudo<(outs GPR:$rd), (ins),
				[(set GPR:$rd, (riscv_read_vlenb))]>;
				}

	//===----------------------------------------------------------------------===//			//===----------------------------------------------------------------------===//
	// 6. Configuration-Setting Instructions			// 6. Configuration-Setting Instructions
	//===----------------------------------------------------------------------===//			//===----------------------------------------------------------------------===//

	// Pseudos.			// Pseudos.
	let hasSideEffects = 1, mayLoad = 0, mayStore = 0, Defs = [VL, VTYPE] in {			let hasSideEffects = 1, mayLoad = 0, mayStore = 0, Defs = [VL, VTYPE] in {
	def PseudoVSETVLI : Pseudo<(outs GPR:$rd), (ins GPR:$rs1, VTypeIOp:$vtypei), []>;			def PseudoVSETVLI : Pseudo<(outs GPR:$rd), (ins GPR:$rs1, VTypeIOp:$vtypei), []>;

	▲ Show 20 Lines • Show All 1,209 Lines • Show Last 20 Lines

llvm/lib/Target/RISCV/RISCVMCInstLower.cpp

Show First 20 Lines • Show All 204 Lines • ▼ Show 20 Lines	void llvm::LowerRISCVMachineInstrToMCInst(const MachineInstr *MI, MCInst &OutMI,

OutMI.setOpcode(MI->getOpcode());		OutMI.setOpcode(MI->getOpcode());

for (const MachineOperand &MO : MI->operands()) {		for (const MachineOperand &MO : MI->operands()) {
MCOperand MCOp;		MCOperand MCOp;
if (LowerRISCVMachineOperandToMCOperand(MO, MCOp, AP))		if (LowerRISCVMachineOperandToMCOperand(MO, MCOp, AP))
OutMI.addOperand(MCOp);		OutMI.addOperand(MCOp);
}		}

		if (OutMI.getOpcode() == RISCV::PseudoReadVLENB) {
		OutMI.setOpcode(RISCV::CSRRS);
		OutMI.addOperand(MCOperand::createImm(
		RISCVSysReg::lookupSysRegByName("VLENB")->Encoding));
		OutMI.addOperand(MCOperand::createReg(RISCV::X0));
		return;
		}

}		}

llvm/test/CodeGen/RISCV/rvv/rvv-vscale.i32.ll

This file was added.

				; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
				; RUN: llc -mtriple riscv32 -mattr=+m,+experimental-v < %s \
				; RUN: \| FileCheck %s

				define i32 @vscale_zero() nounwind {
				; CHECK-LABEL: vscale_zero:
				; CHECK: # %bb.0: # %entry
				; CHECK-NEXT: mv a0, zero
				; CHECK-NEXT: ret
				entry:
				%0 = call i32 @llvm.vscale.i32()
				%1 = mul i32 %0, 0
				ret i32 %1
				}

				define i32 @vscale_one() nounwind {
				; CHECK-LABEL: vscale_one:
				; CHECK: # %bb.0: # %entry
				; CHECK-NEXT: csrr a0, vlenb
				; CHECK-NEXT: srli a0, a0, 3
				; CHECK-NEXT: ret
				entry:
				%0 = call i32 @llvm.vscale.i32()
				%1 = mul i32 %0, 1
				ret i32 %1
				}

				define i32 @vscale_uimmpow2xlen() nounwind {
				; CHECK-LABEL: vscale_uimmpow2xlen:
				; CHECK: # %bb.0: # %entry
				; CHECK-NEXT: csrr a0, vlenb
				; CHECK-NEXT: slli a0, a0, 3
				; CHECK-NEXT: ret
				entry:
				%0 = call i32 @llvm.vscale.i32()
				%1 = mul i32 %0, 64
				ret i32 %1
				}

				define i32 @vscale_non_pow2() nounwind {
				; CHECK-LABEL: vscale_non_pow2:
				; CHECK: # %bb.0: # %entry
				; CHECK-NEXT: csrr a0, vlenb
				; CHECK-NEXT: srli a0, a0, 3
				; CHECK-NEXT: addi a1, zero, 24
				; CHECK-NEXT: mul a0, a0, a1
				; CHECK-NEXT: ret
				entry:
				%0 = call i32 @llvm.vscale.i32()
				%1 = mul i32 %0, 24
				ret i32 %1
				}

				declare i32 @llvm.vscale.i32()

llvm/test/CodeGen/RISCV/rvv/rvv-vscale.i64.ll

This file was added.

				; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
				; RUN: llc -mtriple riscv64 -mattr=+m,+experimental-v < %s \
				; RUN: \| FileCheck %s

				define i64 @vscale_zero() nounwind {
				; CHECK-LABEL: vscale_zero:
				; CHECK: # %bb.0: # %entry
				; CHECK-NEXT: mv a0, zero
				; CHECK-NEXT: ret
				entry:
				%0 = call i64 @llvm.vscale.i64()
				%1 = mul i64 %0, 0
				ret i64 %1
				}

				define i64 @vscale_one() nounwind {
				; CHECK-LABEL: vscale_one:
				; CHECK: # %bb.0: # %entry
				; CHECK-NEXT: csrr a0, vlenb
				; CHECK-NEXT: srli a0, a0, 3
				; CHECK-NEXT: ret
				entry:
				%0 = call i64 @llvm.vscale.i64()
				%1 = mul i64 %0, 1
				ret i64 %1
				}

				define i64 @vscale_uimmpow2xlen() nounwind {
				; CHECK-LABEL: vscale_uimmpow2xlen:
				; CHECK: # %bb.0: # %entry
				; CHECK-NEXT: csrr a0, vlenb
				; CHECK-NEXT: slli a0, a0, 3
				; CHECK-NEXT: ret
				entry:
				%0 = call i64 @llvm.vscale.i64()
				%1 = mul i64 %0, 64
				ret i64 %1
				}

				define i64 @vscale_non_pow2() nounwind {
				; CHECK-LABEL: vscale_non_pow2:
				; CHECK: # %bb.0: # %entry
				; CHECK-NEXT: csrr a0, vlenb
				; CHECK-NEXT: srli a0, a0, 3
				; CHECK-NEXT: addi a1, zero, 24
				; CHECK-NEXT: mul a0, a0, a1
				; CHECK-NEXT: ret
				entry:
				%0 = call i64 @llvm.vscale.i64()
				%1 = mul i64 %0, 24
				ret i64 %1
				}

				declare i64 @llvm.vscale.i64()