Index: lib/Target/ARM64/ARM64InstrFormats.td =================================================================== --- lib/Target/ARM64/ARM64InstrFormats.td +++ lib/Target/ARM64/ARM64InstrFormats.td @@ -6867,10 +6867,12 @@ def d : BaseSIMDScalarShift { + [(set (i64 FPR64:$Rd), (OpNode (i64 FPR64:$Rn), (i32 vecshiftL64:$imm)))]> { let Inst{21-16} = imm{5-0}; } + + def : Pat<(v1i64 (OpNode (v1i64 FPR64:$Rn), (i32 vecshiftL64:$imm))), + (!cast(NAME # "d") FPR64:$Rn, vecshiftL64:$imm)>; } multiclass SIMDScalarRShiftBHSD opc, string asm> { Index: tools/clang/lib/CodeGen/CGBuiltin.cpp =================================================================== --- tools/clang/lib/CodeGen/CGBuiltin.cpp +++ tools/clang/lib/CodeGen/CGBuiltin.cpp @@ -5526,10 +5526,8 @@ case NEON::BI__builtin_neon_vqshlud_n_s64: { Ops.push_back(EmitScalarExpr(E->getArg(1))); Ops[1] = Builder.CreateZExt(Ops[1], Int64Ty); - llvm::Type *VTy = llvm::VectorType::get(Int64Ty, 1); - Ops[0] = EmitNeonCall(CGM.getIntrinsic(Intrinsic::arm64_neon_sqshlu, VTy), - Ops, "vqshlu_n"); - return Builder.CreateBitCast(Ops[0], Int64Ty); + return EmitNeonCall(CGM.getIntrinsic(Intrinsic::arm64_neon_sqshlu, Int64Ty), + Ops, "vqshlu_n"); } case NEON::BI__builtin_neon_vqshld_n_u64: case NEON::BI__builtin_neon_vqshld_n_s64: { @@ -5538,9 +5536,7 @@ : Intrinsic::arm64_neon_sqshl; Ops.push_back(EmitScalarExpr(E->getArg(1))); Ops[1] = Builder.CreateZExt(Ops[1], Int64Ty); - llvm::Type *VTy = llvm::VectorType::get(Int64Ty, 1); - Ops[0] = EmitNeonCall(CGM.getIntrinsic(Int, VTy), Ops, "vqshl_n"); - return Builder.CreateBitCast(Ops[0], Int64Ty); + return EmitNeonCall(CGM.getIntrinsic(Int, Int64Ty), Ops, "vqshl_n"); } case NEON::BI__builtin_neon_vrshrd_n_u64: case NEON::BI__builtin_neon_vrshrd_n_s64: { @@ -5548,9 +5544,9 @@ ? Intrinsic::arm64_neon_urshl : Intrinsic::arm64_neon_srshl; Ops.push_back(EmitScalarExpr(E->getArg(1))); - llvm::Type *VTy = llvm::VectorType::get(Int64Ty, 1); - Ops[0] = EmitNeonCall(CGM.getIntrinsic(Int, VTy), Ops, "vrshr_n", 1, true); - return Builder.CreateBitCast(Ops[0], Int64Ty); + int SV = cast(Ops[1])->getSExtValue(); + Ops[1] = ConstantInt::get(Int64Ty, -SV); + return EmitNeonCall(CGM.getIntrinsic(Int, Int64Ty), Ops, "vrshr_n"); } case NEON::BI__builtin_neon_vrsrad_n_u64: case NEON::BI__builtin_neon_vrsrad_n_s64: { Index: tools/clang/test/CodeGen/arm64-scalar-test.c =================================================================== --- tools/clang/test/CodeGen/arm64-scalar-test.c +++ tools/clang/test/CodeGen/arm64-scalar-test.c @@ -114,6 +114,12 @@ // CHECK: sqshl {{d[0-9]+}}, {{d[0-9]+}}, {{d[0-9]+}} } +// CHECK: test_vqshld_s64_i +int64_t test_vqshld_s64_i(int64_t a) { + return vqshld_s64(a, 36); +// CHECK: sqshl {{d[0-9]+}}, {{d[0-9]+}}, #36 +} + // CHECK: test_vqshlb_u8 uint8_t test_vqshlb_u8(uint8_t a, uint8_t b) { return vqshlb_u8(a, b); @@ -138,6 +144,12 @@ // CHECK: uqshl {{d[0-9]+}}, {{d[0-9]+}}, {{d[0-9]+}} } +// CHECK: test_vqshld_u64_i +uint64_t test_vqshld_u64_i(uint64_t a) { + return vqshld_u64(a, 36); +// CHECK: uqshl {{d[0-9]+}}, {{d[0-9]+}}, #36 +} + // CHECK: test_vshld_u64 uint64_t test_vshld_u64(uint64_t a, uint64_t b) { return vshld_u64(a, b);