Index: lib/Target/WebAssembly/WebAssemblyISelLowering.cpp =================================================================== --- lib/Target/WebAssembly/WebAssemblyISelLowering.cpp +++ lib/Target/WebAssembly/WebAssemblyISelLowering.cpp @@ -174,11 +174,24 @@ // - Floating-point extending loads. // - Floating-point truncating stores. // - i1 extending loads. + // - extending/truncating SIMD loads/stores setLoadExtAction(ISD::EXTLOAD, MVT::f64, MVT::f32, Expand); setTruncStoreAction(MVT::f64, MVT::f32, Expand); for (auto T : MVT::integer_valuetypes()) for (auto Ext : {ISD::EXTLOAD, ISD::ZEXTLOAD, ISD::SEXTLOAD}) setLoadExtAction(Ext, T, MVT::i1, Promote); + if (Subtarget->hasSIMD128()) { + for (auto T : {MVT::v16i8, MVT::v8i16, MVT::v4i32, MVT::v2i64, MVT::v4f32, + MVT::v2f64}) { + for (auto MemT : MVT::vector_valuetypes()) { + if (MVT(T) != MemT) { + setTruncStoreAction(T, MemT, Expand); + for (auto Ext : {ISD::EXTLOAD, ISD::ZEXTLOAD, ISD::SEXTLOAD}) + setLoadExtAction(Ext, T, MemT, Expand); + } + } + } + } // Trap lowers to wasm unreachable setOperationAction(ISD::TRAP, MVT::Other, Legal); Index: test/CodeGen/WebAssembly/simd-ext-load-trunc-store.ll =================================================================== --- /dev/null +++ test/CodeGen/WebAssembly/simd-ext-load-trunc-store.ll @@ -0,0 +1,60 @@ +; RUN: llc < %s -asm-verbose=false -disable-wasm-fallthrough-return-opt -wasm-disable-explicit-locals -wasm-keep-registers -wasm-enable-unimplemented-simd -mattr=+simd128 | FileCheck %s + +; Check that store in memory with smaller lanes are loaded and stored +; as expected. This is a regression test for part of bug 39275. + +target datalayout = "e-m:e-p:32:32-i64:64-n32:64-S128" +target triple = "wasm32-unknown-unknown" + +; CHECK-LABEL: load_ext_2xi32: +; CHECK-NEXT: .param i32{{$}} +; CHECK-NEXT: .result v128{{$}} +; CHECK-NEXT: i64.load32_u $push[[L0:[0-9]+]]=, 0($0){{$}} +; CHECK-NEXT: i64x2.splat $push[[L1:[0-9]+]]=, $pop[[L0]]{{$}} +; CHECK-NEXT: i64.load32_u $push[[L2:[0-9]+]]=, 4($0){{$}} +; CHECK-NEXT: i64x2.replace_lane $push[[R:[0-9]+]]=, $pop[[L1]], 1, $pop[[L2]]{{$}} +; CHECK-NEXT: return $pop[[R]]{{$}} +define <2 x i32> @load_ext_2xi32(<2 x i32>* %p) { + %1 = load <2 x i32>, <2 x i32>* %p, align 4 + ret <2 x i32> %1 +} + +; CHECK-LABEL: load_zext_2xi32: +; CHECK-NEXT: .param i32{{$}} +; CHECK-NEXT: .result v128{{$}} +; CHECK-NEXT: i64.load32_u $push[[L0:[0-9]+]]=, 0($0){{$}} +; CHECK-NEXT: i64x2.splat $push[[L1:[0-9]+]]=, $pop[[L0]]{{$}} +; CHECK-NEXT: i64.load32_u $push[[L2:[0-9]+]]=, 4($0){{$}} +; CHECK-NEXT: i64x2.replace_lane $push[[R:[0-9]+]]=, $pop[[L1]], 1, $pop[[L2]]{{$}} +; CHECK-NEXT: return $pop[[R]]{{$}} +define <2 x i64> @load_zext_2xi32(<2 x i32>* %p) { + %1 = load <2 x i32>, <2 x i32>* %p, align 4 + %2 = zext <2 x i32> %1 to <2 x i64> + ret <2 x i64> %2 +} + +; CHECK-LABEL: load_sext_2xi32: +; CHECK-NEXT: .param i32{{$}} +; CHECK-NEXT: .result v128{{$}} +; CHECK-NEXT: i64.load32_s $push[[L0:[0-9]+]]=, 0($0){{$}} +; CHECK-NEXT: i64x2.splat $push[[L1:[0-9]+]]=, $pop[[L0]]{{$}} +; CHECK-NEXT: i64.load32_s $push[[L2:[0-9]+]]=, 4($0){{$}} +; CHECK-NEXT: i64x2.replace_lane $push[[R:[0-9]+]]=, $pop[[L1]], 1, $pop[[L2]]{{$}} +; CHECK-NEXT: return $pop[[R]]{{$}} +define <2 x i64> @load_sext_2xi32(<2 x i32>* %p) { + %1 = load <2 x i32>, <2 x i32>* %p, align 4 + %2 = sext <2 x i32> %1 to <2 x i64> + ret <2 x i64> %2 +} + +; CHECK-LABEL: store_trunc_2xi32: +; CHECK-NEXT: .param i32, v128{{$}} +; CHECK-NEXT: i64x2.extract_lane $push[[L0:[0-9]+]]=, $1, 1 +; CHECK-NEXT: i64.store32 4($0), $pop[[L0]] +; CHECK-NEXT: i64x2.extract_lane $push[[L1:[0-9]+]]=, $1, 0 +; CHECK-NEXT: i64.store32 0($0), $pop[[L1]] +; CHECK-NEXT: return +define void @store_trunc_2xi32(<2 x i32>* %p, <2 x i32> %x) { + store <2 x i32> %x, <2 x i32>* %p, align 4 + ret void +}