Index: llvm/trunk/lib/Target/X86/X86InstrAVX512.td =================================================================== --- llvm/trunk/lib/Target/X86/X86InstrAVX512.td +++ llvm/trunk/lib/Target/X86/X86InstrAVX512.td @@ -739,7 +739,7 @@ vextract128_extract, EXTRACT_get_vextract128_imm, [HasAVX512, NoDQI]>; defm : vextract_for_size_lowering<"VEXTRACTF64x4Z", v16f32_info, v8f32x_info, - vextract128_extract, EXTRACT_get_vextract128_imm, [HasAVX512, NoDQI]>; + vextract256_extract, EXTRACT_get_vextract256_imm, [HasAVX512, NoDQI]>; defm : vextract_for_size_lowering<"VEXTRACTI64x4Z", v16i32_info, v8i32x_info, vextract256_extract, EXTRACT_get_vextract256_imm, [HasAVX512, NoDQI]>; Index: llvm/trunk/test/CodeGen/X86/vector-shuffle-512-v16.ll =================================================================== --- llvm/trunk/test/CodeGen/X86/vector-shuffle-512-v16.ll +++ llvm/trunk/test/CodeGen/X86/vector-shuffle-512-v16.ll @@ -120,3 +120,14 @@ ret <16 x i32> %c } +define <8 x float> @shuffle_v16f32_extract_256(float* %RET, float* %a) { +; ALL-LABEL: shuffle_v16f32_extract_256: +; ALL: # BB#0: +; ALL-NEXT: vmovups (%rsi), %zmm0 +; ALL-NEXT: vextractf64x4 $1, %zmm0, %ymm0 +; ALL-NEXT: retq + %ptr_a = bitcast float* %a to <16 x float>* + %v_a = load <16 x float>, <16 x float>* %ptr_a, align 4 + %v2 = shufflevector <16 x float> %v_a, <16 x float> undef, <8 x i32> + ret <8 x float> %v2 +}