This is an archive of the discontinued LLVM Phabricator instance.

Paths

Table of Contents

-
clang/test/
-
test/
-
CodeGen/
-
SystemZ/
-
builtins-systemz-zvector-constrained.c
-
builtins-systemz-zvector.c
-
builtins-systemz-zvector2-constrained.c
-
builtins-systemz-zvector2.c
-
X86/
-
avx-shuffle-builtins.c
-
aarch64-bf16-ldst-intrinsics.c
-
aarch64-neon-vcmla.c
-
aarch64-sve-intrinsics/
-
acle_sve_abd.c
-
acle_sve_acge.c
-
acle_sve_acgt.c
-
acle_sve_acle.c
-
acle_sve_aclt.c
-
acle_sve_add.c
-
acle_sve_and.c
-
acle_sve_asr.c
-
acle_sve_bfdot.c
-
acle_sve_bfmlalb.c
-
acle_sve_bfmlalt.c
-
acle_sve_bic.c
-
acle_sve_cmpeq.c
-
acle_sve_cmpge.c
-
acle_sve_cmpgt.c
-
acle_sve_cmple.c
-
acle_sve_cmplt.c
-
acle_sve_cmpne.c
-
acle_sve_cmpuo.c
-
acle_sve_div.c
-
acle_sve_divr.c
-
acle_sve_dot.c
-
acle_sve_dup-bfloat.c
-
acle_sve_dup.c
-
acle_sve_dupq-bfloat.c
-
acle_sve_dupq.c
-
acle_sve_eor.c
-
acle_sve_lsl.c
-
acle_sve_lsr.c
-
acle_sve_mad.c
-
acle_sve_max.c
-
acle_sve_maxnm.c
-
acle_sve_min.c
-
acle_sve_minnm.c
-
acle_sve_mla.c
-
acle_sve_mls.c
-
acle_sve_msb.c
-
acle_sve_mul.c
-
acle_sve_mulh.c
-
acle_sve_mulx.c
-
acle_sve_nmad.c
-
acle_sve_nmla.c
-
acle_sve_nmls.c
-
acle_sve_nmsb.c
-
acle_sve_orr.c
-
acle_sve_qadd.c
-
acle_sve_qsub.c
-
acle_sve_scale.c
-
acle_sve_sub.c
-
acle_sve_subr.c
-
acle_sve_sudot.c
-
acle_sve_usdot.c
-
aarch64-sve2-intrinsics/
-
acle_sve2_aba.c
-
acle_sve2_abalb.c
-
acle_sve2_abalt.c
-
acle_sve2_abdlb.c
-
acle_sve2_abdlt.c
-
acle_sve2_adclb.c
-
acle_sve2_adclt.c
-
acle_sve2_addhnb.c
-
acle_sve2_addhnt.c
-
acle_sve2_addlb.c
-
acle_sve2_addlbt.c
-
acle_sve2_addlt.c
-
acle_sve2_addwb.c
-
acle_sve2_addwt.c
-
acle_sve2_bcax.c
-
acle_sve2_bdep.c
-
acle_sve2_bext.c
-
acle_sve2_bgrp.c
-
acle_sve2_bsl.c
-
acle_sve2_bsl1n.c
-
acle_sve2_bsl2n.c
-
acle_sve2_eor3.c
-
acle_sve2_eorbt.c
-
acle_sve2_eortb.c
-
acle_sve2_hadd.c
-
acle_sve2_hsub.c
-
acle_sve2_hsubr.c
-
acle_sve2_mlalb.c
-
acle_sve2_mlalt.c
-
acle_sve2_mlslb.c
-
acle_sve2_mlslt.c
-
acle_sve2_mullb.c
-
acle_sve2_mullt.c
-
acle_sve2_nbsl.c
-
acle_sve2_pmul.c
-
acle_sve2_pmullb.c
-
acle_sve2_pmullb_128.c
-
acle_sve2_pmullt.c
-
acle_sve2_pmullt_128.c
-
acle_sve2_qadd.c
-
acle_sve2_qdmlalb.c
-
acle_sve2_qdmlalbt.c
-
acle_sve2_qdmlalt.c
-
acle_sve2_qdmlslb.c
-
acle_sve2_qdmlslbt.c
-
acle_sve2_qdmlslt.c
-
acle_sve2_qdmulh.c
-
acle_sve2_qdmullb.c
-
acle_sve2_qdmullt.c
-
acle_sve2_qrdmlah.c
-
acle_sve2_qrdmlsh.c
-
acle_sve2_qrdmulh.c
-
acle_sve2_qrshl.c
-
acle_sve2_qshl.c
-
acle_sve2_qsub.c
-
acle_sve2_qsubr.c
-
acle_sve2_raddhnb.c
-
acle_sve2_raddhnt.c
-
acle_sve2_rhadd.c
-
acle_sve2_rshl.c
-
acle_sve2_rsubhnb.c
-
acle_sve2_rsubhnt.c
-
acle_sve2_sbclb.c
-
acle_sve2_sbclt.c
-
acle_sve2_sqadd.c
-
acle_sve2_subhnb.c
-
acle_sve2_subhnt.c
-
acle_sve2_sublb.c
-
acle_sve2_sublbt.c
-
acle_sve2_sublt.c
-
acle_sve2_subltb.c
-
acle_sve2_subwb.c
-
acle_sve2_subwt.c
-
acle_sve2_uqadd.c
-
Headers/
-
wasm.c
-
llvm/
-
lib/Transforms/InstCombine/
-
Transforms/
-
InstCombine/
2
InstCombineVectorOps.cpp
-
test/Transforms/
-
Transforms/
-
InstCombine/
-
AArch64/
-
sve-intrinsic-opts-dup.ll
-
sve-intrinsic-opts-lasta-lastb.ll
-
sve-intrinsic-opts-unpkhi-unpklo.ll
-
sve-intrinsic-tbl-dupx.ll
-
AMDGPU/
-
amdgcn-demanded-vector-elts-inseltpoison.ll
-
amdgcn-demanded-vector-elts.ll
-
ExtractCast.ll
-
X86/
-
x86-addsub-inseltpoison.ll
-
x86-addsub.ll
-
x86-avx512-inseltpoison.ll
-
x86-avx512.ll
-
x86-fma.ll
-
x86-insertps.ll
-
x86-pshufb-inseltpoison.ll
-
x86-pshufb.ll
-
x86-sse-inseltpoison.ll
-
x86-sse.ll
-
x86-sse2-inseltpoison.ll
-
x86-sse2.ll
-
x86-sse41-inseltpoison.ll
-
x86-sse41.ll
-
x86-vec_demanded_elts-inseltpoison.ll
-
x86-vec_demanded_elts.ll
-
x86-vector-shifts-inseltpoison.ll
-
x86-vector-shifts.ll
-
x86-vpermil-inseltpoison.ll
-
x86-vpermil.ll
-
x86-xop-inseltpoison.ll
-
x86-xop.ll
-
bitcast-bigendian.ll
-
bitcast-inselt-bitcast.ll
-
bitcast-inseltpoison.ll
-
bitcast-vec-canon-inseltpoison.ll
-
bitcast-vec-canon.ll
-
bitcast.ll
-
broadcast-inseltpoison.ll
-
broadcast.ll
-
cast_ptr.ll
-
extractelement-inseltpoison.ll
-
extractelement.ll
-
fmul-inseltpoison.ll
-
fmul.ll
-
gep-inbounds-null.ll
-
gep-vector-indices.ll
-
getelementptr.ll
-
icmp-bc-vec-inseltpoison.ll
-
icmp-bc-vec.ll
-
inselt-binop-inseltpoison.ll
-
inselt-binop.ll
-
insert-const-shuf.ll
-
insert-extract-shuffle-inseltpoison.ll
-
insert-extract-shuffle.ll
-
insertelement-bitcast.ll
-
masked_intrinsics-inseltpoison.ll
-
masked_intrinsics.ll
-
masked_intrinsics_keep_metadata.ll
-
minmax-fold.ll
-
multi-size-address-space-pointer.ll
-
pr38984-inseltpoison.ll
-
pr38984.ll
-
reduction-add-sext-zext-i1.ll
-
reduction-and-sext-zext-i1.ll
-
reduction-mul-sext-zext-i1.ll
-
reduction-or-sext-zext-i1.ll
-
reduction-smax-sext-zext-i1.ll
-
reduction-smin-sext-zext-i1.ll
-
reduction-umax-sext-zext-i1.ll
-
reduction-umin-sext-zext-i1.ll
-
reduction-xor-sext-zext-i1.ll
-
scalarization-inseltpoison.ll
-
scalarization.ll
-
select-extractelement-inseltpoison.ll
-
select-extractelement.ll
-
select-safe-impliedcond-transforms.ll
-
shift-add-inseltpoison.ll
-
shift-add.ll
-
shufflevec-bitcast-inseltpoison.ll
-
shufflevec-bitcast.ll
-
shufflevector-div-rem-inseltpoison.ll
-
shufflevector-div-rem.ll
-
sincospi.ll
-
sink-into-catchswitch.ll
-
trunc-extractelement-inseltpoison.ll
-
trunc-extractelement.ll
-
trunc-inseltpoison.ll
-
trunc.ll
-
type_pun-inseltpoison.ll
-
type_pun.ll
-
vec_demanded_elts-inseltpoison.ll
-
vec_demanded_elts.ll
-
vec_extract_2elts.ll
-
vec_gep_scalar_arg-inseltpoison.ll
-
vec_gep_scalar_arg.ll
-
vec_phi_extract-inseltpoison.ll
-
vec_phi_extract.ll
-
vec_shuffle-inseltpoison.ll
-
vec_shuffle.ll
-
vector-casts-inseltpoison.ll
-
vector-casts.ll
-
vector-reverse.ll
-
vector_insertelt_shuffle-inseltpoison.ll
-
vector_insertelt_shuffle.ll
-
vscale_cmp.ll
-
vscale_extractelement-inseltpoison.ll
-
vscale_extractelement.ll
-
vscale_insertelement-inseltpoison.ll
-
vscale_insertelement.ll
-
LoopVectorize/
-
AArch64/
-
aarch64-predication.ll
-
intrinsiccost.ll
-
sve-cond-inv-loads.ll
-
sve-gather-scatter.ll
-
sve-inductions.ll
-
sve-widen-phi.ll
-
ARM/
-
mve-saddsatcost.ll
-
pointer_iv.ll
-
SystemZ/
-
addressing.ll
-
X86/
-
consecutive-ptr-uniforms.ll
-
gather_scatter.ll
-
intrinsiccost.ll
-
invariant-load-gather.ll
-
invariant-store-vectorization.ll
-
metadata-enable.ll
-
parallel-loops.ll
-
small-size.ll
-
x86-interleaved-accesses-masked-group.ll
-
x86-interleaved-store-accesses-with-gaps.ll
-
bsd_regex.ll
-
extract-last-veclane.ll
-
first-order-recurrence.ll
-
float-induction.ll
-
induction.ll
-
interleaved-accesses-pred-stores.ll
-
interleaved-accesses.ll
-
invariant-store-vectorization-2.ll
-
invariant-store-vectorization.ll
-
loop-scalars.ll
-
reduction-inloop-pred.ll
-
reduction-inloop-uf4.ll
-
reduction-inloop.ll
-
scalable-inductions.ll
-
vector-geps.ll
-
PhaseOrdering/
-
AArch64/
-
hoisting-sinking-required-for-vectorization.ll
-
peel-multiple-unreachable-exits-for-vectorization.ll
-
ARM/
-
mve-floatreduce.ll
-
X86/
-
vdiv-nounroll.ll
-
vdiv.ll
-
vector-reductions-logical.ll
-
vector-reductions.ll
-
SLPVectorizer/
-
AArch64/
-
gather-cost.ll
-
gather-reduce.ll
-
getelementptr.ll
-
transpose-inseltpoison.ll
-
transpose.ll
-
WebAssembly/
-
no-vectorize-rotate.ll
-
X86/
-
alternate-calls-inseltpoison.ll
-
alternate-calls.ll
-
alternate-fp-inseltpoison.ll
-
alternate-fp.ll
-
alternate-int-inseltpoison.ll
-
alternate-int.ll
-
blending-shuffle-inseltpoison.ll
-
blending-shuffle.ll
-
cmp_commute-inseltpoison.ll
-
cmp_commute.ll
-
minimum-sizes.ll
-
operandorder.ll
-
pr40522.ll
-
pr46983.ll
-
pr47623.ll
-
pr47629-inseltpoison.ll
-
pr47629.ll
-
pr47642.ll
-
pr49081.ll

Differential D115387

[instcombine] Canonicalize constant index type to i64 for extractelement/insertelement
ClosedPublic

Authored by reames on Dec 8 2021, 1:03 PM.

Download Raw Diff

Details

Reviewers

spatel
craig.topper
lebedev.ri
nikic

Commits

rGe6ad9ef4e7ae: [instcombine] Canonicalize constant index type to i64 for…

Summary

The basic idea behind this is that a) having a single canonical type makes CSE easier, and b) many of our transforms are inconsistent about which types we end up with based on visit order.

I'm restricting this to constants as for non-constants, we'd have to decide whether the simplicity was worth extra instructions. For constants, there are no extra instructions.

A couple process notes:

Sorry for the lack of context, there are so many test changes that Phabricator choked on a full context diff.
This isn't all of the test diffs, only the autogened ones. If we're happy with the direction, I'll autogen a bunch of files, and then update the rest before submit.

Diff Detail

Repository: rG LLVM Github Monorepo

Event Timeline

reames created this revision.Dec 8 2021, 1:03 PM

Herald added subscribers: dmgreen, arphaman, zzheng and 6 others. · View Herald TranscriptDec 8 2021, 1:03 PM

reames requested review of this revision.Dec 8 2021, 1:03 PM

Herald added a project: Restricted Project. · View Herald TranscriptDec 8 2021, 1:03 PM

Herald added a subscriber: aheejin. · View Herald Transcript

Canonicalizing this sounds generally reasonable, but why towards i64 rather than i32? We require i32 for shuffle masks, and it's the canonical type for struct indices, so it seems like the more natural choice, and would probably result in fewer test diffs.

reames mentioned this in D115394: [instcombine] Do demanded elts last when visiting extractelement.Dec 8 2021, 1:34 PM

Hm, I see now that IRBuilder will use an i64 by default, which is presumably the reason for the choice.

In D115387#3180930, @nikic wrote:

Hm, I see now that IRBuilder will use an i64 by default, which is presumably the reason for the choice.

Actually, the choice was much more arbitrary than that. I tried both, and saw huge diffs with each. Given that, I went with what I tend to write.

I could argue that this matches the canonicalization for GEP indices on most 64 bit targets, but really, I think this is pretty arbitrary. If we were doing non-constants, we'd probably care a lot more about the choice, but with only constants we really shouldn't need to care as all the actual values are going to be extremely small (and thus representable with anything the target chooses pretty easily).

Harbormaster completed remote builds in B138262: Diff 392898.Dec 8 2021, 4:33 PM

Okay, in that case this looks good to me, we don't seem to have any clearly preferred type here. Given the test churn, waiting for a second opinion would be good.

llvm/lib/Transforms/InstCombine/InstCombineVectorOps.cpp
382	Something like `auto *NewIdx = ConstantInt::get(IndexC->getContext(), IndexC->getValue().zextOrTrunc(64))` might be more elegant?

Whatever we choose will be wrong anyway so let's go for i32 unless we actually need those upper 32 bits to be usable.

In D115387#3182240, @lebedev.ri wrote:

Whatever we choose will be wrong anyway so let's go for i32 unless we actually need those upper 32 bits to be usable.

If no target has a chance of codegen'ing anything close to that limit, I'd go for i32. For example, this may not finish in any practical timeframe with llc?

define void @f(<1048576 x i8>* %x) {
  %v = load <1048576 x i8>, <1048576 x i8>* %x
  %add = add <1048576 x i8> %v, %v
  store <1048576 x i8> %add, <1048576 x i8>* %x
  ret void
}

No matter what value is chosen, we should make a helper function and/or give the bitwidth a name, so we're not using a magic constant in multiple places.

Sounds like the consensus is i32? I'll give it another day for further discussion, and will then update the patch if that's the direction we want to go in.

In D115387#3183235, @reames wrote:

Sounds like the consensus is i32? I'll give it another day for further discussion, and will then update the patch if that's the direction we want to go in.

Would we update IRBuilder to use i32 and perhaps change the interface from uint64_t to unsigned?

In D115387#3183282, @craig.topper wrote:

In D115387#3183235, @reames wrote:

Sounds like the consensus is i32? I'll give it another day for further discussion, and will then update the patch if that's the direction we want to go in.

Would we update IRBuilder to use i32 and perhaps change the interface from uint64_t to unsigned?

Can we not increase the scope of the patch? This is purely a minor cleanup as far as I'm concerned, and if it grows too much, I'll simply abandon it as not worth the effort.

I am particularly concerned about changing argument types of the public API given the possibility for silent downcast.

In D115387#3183352, @reames wrote:

In D115387#3183282, @craig.topper wrote:

In D115387#3183235, @reames wrote:

Sounds like the consensus is i32? I'll give it another day for further discussion, and will then update the patch if that's the direction we want to go in.

Would we update IRBuilder to use i32 and perhaps change the interface from uint64_t to unsigned?

Can we not increase the scope of the patch? This is purely a minor cleanup as far as I'm concerned, and if it grows too much, I'll simply abandon it as not worth the effort.

I am particularly concerned about changing argument types of the public API given the possibility for silent downcast.

I guess my point was that it seems silly to have IRBuilder make something that InstCombine will always change. So maybe that's a vote for using i64 and not i32?

Can we go with I64 since some canonicalization is better than nothing, and if someone cares about making it I32, do that in a separate patch? Aside from some large test churn, I don't really see any downside to changing this (arbitrary) choice later.

In D115387#3183444, @reames wrote:

Can we go with I64 since some canonicalization is better than nothing, and if someone cares about making it I32, do that in a separate patch? Aside from some large test churn, I don't really see any downside to changing this (arbitrary) choice later.

No objection to i64 from me.

Incorporate style suggestion. Once this is LGTMed, I'll autogen all the relevant tests and rebase once more before commit.

LGTM

This revision is now accepted and ready to land.Dec 13 2021, 9:54 AM

llvm/lib/Transforms/InstCombine/InstCombineVectorOps.cpp
370	Pull out the repeated `64` constant?

reames mentioned this in rG1a18de3d0a25: Autogen a bunch of instcombine and vectorizer tests.Dec 13 2021, 10:41 AM

reames mentioned this in rGbbfaf0b170b6: Autogen more vectorizer tests in advance of D115387..Dec 13 2021, 11:04 AM

Harbormaster completed remote builds in B139010: Diff 393946.Dec 13 2021, 11:13 AM

I'm abandoning work on this. Sorry for doing that for an already approved patch, but the work required to finish the last update on the test turns out to be significantly more than I'd thought, and just isn't worth it.

The clang tests affected by this seem to be primarily intrinsic tests. These tests don't autogenerate correctly, despite claiming to be autogened. A single attempt at autogenning them takes more than an hour of runtime. The tests check both IR and assembly. Each test contains hundreds of sub-tests, so updating them by hand is not really an option.

IMHO, these intrinsic tests should not be in tree. I'm frustrated enough at the moment to just delete them, but that hardly seems like a constructive response. Given that, I'm just going to walk away since this patch was solely motivated by a desire to clean up from the beginning.

reames mentioned this in rGbbba86764ae8: Revert "Autogen more vectorizer tests in advance of D115387.".Dec 13 2021, 12:48 PM

In D115387#3190135, @reames wrote:

I'm abandoning work on this. Sorry for doing that for an already approved patch, but the work required to finish the last update on the test turns out to be significantly more than I'd thought, and just isn't worth it.

The clang tests affected by this seem to be primarily intrinsic tests. These tests don't autogenerate correctly, despite claiming to be autogened. A single attempt at autogenning them takes more than an hour of runtime. The tests check both IR and assembly. Each test contains hundreds of sub-tests, so updating them by hand is not really an option.

IMHO, these intrinsic tests should not be in tree. I'm frustrated enough at the moment to just delete them, but that hardly seems like a constructive response. Given that, I'm just going to walk away since this patch was solely motivated by a desire to clean up from the beginning.

Can you point to some examples of the affected tests?

In D115387#3190168, @craig.topper wrote:

Can you point to some examples of the affected tests?

Here are the ones which still fail after using update_cc_test_checks.py

Clang :: CodeGen/SystemZ/builtins-systemz-zvector-constrained.c
Clang :: CodeGen/SystemZ/builtins-systemz-zvector.c
Clang :: CodeGen/SystemZ/builtins-systemz-zvector2-constrained.c
Clang :: CodeGen/SystemZ/builtins-systemz-zvector2.c
Clang :: CodeGen/X86/avx-shuffle-builtins.c
Clang :: CodeGen/aarch64-bf16-ldst-intrinsics.c
Clang :: CodeGen/aarch64-neon-vcmla.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_abdlb.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_abdlt.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_adclb.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_adclt.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_addhnb.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_addhnt.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_addlb.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_addlbt.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_addlt.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_addwb.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_addwt.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_bcax.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_bdep.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_bext.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_bgrp.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_bsl.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_bsl1n.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_bsl2n.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_eor3.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_eorbt.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_eortb.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_hadd.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_hsub.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_hsubr.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_mlalb.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_mlalt.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_mlslb.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_mlslt.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_mullb.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_mullt.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_nbsl.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_pmul.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_pmullb.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_pmullb_128.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_pmullt.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_pmullt_128.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_qadd.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_qdmlalb.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_qdmlalbt.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_qdmlalt.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_qdmlslb.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_qdmlslbt.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_qdmlslt.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_qdmulh.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_qdmullb.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_qdmullt.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_qrdmlah.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_qrdmlsh.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_qrdmulh.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_qrshl.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_qshl.c
Clang :: CodeGen/aarch64-sve2-intrinsics/acle_sve2_qsub.c

Ignore my rant above. Had lunch and rechecked history, and noticed user error on my part. The tests are still very slow, but it's possible the auto-update will work when run properly. We'll see.

reames mentioned this in rGeb052f6b8f78: Reapply: Autogen more vectorizer tests in advance of D115387..Dec 13 2021, 3:49 PM

Reopening as I've gotten all the tests worked through.

This revision is now accepted and ready to land.Dec 13 2021, 4:30 PM

This revision was landed with ongoing or failed builds.Dec 13 2021, 4:57 PM

Closed by commit rGe6ad9ef4e7ae: [instcombine] Canonicalize constant index type to i64 for… (authored by reames). · Explain Why

This revision was automatically updated to reflect the committed changes.

reames added a commit: rGe6ad9ef4e7ae: [instcombine] Canonicalize constant index type to i64 for….

Herald added a project: Restricted Project. · View Herald TranscriptDec 13 2021, 4:57 PM

Herald added subscribers: cfe-commits, kerbowa, pengfei and 2 others. · View Herald Transcript

Large Diff

This large diff affects 308 files. Files without inline comments have been collapsed. Expand All Files

Revision Contents

Path

Size

clang/

test/

CodeGen/

SystemZ/

builtins-systemz-zvector-constrained.c

2 lines

builtins-systemz-zvector.c

18 lines

builtins-systemz-zvector2-constrained.c

16 lines

builtins-systemz-zvector2.c

16 lines

X86/

avx-shuffle-builtins.c

6 lines

aarch64-bf16-ldst-intrinsics.c

1325 lines

aarch64-neon-vcmla.c

8 lines

aarch64-sve-intrinsics/

133 lines

8 lines

8 lines

8 lines

8 lines

132 lines

96 lines

84 lines

4 lines

4 lines

4 lines

96 lines

56 lines

68 lines

68 lines

68 lines

68 lines

56 lines

12 lines

84 lines

84 lines

16 lines

acle_sve_dup-bfloat.c

8 lines

acle_sve_dup.c

104 lines

acle_sve_dupq-bfloat.c

32 lines

416 lines

96 lines

36 lines

36 lines

132 lines

132 lines

36 lines

132 lines

36 lines

132 lines

132 lines

132 lines

132 lines

96 lines

36 lines

36 lines

36 lines

36 lines

36 lines

96 lines

32 lines

32 lines

36 lines

132 lines

132 lines

4 lines

4 lines

aarch64-sve2-intrinsics/

32 lines

24 lines

24 lines

24 lines

24 lines

8 lines

8 lines

24 lines

24 lines

24 lines

12 lines

24 lines

24 lines

24 lines

32 lines

16 lines

16 lines

16 lines

32 lines

32 lines

32 lines

32 lines

32 lines

32 lines

96 lines

96 lines

96 lines

28 lines

28 lines

28 lines

28 lines

24 lines

24 lines

32 lines

4 lines

16 lines

acle_sve2_pmullb_128.c

4 lines

acle_sve2_pmullt.c

16 lines

acle_sve2_pmullt_128.c

4 lines

96 lines

12 lines

12 lines

12 lines

12 lines

12 lines

12 lines

16 lines

12 lines

12 lines

16 lines

16 lines

16 lines

96 lines

96 lines

96 lines

96 lines

24 lines

24 lines

96 lines

96 lines

24 lines

24 lines

8 lines

8 lines

48 lines

24 lines

24 lines

24 lines

12 lines

24 lines

12 lines

24 lines

24 lines

48 lines

Headers/

wasm.c

364 lines

llvm/

lib/

Transforms/

InstCombine/

InstCombineVectorOps.cpp

21 lines

test/

Transforms/

InstCombine/

AArch64/

sve-intrinsic-opts-dup.ll

2 lines

sve-intrinsic-opts-lasta-lastb.ll

2 lines

sve-intrinsic-opts-unpkhi-unpklo.ll

8 lines

sve-intrinsic-tbl-dupx.ll

24 lines

AMDGPU/

amdgcn-demanded-vector-elts-inseltpoison.ll

136 lines

amdgcn-demanded-vector-elts.ll

136 lines

ExtractCast.ll

4 lines

X86/

x86-addsub-inseltpoison.ll

40 lines

x86-addsub.ll

40 lines

x86-avx512-inseltpoison.ll

74 lines

x86-avx512.ll

74 lines

x86-fma.ll

6 lines

x86-insertps.ll

2 lines

x86-pshufb-inseltpoison.ll

2 lines

x86-pshufb.ll

2 lines

x86-sse-inseltpoison.ll

86 lines

x86-sse.ll

86 lines

x86-sse2-inseltpoison.ll

78 lines

x86-sse2.ll

78 lines

x86-sse41-inseltpoison.ll

16 lines

x86-sse41.ll

16 lines

x86-vec_demanded_elts-inseltpoison.ll

18 lines

x86-vec_demanded_elts.ll

18 lines

x86-vector-shifts-inseltpoison.ll

18 lines

x86-vector-shifts.ll

22 lines

x86-vpermil-inseltpoison.ll

2 lines

x86-vpermil.ll

2 lines

x86-xop-inseltpoison.ll

8 lines

x86-xop.ll

8 lines

bitcast-bigendian.ll

18 lines

bitcast-inselt-bitcast.ll

34 lines

bitcast-inseltpoison.ll

28 lines

bitcast-vec-canon-inseltpoison.ll

14 lines

bitcast-vec-canon.ll

14 lines

bitcast.ll

28 lines

broadcast-inseltpoison.ll

40 lines

broadcast.ll

40 lines

cast_ptr.ll

10 lines

extractelement-inseltpoison.ll

40 lines

44 lines

2 lines

2 lines

2 lines

gep-vector-indices.ll

16 lines

getelementptr.ll

4 lines

icmp-bc-vec-inseltpoison.ll

4 lines

icmp-bc-vec.ll

4 lines

inselt-binop-inseltpoison.ll

108 lines

inselt-binop.ll

108 lines

insert-const-shuf.ll

12 lines

insert-extract-shuffle-inseltpoison.ll

112 lines

insert-extract-shuffle.ll

120 lines

insertelement-bitcast.ll

10 lines

masked_intrinsics-inseltpoison.ll

4 lines

masked_intrinsics.ll

4 lines

masked_intrinsics_keep_metadata.ll

2 lines

minmax-fold.ll

6 lines

multi-size-address-space-pointer.ll

2 lines

pr38984-inseltpoison.ll

2 lines

pr38984.ll

2 lines

reduction-add-sext-zext-i1.ll

4 lines

reduction-and-sext-zext-i1.ll

4 lines

reduction-mul-sext-zext-i1.ll

4 lines

reduction-or-sext-zext-i1.ll

4 lines

reduction-smax-sext-zext-i1.ll

4 lines

reduction-smin-sext-zext-i1.ll

4 lines

reduction-umax-sext-zext-i1.ll

4 lines

reduction-umin-sext-zext-i1.ll

4 lines

reduction-xor-sext-zext-i1.ll

4 lines

scalarization-inseltpoison.ll

40 lines

scalarization.ll

40 lines

select-extractelement-inseltpoison.ll

18 lines

select-extractelement.ll

60 lines

select-safe-impliedcond-transforms.ll

2 lines

shift-add-inseltpoison.ll

6 lines

shift-add.ll

6 lines

shufflevec-bitcast-inseltpoison.ll

4 lines

shufflevec-bitcast.ll

10 lines

shufflevector-div-rem-inseltpoison.ll

16 lines

shufflevector-div-rem.ll

16 lines

sincospi.ll

8 lines

sink-into-catchswitch.ll

2 lines

trunc-extractelement-inseltpoison.ll

36 lines

trunc-extractelement.ll

36 lines

trunc-inseltpoison.ll

6 lines

trunc.ll

6 lines

type_pun-inseltpoison.ll

20 lines

type_pun.ll

20 lines

vec_demanded_elts-inseltpoison.ll

64 lines

vec_demanded_elts.ll

64 lines

vec_extract_2elts.ll

2 lines

vec_gep_scalar_arg-inseltpoison.ll

2 lines

vec_gep_scalar_arg.ll

2 lines

vec_phi_extract-inseltpoison.ll

8 lines

vec_phi_extract.ll

8 lines

vec_shuffle-inseltpoison.ll

32 lines

vec_shuffle.ll

32 lines

vector-casts-inseltpoison.ll

6 lines

vector-casts.ll

6 lines

vector-reverse.ll

4 lines

vector_insertelt_shuffle-inseltpoison.ll

8 lines

vector_insertelt_shuffle.ll

8 lines

vscale_cmp.ll

2 lines

vscale_extractelement-inseltpoison.ll

36 lines

vscale_extractelement.ll

40 lines

vscale_insertelement-inseltpoison.ll

26 lines

vscale_insertelement.ll

26 lines

LoopVectorize/

AArch64/

aarch64-predication.ll

16 lines

intrinsiccost.ll

20 lines

sve-cond-inv-loads.ll

6 lines

sve-gather-scatter.ll

8 lines

sve-inductions.ll

2 lines

sve-widen-phi.ll

6 lines

ARM/

mve-saddsatcost.ll

4 lines

pointer_iv.ll

38 lines

SystemZ/

addressing.ll

4 lines

X86/

consecutive-ptr-uniforms.ll

4 lines

gather_scatter.ll

76 lines

intrinsiccost.ll

32 lines

invariant-load-gather.ll

12 lines

invariant-store-vectorization.ll

24 lines

metadata-enable.ll

150 lines

parallel-loops.ll

8 lines

small-size.ll

44 lines

x86-interleaved-accesses-masked-group.ll

1814 lines

x86-interleaved-store-accesses-with-gaps.ll

134 lines

bsd_regex.ll

8 lines

extract-last-veclane.ll

4 lines

first-order-recurrence.ll

234 lines

float-induction.ll

96 lines

induction.ll

348 lines

interleaved-accesses-pred-stores.ll

34 lines

interleaved-accesses.ll

106 lines

invariant-store-vectorization-2.ll

16 lines

invariant-store-vectorization.ll

14 lines

loop-scalars.ll

4 lines

reduction-inloop-pred.ll

314 lines

reduction-inloop-uf4.ll

72 lines

reduction-inloop.ll

3 lines

scalable-inductions.ll

12 lines

vector-geps.ll

2 lines

PhaseOrdering/

AArch64/

hoisting-sinking-required-for-vectorization.ll

2 lines

peel-multiple-unreachable-exits-for-vectorization.ll

4 lines

ARM/

mve-floatreduce.ll

12 lines

X86/

vdiv-nounroll.ll

2 lines

vdiv.ll

8 lines

vector-reductions-logical.ll

30 lines

vector-reductions.ll

18 lines

SLPVectorizer/

AArch64/

gather-cost.ll

8 lines

gather-reduce.ll

64 lines

getelementptr.ll

42 lines

transpose-inseltpoison.ll

24 lines

transpose.ll

24 lines

WebAssembly/

no-vectorize-rotate.ll

8 lines

X86/

alternate-calls-inseltpoison.ll

24 lines

alternate-calls.ll

24 lines

alternate-fp-inseltpoison.ll

10 lines

alternate-fp.ll

10 lines

alternate-int-inseltpoison.ll

90 lines

alternate-int.ll

90 lines

blending-shuffle-inseltpoison.ll

24 lines

blending-shuffle.ll

24 lines

cmp_commute-inseltpoison.ll

12 lines

12 lines

16 lines

28 lines

32 lines

54 lines

4 lines

pr47629-inseltpoison.ll

376 lines

pr47629.ll

376 lines

pr47642.ll

8 lines

pr49081.ll

4 lines

This is an archive of the discontinued LLVM Phabricator instance.

[instcombine] Canonicalize constant index type to i64 for extractelement/insertelement ClosedPublic

Details

Diff Detail

Event Timeline

Large Diff

Revision Contents

Diff 394088

clang/test/CodeGen/SystemZ/builtins-systemz-zvector-constrained.c

clang/test/CodeGen/SystemZ/builtins-systemz-zvector.c

clang/test/CodeGen/SystemZ/builtins-systemz-zvector2-constrained.c

clang/test/CodeGen/SystemZ/builtins-systemz-zvector2.c

clang/test/CodeGen/X86/avx-shuffle-builtins.c

clang/test/CodeGen/aarch64-bf16-ldst-intrinsics.c

clang/test/CodeGen/aarch64-neon-vcmla.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_abd.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_acge.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_acgt.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_acle.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_aclt.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_add.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_and.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_asr.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_bfdot.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_bfmlalb.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_bfmlalt.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_bic.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_cmpeq.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_cmpge.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_cmpgt.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_cmple.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_cmplt.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_cmpne.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_cmpuo.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_div.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_divr.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_dot.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_dup-bfloat.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_dup.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_dupq-bfloat.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_dupq.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_eor.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_lsl.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_lsr.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_mad.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_max.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_maxnm.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_min.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_minnm.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_mla.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_mls.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_msb.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_mul.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_mulh.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_mulx.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_nmad.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_nmla.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_nmls.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_nmsb.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_orr.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_qadd.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_qsub.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_scale.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_sub.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_subr.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_sudot.c

clang/test/CodeGen/aarch64-sve-intrinsics/acle_sve_usdot.c

clang/test/CodeGen/aarch64-sve2-intrinsics/acle_sve2_aba.c

clang/test/CodeGen/aarch64-sve2-intrinsics/acle_sve2_abalb.c

clang/test/CodeGen/aarch64-sve2-intrinsics/acle_sve2_abalt.c

clang/test/CodeGen/aarch64-sve2-intrinsics/acle_sve2_abdlb.c

clang/test/CodeGen/aarch64-sve2-intrinsics/acle_sve2_abdlt.c

clang/test/CodeGen/aarch64-sve2-intrinsics/acle_sve2_adclb.c

clang/test/CodeGen/aarch64-sve2-intrinsics/acle_sve2_adclt.c

clang/test/CodeGen/aarch64-sve2-intrinsics/acle_sve2_addhnb.c

clang/test/CodeGen/aarch64-sve2-intrinsics/acle_sve2_addhnt.c

clang/test/CodeGen/aarch64-sve2-intrinsics/acle_sve2_addlb.c

clang/test/CodeGen/aarch64-sve2-intrinsics/acle_sve2_addlbt.c

clang/test/CodeGen/aarch64-sve2-intrinsics/acle_sve2_addlt.c

clang/test/CodeGen/aarch64-sve2-intrinsics/acle_sve2_addwb.c

[instcombine] Canonicalize constant index type to i64 for extractelement/insertelement
ClosedPublic