Please use GitHub pull requests for new patches. Avoid migrating existing patches. Phabricator shutdown timeline
Changeset View
Changeset View
Standalone View
Standalone View
llvm/test/CodeGen/AMDGPU/GlobalISel/global-value.ll
; NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py | ; NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py | ||||
; RUN: llc -global-isel -mtriple=amdgcn-amd-amdhsa -mcpu=hawaii -stop-after=legalizer < %s | FileCheck -check-prefix=HSA %s | ; RUN: llc -global-isel -mtriple=amdgcn-amd-amdhsa -mcpu=hawaii -stop-after=legalizer < %s | FileCheck -check-prefix=GCN %s | ||||
; RUN: llc -global-isel -mtriple=amdgcn-amd-amdpal -mcpu=hawaii -stop-after=legalizer < %s | FileCheck -check-prefix=PAL %s | ; RUN: llc -global-isel -mtriple=amdgcn-amd-amdpal -mcpu=hawaii -stop-after=legalizer < %s | FileCheck -check-prefix=GCN %s | ||||
@external_constant = external addrspace(4) constant i32, align 4 | @external_constant = external addrspace(4) constant i32, align 4 | ||||
@external_constant32 = external addrspace(6) constant i32, align 4 | @external_constant32 = external addrspace(6) constant i32, align 4 | ||||
@external_global = external addrspace(1) global i32, align 4 | @external_global = external addrspace(1) global i32, align 4 | ||||
@external_other = external addrspace(999) global i32, align 4 | @external_other = external addrspace(999) global i32, align 4 | ||||
@internal_constant = internal addrspace(4) constant i32 9, align 4 | @internal_constant = internal addrspace(4) constant i32 9, align 4 | ||||
@internal_constant32 = internal addrspace(6) constant i32 9, align 4 | @internal_constant32 = internal addrspace(6) constant i32 9, align 4 | ||||
@internal_global = internal addrspace(1) global i32 9, align 4 | @internal_global = internal addrspace(1) global i32 9, align 4 | ||||
@internal_other = internal addrspace(999) global i32 9, align 4 | @internal_other = internal addrspace(999) global i32 9, align 4 | ||||
define i32 addrspace(4)* @external_constant_got() { | define i32 addrspace(4)* @external_constant_got() { | ||||
; HSA-LABEL: name: external_constant_got | ; GCN-LABEL: name: external_constant_got | ||||
; HSA: bb.1 (%ir-block.0): | ; GCN: bb.1 (%ir-block.0): | ||||
; HSA: liveins: $sgpr30_sgpr31 | ; GCN: liveins: $sgpr30_sgpr31 | ||||
; HSA: [[COPY:%[0-9]+]]:sgpr_64 = COPY $sgpr30_sgpr31 | ; GCN: [[COPY:%[0-9]+]]:sgpr_64 = COPY $sgpr30_sgpr31 | ||||
; HSA: [[SI_PC_ADD_REL_OFFSET:%[0-9]+]]:sreg_64(p4) = SI_PC_ADD_REL_OFFSET target-flags(amdgpu-gotprel32-lo) @external_constant + 4, target-flags(amdgpu-gotprel32-hi) @external_constant + 4, implicit-def $scc | ; GCN: [[SI_PC_ADD_REL_OFFSET:%[0-9]+]]:sreg_64(p4) = SI_PC_ADD_REL_OFFSET target-flags(amdgpu-gotprel32-lo) @external_constant + 4, target-flags(amdgpu-gotprel32-hi) @external_constant + 4, implicit-def $scc | ||||
; HSA: [[LOAD:%[0-9]+]]:_(p4) = G_LOAD [[SI_PC_ADD_REL_OFFSET]](p4) :: (dereferenceable invariant load 8 from got, addrspace 4) | ; GCN: [[LOAD:%[0-9]+]]:_(p4) = G_LOAD [[SI_PC_ADD_REL_OFFSET]](p4) :: (dereferenceable invariant load 8 from got, addrspace 4) | ||||
; HSA: [[UV:%[0-9]+]]:_(s32), [[UV1:%[0-9]+]]:_(s32) = G_UNMERGE_VALUES [[LOAD]](p4) | ; GCN: [[UV:%[0-9]+]]:_(s32), [[UV1:%[0-9]+]]:_(s32) = G_UNMERGE_VALUES [[LOAD]](p4) | ||||
; HSA: $vgpr0 = COPY [[UV]](s32) | ; GCN: $vgpr0 = COPY [[UV]](s32) | ||||
; HSA: $vgpr1 = COPY [[UV1]](s32) | ; GCN: $vgpr1 = COPY [[UV1]](s32) | ||||
; HSA: [[COPY1:%[0-9]+]]:ccr_sgpr_64 = COPY [[COPY]] | ; GCN: [[COPY1:%[0-9]+]]:ccr_sgpr_64 = COPY [[COPY]] | ||||
; HSA: S_SETPC_B64_return [[COPY1]], implicit $vgpr0, implicit $vgpr1 | ; GCN: S_SETPC_B64_return [[COPY1]], implicit $vgpr0, implicit $vgpr1 | ||||
; PAL-LABEL: name: external_constant_got | |||||
; PAL: bb.1 (%ir-block.0): | |||||
; PAL: liveins: $sgpr30_sgpr31 | |||||
; PAL: [[COPY:%[0-9]+]]:sgpr_64 = COPY $sgpr30_sgpr31 | |||||
; PAL: [[SI_PC_ADD_REL_OFFSET:%[0-9]+]]:sreg_64(p4) = SI_PC_ADD_REL_OFFSET @external_constant + 4, 0, implicit-def $scc | |||||
; PAL: [[UV:%[0-9]+]]:_(s32), [[UV1:%[0-9]+]]:_(s32) = G_UNMERGE_VALUES [[SI_PC_ADD_REL_OFFSET]](p4) | |||||
; PAL: $vgpr0 = COPY [[UV]](s32) | |||||
; PAL: $vgpr1 = COPY [[UV1]](s32) | |||||
; PAL: [[COPY1:%[0-9]+]]:ccr_sgpr_64 = COPY [[COPY]] | |||||
; PAL: S_SETPC_B64_return [[COPY1]], implicit $vgpr0, implicit $vgpr1 | |||||
ret i32 addrspace(4)* @external_constant | ret i32 addrspace(4)* @external_constant | ||||
} | } | ||||
define i32 addrspace(1)* @external_global_got() { | define i32 addrspace(1)* @external_global_got() { | ||||
; HSA-LABEL: name: external_global_got | ; GCN-LABEL: name: external_global_got | ||||
; HSA: bb.1 (%ir-block.0): | ; GCN: bb.1 (%ir-block.0): | ||||
; HSA: liveins: $sgpr30_sgpr31 | ; GCN: liveins: $sgpr30_sgpr31 | ||||
; HSA: [[COPY:%[0-9]+]]:sgpr_64 = COPY $sgpr30_sgpr31 | ; GCN: [[COPY:%[0-9]+]]:sgpr_64 = COPY $sgpr30_sgpr31 | ||||
; HSA: [[SI_PC_ADD_REL_OFFSET:%[0-9]+]]:sreg_64(p4) = SI_PC_ADD_REL_OFFSET target-flags(amdgpu-gotprel32-lo) @external_global + 4, target-flags(amdgpu-gotprel32-hi) @external_global + 4, implicit-def $scc | ; GCN: [[SI_PC_ADD_REL_OFFSET:%[0-9]+]]:sreg_64(p4) = SI_PC_ADD_REL_OFFSET target-flags(amdgpu-gotprel32-lo) @external_global + 4, target-flags(amdgpu-gotprel32-hi) @external_global + 4, implicit-def $scc | ||||
; HSA: [[LOAD:%[0-9]+]]:_(p1) = G_LOAD [[SI_PC_ADD_REL_OFFSET]](p4) :: (dereferenceable invariant load 8 from got, addrspace 4) | ; GCN: [[LOAD:%[0-9]+]]:_(p1) = G_LOAD [[SI_PC_ADD_REL_OFFSET]](p4) :: (dereferenceable invariant load 8 from got, addrspace 4) | ||||
; HSA: [[UV:%[0-9]+]]:_(s32), [[UV1:%[0-9]+]]:_(s32) = G_UNMERGE_VALUES [[LOAD]](p1) | ; GCN: [[UV:%[0-9]+]]:_(s32), [[UV1:%[0-9]+]]:_(s32) = G_UNMERGE_VALUES [[LOAD]](p1) | ||||
; HSA: $vgpr0 = COPY [[UV]](s32) | ; GCN: $vgpr0 = COPY [[UV]](s32) | ||||
; HSA: $vgpr1 = COPY [[UV1]](s32) | ; GCN: $vgpr1 = COPY [[UV1]](s32) | ||||
; HSA: [[COPY1:%[0-9]+]]:ccr_sgpr_64 = COPY [[COPY]] | ; GCN: [[COPY1:%[0-9]+]]:ccr_sgpr_64 = COPY [[COPY]] | ||||
; HSA: S_SETPC_B64_return [[COPY1]], implicit $vgpr0, implicit $vgpr1 | ; GCN: S_SETPC_B64_return [[COPY1]], implicit $vgpr0, implicit $vgpr1 | ||||
; PAL-LABEL: name: external_global_got | |||||
; PAL: bb.1 (%ir-block.0): | |||||
; PAL: liveins: $sgpr30_sgpr31 | |||||
; PAL: [[COPY:%[0-9]+]]:sgpr_64 = COPY $sgpr30_sgpr31 | |||||
; PAL: [[SI_PC_ADD_REL_OFFSET:%[0-9]+]]:sreg_64(p4) = SI_PC_ADD_REL_OFFSET target-flags(amdgpu-gotprel32-lo) @external_global + 4, target-flags(amdgpu-gotprel32-hi) @external_global + 4, implicit-def $scc | |||||
; PAL: [[LOAD:%[0-9]+]]:_(p1) = G_LOAD [[SI_PC_ADD_REL_OFFSET]](p4) :: (dereferenceable invariant load 8 from got, addrspace 4) | |||||
; PAL: [[UV:%[0-9]+]]:_(s32), [[UV1:%[0-9]+]]:_(s32) = G_UNMERGE_VALUES [[LOAD]](p1) | |||||
; PAL: $vgpr0 = COPY [[UV]](s32) | |||||
; PAL: $vgpr1 = COPY [[UV1]](s32) | |||||
; PAL: [[COPY1:%[0-9]+]]:ccr_sgpr_64 = COPY [[COPY]] | |||||
; PAL: S_SETPC_B64_return [[COPY1]], implicit $vgpr0, implicit $vgpr1 | |||||
ret i32 addrspace(1)* @external_global | ret i32 addrspace(1)* @external_global | ||||
} | } | ||||
define i32 addrspace(999)* @external_other_got() { | define i32 addrspace(999)* @external_other_got() { | ||||
; HSA-LABEL: name: external_other_got | ; GCN-LABEL: name: external_other_got | ||||
; HSA: bb.1 (%ir-block.0): | ; GCN: bb.1 (%ir-block.0): | ||||
; HSA: liveins: $sgpr30_sgpr31 | ; GCN: liveins: $sgpr30_sgpr31 | ||||
; HSA: [[COPY:%[0-9]+]]:sgpr_64 = COPY $sgpr30_sgpr31 | ; GCN: [[COPY:%[0-9]+]]:sgpr_64 = COPY $sgpr30_sgpr31 | ||||
; HSA: [[SI_PC_ADD_REL_OFFSET:%[0-9]+]]:sreg_64(p4) = SI_PC_ADD_REL_OFFSET target-flags(amdgpu-gotprel32-lo) @external_other + 4, target-flags(amdgpu-gotprel32-hi) @external_other + 4, implicit-def $scc | ; GCN: [[SI_PC_ADD_REL_OFFSET:%[0-9]+]]:sreg_64(p4) = SI_PC_ADD_REL_OFFSET target-flags(amdgpu-gotprel32-lo) @external_other + 4, target-flags(amdgpu-gotprel32-hi) @external_other + 4, implicit-def $scc | ||||
; HSA: [[LOAD:%[0-9]+]]:_(p999) = G_LOAD [[SI_PC_ADD_REL_OFFSET]](p4) :: (dereferenceable invariant load 8 from got, addrspace 4) | ; GCN: [[LOAD:%[0-9]+]]:_(p999) = G_LOAD [[SI_PC_ADD_REL_OFFSET]](p4) :: (dereferenceable invariant load 8 from got, addrspace 4) | ||||
; HSA: [[UV:%[0-9]+]]:_(s32), [[UV1:%[0-9]+]]:_(s32) = G_UNMERGE_VALUES [[LOAD]](p999) | ; GCN: [[UV:%[0-9]+]]:_(s32), [[UV1:%[0-9]+]]:_(s32) = G_UNMERGE_VALUES [[LOAD]](p999) | ||||
; HSA: $vgpr0 = COPY [[UV]](s32) | ; GCN: $vgpr0 = COPY [[UV]](s32) | ||||
; HSA: $vgpr1 = COPY [[UV1]](s32) | ; GCN: $vgpr1 = COPY [[UV1]](s32) | ||||
; HSA: [[COPY1:%[0-9]+]]:ccr_sgpr_64 = COPY [[COPY]] | ; GCN: [[COPY1:%[0-9]+]]:ccr_sgpr_64 = COPY [[COPY]] | ||||
; HSA: S_SETPC_B64_return [[COPY1]], implicit $vgpr0, implicit $vgpr1 | ; GCN: S_SETPC_B64_return [[COPY1]], implicit $vgpr0, implicit $vgpr1 | ||||
; PAL-LABEL: name: external_other_got | |||||
; PAL: bb.1 (%ir-block.0): | |||||
; PAL: liveins: $sgpr30_sgpr31 | |||||
; PAL: [[COPY:%[0-9]+]]:sgpr_64 = COPY $sgpr30_sgpr31 | |||||
; PAL: [[SI_PC_ADD_REL_OFFSET:%[0-9]+]]:sreg_64(p4) = SI_PC_ADD_REL_OFFSET target-flags(amdgpu-gotprel32-lo) @external_other + 4, target-flags(amdgpu-gotprel32-hi) @external_other + 4, implicit-def $scc | |||||
; PAL: [[LOAD:%[0-9]+]]:_(p999) = G_LOAD [[SI_PC_ADD_REL_OFFSET]](p4) :: (dereferenceable invariant load 8 from got, addrspace 4) | |||||
; PAL: [[UV:%[0-9]+]]:_(s32), [[UV1:%[0-9]+]]:_(s32) = G_UNMERGE_VALUES [[LOAD]](p999) | |||||
; PAL: $vgpr0 = COPY [[UV]](s32) | |||||
; PAL: $vgpr1 = COPY [[UV1]](s32) | |||||
; PAL: [[COPY1:%[0-9]+]]:ccr_sgpr_64 = COPY [[COPY]] | |||||
; PAL: S_SETPC_B64_return [[COPY1]], implicit $vgpr0, implicit $vgpr1 | |||||
ret i32 addrspace(999)* @external_other | ret i32 addrspace(999)* @external_other | ||||
} | } | ||||
define i32 addrspace(4)* @internal_constant_pcrel() { | define i32 addrspace(4)* @internal_constant_pcrel() { | ||||
; HSA-LABEL: name: internal_constant_pcrel | ; GCN-LABEL: name: internal_constant_pcrel | ||||
; HSA: bb.1 (%ir-block.0): | ; GCN: bb.1 (%ir-block.0): | ||||
; HSA: liveins: $sgpr30_sgpr31 | ; GCN: liveins: $sgpr30_sgpr31 | ||||
; HSA: [[COPY:%[0-9]+]]:sgpr_64 = COPY $sgpr30_sgpr31 | ; GCN: [[COPY:%[0-9]+]]:sgpr_64 = COPY $sgpr30_sgpr31 | ||||
; HSA: [[SI_PC_ADD_REL_OFFSET:%[0-9]+]]:sreg_64(p4) = SI_PC_ADD_REL_OFFSET target-flags(amdgpu-rel32-lo) @internal_constant + 4, target-flags(amdgpu-rel32-hi) @internal_constant + 4, implicit-def $scc | ; GCN: [[SI_PC_ADD_REL_OFFSET:%[0-9]+]]:sreg_64(p4) = SI_PC_ADD_REL_OFFSET target-flags(amdgpu-rel32-lo) @internal_constant + 4, target-flags(amdgpu-rel32-hi) @internal_constant + 4, implicit-def $scc | ||||
; HSA: [[UV:%[0-9]+]]:_(s32), [[UV1:%[0-9]+]]:_(s32) = G_UNMERGE_VALUES [[SI_PC_ADD_REL_OFFSET]](p4) | ; GCN: [[UV:%[0-9]+]]:_(s32), [[UV1:%[0-9]+]]:_(s32) = G_UNMERGE_VALUES [[SI_PC_ADD_REL_OFFSET]](p4) | ||||
; HSA: $vgpr0 = COPY [[UV]](s32) | ; GCN: $vgpr0 = COPY [[UV]](s32) | ||||
; HSA: $vgpr1 = COPY [[UV1]](s32) | ; GCN: $vgpr1 = COPY [[UV1]](s32) | ||||
; HSA: [[COPY1:%[0-9]+]]:ccr_sgpr_64 = COPY [[COPY]] | ; GCN: [[COPY1:%[0-9]+]]:ccr_sgpr_64 = COPY [[COPY]] | ||||
; HSA: S_SETPC_B64_return [[COPY1]], implicit $vgpr0, implicit $vgpr1 | ; GCN: S_SETPC_B64_return [[COPY1]], implicit $vgpr0, implicit $vgpr1 | ||||
; PAL-LABEL: name: internal_constant_pcrel | |||||
; PAL: bb.1 (%ir-block.0): | |||||
; PAL: liveins: $sgpr30_sgpr31 | |||||
; PAL: [[COPY:%[0-9]+]]:sgpr_64 = COPY $sgpr30_sgpr31 | |||||
; PAL: [[SI_PC_ADD_REL_OFFSET:%[0-9]+]]:sreg_64(p4) = SI_PC_ADD_REL_OFFSET @internal_constant + 4, 0, implicit-def $scc | |||||
; PAL: [[UV:%[0-9]+]]:_(s32), [[UV1:%[0-9]+]]:_(s32) = G_UNMERGE_VALUES [[SI_PC_ADD_REL_OFFSET]](p4) | |||||
; PAL: $vgpr0 = COPY [[UV]](s32) | |||||
; PAL: $vgpr1 = COPY [[UV1]](s32) | |||||
; PAL: [[COPY1:%[0-9]+]]:ccr_sgpr_64 = COPY [[COPY]] | |||||
; PAL: S_SETPC_B64_return [[COPY1]], implicit $vgpr0, implicit $vgpr1 | |||||
ret i32 addrspace(4)* @internal_constant | ret i32 addrspace(4)* @internal_constant | ||||
} | } | ||||
define i32 addrspace(1)* @internal_global_pcrel() { | define i32 addrspace(1)* @internal_global_pcrel() { | ||||
; HSA-LABEL: name: internal_global_pcrel | ; GCN-LABEL: name: internal_global_pcrel | ||||
; HSA: bb.1 (%ir-block.0): | ; GCN: bb.1 (%ir-block.0): | ||||
; HSA: liveins: $sgpr30_sgpr31 | ; GCN: liveins: $sgpr30_sgpr31 | ||||
; HSA: [[COPY:%[0-9]+]]:sgpr_64 = COPY $sgpr30_sgpr31 | ; GCN: [[COPY:%[0-9]+]]:sgpr_64 = COPY $sgpr30_sgpr31 | ||||
; HSA: [[SI_PC_ADD_REL_OFFSET:%[0-9]+]]:sreg_64(p1) = SI_PC_ADD_REL_OFFSET target-flags(amdgpu-rel32-lo) @internal_global + 4, target-flags(amdgpu-rel32-hi) @internal_global + 4, implicit-def $scc | ; GCN: [[SI_PC_ADD_REL_OFFSET:%[0-9]+]]:sreg_64(p1) = SI_PC_ADD_REL_OFFSET target-flags(amdgpu-rel32-lo) @internal_global + 4, target-flags(amdgpu-rel32-hi) @internal_global + 4, implicit-def $scc | ||||
; HSA: [[UV:%[0-9]+]]:_(s32), [[UV1:%[0-9]+]]:_(s32) = G_UNMERGE_VALUES [[SI_PC_ADD_REL_OFFSET]](p1) | ; GCN: [[UV:%[0-9]+]]:_(s32), [[UV1:%[0-9]+]]:_(s32) = G_UNMERGE_VALUES [[SI_PC_ADD_REL_OFFSET]](p1) | ||||
; HSA: $vgpr0 = COPY [[UV]](s32) | ; GCN: $vgpr0 = COPY [[UV]](s32) | ||||
; HSA: $vgpr1 = COPY [[UV1]](s32) | ; GCN: $vgpr1 = COPY [[UV1]](s32) | ||||
; HSA: [[COPY1:%[0-9]+]]:ccr_sgpr_64 = COPY [[COPY]] | ; GCN: [[COPY1:%[0-9]+]]:ccr_sgpr_64 = COPY [[COPY]] | ||||
; HSA: S_SETPC_B64_return [[COPY1]], implicit $vgpr0, implicit $vgpr1 | ; GCN: S_SETPC_B64_return [[COPY1]], implicit $vgpr0, implicit $vgpr1 | ||||
; PAL-LABEL: name: internal_global_pcrel | |||||
; PAL: bb.1 (%ir-block.0): | |||||
; PAL: liveins: $sgpr30_sgpr31 | |||||
; PAL: [[COPY:%[0-9]+]]:sgpr_64 = COPY $sgpr30_sgpr31 | |||||
; PAL: [[SI_PC_ADD_REL_OFFSET:%[0-9]+]]:sreg_64(p1) = SI_PC_ADD_REL_OFFSET target-flags(amdgpu-rel32-lo) @internal_global + 4, target-flags(amdgpu-rel32-hi) @internal_global + 4, implicit-def $scc | |||||
; PAL: [[UV:%[0-9]+]]:_(s32), [[UV1:%[0-9]+]]:_(s32) = G_UNMERGE_VALUES [[SI_PC_ADD_REL_OFFSET]](p1) | |||||
; PAL: $vgpr0 = COPY [[UV]](s32) | |||||
; PAL: $vgpr1 = COPY [[UV1]](s32) | |||||
; PAL: [[COPY1:%[0-9]+]]:ccr_sgpr_64 = COPY [[COPY]] | |||||
; PAL: S_SETPC_B64_return [[COPY1]], implicit $vgpr0, implicit $vgpr1 | |||||
ret i32 addrspace(1)* @internal_global | ret i32 addrspace(1)* @internal_global | ||||
} | } | ||||
define i32 addrspace(999)* @internal_other_pcrel() { | define i32 addrspace(999)* @internal_other_pcrel() { | ||||
; HSA-LABEL: name: internal_other_pcrel | ; GCN-LABEL: name: internal_other_pcrel | ||||
; HSA: bb.1 (%ir-block.0): | ; GCN: bb.1 (%ir-block.0): | ||||
; HSA: liveins: $sgpr30_sgpr31 | ; GCN: liveins: $sgpr30_sgpr31 | ||||
; HSA: [[COPY:%[0-9]+]]:sgpr_64 = COPY $sgpr30_sgpr31 | ; GCN: [[COPY:%[0-9]+]]:sgpr_64 = COPY $sgpr30_sgpr31 | ||||
; HSA: [[SI_PC_ADD_REL_OFFSET:%[0-9]+]]:sreg_64(p999) = SI_PC_ADD_REL_OFFSET target-flags(amdgpu-rel32-lo) @internal_other + 4, target-flags(amdgpu-rel32-hi) @internal_other + 4, implicit-def $scc | ; GCN: [[SI_PC_ADD_REL_OFFSET:%[0-9]+]]:sreg_64(p999) = SI_PC_ADD_REL_OFFSET target-flags(amdgpu-rel32-lo) @internal_other + 4, target-flags(amdgpu-rel32-hi) @internal_other + 4, implicit-def $scc | ||||
; HSA: [[UV:%[0-9]+]]:_(s32), [[UV1:%[0-9]+]]:_(s32) = G_UNMERGE_VALUES [[SI_PC_ADD_REL_OFFSET]](p999) | ; GCN: [[UV:%[0-9]+]]:_(s32), [[UV1:%[0-9]+]]:_(s32) = G_UNMERGE_VALUES [[SI_PC_ADD_REL_OFFSET]](p999) | ||||
; HSA: $vgpr0 = COPY [[UV]](s32) | ; GCN: $vgpr0 = COPY [[UV]](s32) | ||||
; HSA: $vgpr1 = COPY [[UV1]](s32) | ; GCN: $vgpr1 = COPY [[UV1]](s32) | ||||
; HSA: [[COPY1:%[0-9]+]]:ccr_sgpr_64 = COPY [[COPY]] | ; GCN: [[COPY1:%[0-9]+]]:ccr_sgpr_64 = COPY [[COPY]] | ||||
; HSA: S_SETPC_B64_return [[COPY1]], implicit $vgpr0, implicit $vgpr1 | ; GCN: S_SETPC_B64_return [[COPY1]], implicit $vgpr0, implicit $vgpr1 | ||||
; PAL-LABEL: name: internal_other_pcrel | |||||
; PAL: bb.1 (%ir-block.0): | |||||
; PAL: liveins: $sgpr30_sgpr31 | |||||
; PAL: [[COPY:%[0-9]+]]:sgpr_64 = COPY $sgpr30_sgpr31 | |||||
; PAL: [[SI_PC_ADD_REL_OFFSET:%[0-9]+]]:sreg_64(p999) = SI_PC_ADD_REL_OFFSET target-flags(amdgpu-rel32-lo) @internal_other + 4, target-flags(amdgpu-rel32-hi) @internal_other + 4, implicit-def $scc | |||||
; PAL: [[UV:%[0-9]+]]:_(s32), [[UV1:%[0-9]+]]:_(s32) = G_UNMERGE_VALUES [[SI_PC_ADD_REL_OFFSET]](p999) | |||||
; PAL: $vgpr0 = COPY [[UV]](s32) | |||||
; PAL: $vgpr1 = COPY [[UV1]](s32) | |||||
; PAL: [[COPY1:%[0-9]+]]:ccr_sgpr_64 = COPY [[COPY]] | |||||
; PAL: S_SETPC_B64_return [[COPY1]], implicit $vgpr0, implicit $vgpr1 | |||||
ret i32 addrspace(999)* @internal_other | ret i32 addrspace(999)* @internal_other | ||||
} | } | ||||
define i32 addrspace(6)* @external_constant32_got() { | define i32 addrspace(6)* @external_constant32_got() { | ||||
; HSA-LABEL: name: external_constant32_got | ; GCN-LABEL: name: external_constant32_got | ||||
; HSA: bb.1 (%ir-block.0): | ; GCN: bb.1 (%ir-block.0): | ||||
; HSA: liveins: $sgpr30_sgpr31 | ; GCN: liveins: $sgpr30_sgpr31 | ||||
; HSA: [[COPY:%[0-9]+]]:sgpr_64 = COPY $sgpr30_sgpr31 | ; GCN: [[COPY:%[0-9]+]]:sgpr_64 = COPY $sgpr30_sgpr31 | ||||
; HSA: [[SI_PC_ADD_REL_OFFSET:%[0-9]+]]:sreg_64(p4) = SI_PC_ADD_REL_OFFSET target-flags(amdgpu-gotprel32-lo) @external_constant32 + 4, target-flags(amdgpu-gotprel32-hi) @external_constant32 + 4, implicit-def $scc | ; GCN: [[SI_PC_ADD_REL_OFFSET:%[0-9]+]]:sreg_64(p4) = SI_PC_ADD_REL_OFFSET target-flags(amdgpu-gotprel32-lo) @external_constant32 + 4, target-flags(amdgpu-gotprel32-hi) @external_constant32 + 4, implicit-def $scc | ||||
; HSA: [[LOAD:%[0-9]+]]:_(p4) = G_LOAD [[SI_PC_ADD_REL_OFFSET]](p4) :: (dereferenceable invariant load 8 from got, addrspace 4) | ; GCN: [[LOAD:%[0-9]+]]:_(p4) = G_LOAD [[SI_PC_ADD_REL_OFFSET]](p4) :: (dereferenceable invariant load 8 from got, addrspace 4) | ||||
; HSA: [[EXTRACT:%[0-9]+]]:_(p6) = G_EXTRACT [[LOAD]](p4), 0 | ; GCN: [[EXTRACT:%[0-9]+]]:_(p6) = G_EXTRACT [[LOAD]](p4), 0 | ||||
; HSA: $vgpr0 = COPY [[EXTRACT]](p6) | ; GCN: $vgpr0 = COPY [[EXTRACT]](p6) | ||||
; HSA: [[COPY1:%[0-9]+]]:ccr_sgpr_64 = COPY [[COPY]] | ; GCN: [[COPY1:%[0-9]+]]:ccr_sgpr_64 = COPY [[COPY]] | ||||
; HSA: S_SETPC_B64_return [[COPY1]], implicit $vgpr0 | ; GCN: S_SETPC_B64_return [[COPY1]], implicit $vgpr0 | ||||
; PAL-LABEL: name: external_constant32_got | |||||
; PAL: bb.1 (%ir-block.0): | |||||
; PAL: liveins: $sgpr30_sgpr31 | |||||
; PAL: [[COPY:%[0-9]+]]:sgpr_64 = COPY $sgpr30_sgpr31 | |||||
; PAL: [[SI_PC_ADD_REL_OFFSET:%[0-9]+]]:sreg_64(p4) = SI_PC_ADD_REL_OFFSET @external_constant32 + 4, 0, implicit-def $scc | |||||
; PAL: [[EXTRACT:%[0-9]+]]:_(p6) = G_EXTRACT [[SI_PC_ADD_REL_OFFSET]](p4), 0 | |||||
; PAL: $vgpr0 = COPY [[EXTRACT]](p6) | |||||
; PAL: [[COPY1:%[0-9]+]]:ccr_sgpr_64 = COPY [[COPY]] | |||||
; PAL: S_SETPC_B64_return [[COPY1]], implicit $vgpr0 | |||||
ret i32 addrspace(6)* @external_constant32 | ret i32 addrspace(6)* @external_constant32 | ||||
} | } | ||||
define i32 addrspace(6)* @internal_constant32_pcrel() { | define i32 addrspace(6)* @internal_constant32_pcrel() { | ||||
; HSA-LABEL: name: internal_constant32_pcrel | ; GCN-LABEL: name: internal_constant32_pcrel | ||||
; HSA: bb.1 (%ir-block.0): | ; GCN: bb.1 (%ir-block.0): | ||||
; HSA: liveins: $sgpr30_sgpr31 | ; GCN: liveins: $sgpr30_sgpr31 | ||||
; HSA: [[COPY:%[0-9]+]]:sgpr_64 = COPY $sgpr30_sgpr31 | ; GCN: [[COPY:%[0-9]+]]:sgpr_64 = COPY $sgpr30_sgpr31 | ||||
; HSA: [[SI_PC_ADD_REL_OFFSET:%[0-9]+]]:sreg_64(p4) = SI_PC_ADD_REL_OFFSET target-flags(amdgpu-rel32-lo) @internal_constant32 + 4, target-flags(amdgpu-rel32-hi) @internal_constant32 + 4, implicit-def $scc | ; GCN: [[SI_PC_ADD_REL_OFFSET:%[0-9]+]]:sreg_64(p4) = SI_PC_ADD_REL_OFFSET target-flags(amdgpu-rel32-lo) @internal_constant32 + 4, target-flags(amdgpu-rel32-hi) @internal_constant32 + 4, implicit-def $scc | ||||
; HSA: [[EXTRACT:%[0-9]+]]:_(p6) = G_EXTRACT [[SI_PC_ADD_REL_OFFSET]](p4), 0 | ; GCN: [[EXTRACT:%[0-9]+]]:_(p6) = G_EXTRACT [[SI_PC_ADD_REL_OFFSET]](p4), 0 | ||||
; HSA: $vgpr0 = COPY [[EXTRACT]](p6) | ; GCN: $vgpr0 = COPY [[EXTRACT]](p6) | ||||
; HSA: [[COPY1:%[0-9]+]]:ccr_sgpr_64 = COPY [[COPY]] | ; GCN: [[COPY1:%[0-9]+]]:ccr_sgpr_64 = COPY [[COPY]] | ||||
; HSA: S_SETPC_B64_return [[COPY1]], implicit $vgpr0 | ; GCN: S_SETPC_B64_return [[COPY1]], implicit $vgpr0 | ||||
; PAL-LABEL: name: internal_constant32_pcrel | |||||
; PAL: bb.1 (%ir-block.0): | |||||
; PAL: liveins: $sgpr30_sgpr31 | |||||
; PAL: [[COPY:%[0-9]+]]:sgpr_64 = COPY $sgpr30_sgpr31 | |||||
; PAL: [[SI_PC_ADD_REL_OFFSET:%[0-9]+]]:sreg_64(p4) = SI_PC_ADD_REL_OFFSET @internal_constant32 + 4, 0, implicit-def $scc | |||||
; PAL: [[EXTRACT:%[0-9]+]]:_(p6) = G_EXTRACT [[SI_PC_ADD_REL_OFFSET]](p4), 0 | |||||
; PAL: $vgpr0 = COPY [[EXTRACT]](p6) | |||||
; PAL: [[COPY1:%[0-9]+]]:ccr_sgpr_64 = COPY [[COPY]] | |||||
; PAL: S_SETPC_B64_return [[COPY1]], implicit $vgpr0 | |||||
ret i32 addrspace(6)* @internal_constant32 | ret i32 addrspace(6)* @internal_constant32 | ||||
} | } |