mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2024-11-22 18:54:02 +01:00
02f664086c
The addend in a REL32 reloc needs to be adjusted to account for the offset from the PC value returned by the s_getpc instruction to the point where the reloc is applied. This was being done correctly for (GOTPC)REL32_LO but not for (GOTPC)REL32_HI. This will only make a difference if the target symbol happens to get loaded almost exactly a multiple of 4G away from the relocated instructions. Differential Revision: https://reviews.llvm.org/D86938
24 lines
991 B
YAML
24 lines
991 B
YAML
# Checks how rel32 relocation addends are printed for a bundled
# s_getpc_b64 / s_add_u32 / s_addc_u32 sequence that materialises the address
# of @bar in vcc. Code generation is resumed after the livedebugvalues pass,
# so the MIR below is fed to the late pipeline as written.
#
# The low half carries addend +4 and the high half carries addend +12; both
# must show up unchanged on the matching instruction in the emitted assembly.
# Per the originating change description, each addend accounts for the offset
# from the PC value returned by s_getpc to the point where that relocation is
# applied.

# RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx900 -start-after=livedebugvalues -verify-machineinstrs -o - %s | FileCheck -check-prefix=GCN %s

# GCN-LABEL: foo:
# GCN: s_getpc_b64 vcc
# GCN: s_add_u32 vcc_lo, vcc_lo, bar@rel32@lo+4
# GCN: s_addc_u32 vcc_hi, vcc_hi, bar@rel32@hi+12

--- |
  ; Minimal IR module: it only supplies the kernel @foo that the machine
  ; function below is attached to, and the external symbol @bar that the
  ; relocations refer to.
  define amdgpu_kernel void @foo() {
    ret void
  }

  @bar = external protected local_unnamed_addr addrspace(4) externally_initialized global i32, align 4
---
name: foo
tracksRegLiveness: true
frameInfo:
  hasCalls: true
body: |
  bb.0:
    ; PC-relative address computation of @bar into vcc, kept together as one
    ; bundle. The "internal" operands read values defined inside the bundle.
    BUNDLE implicit-def $vcc, implicit-def $vcc_lo, implicit-def $vcc_lo_lo16, implicit-def $vcc_lo_hi16, implicit-def $vcc_hi, implicit-def $vcc_hi_lo16, implicit-def $vcc_hi_hi16, implicit-def $scc {
      $vcc = S_GETPC_B64
      $vcc_lo = S_ADD_U32 internal $vcc_lo, target-flags(amdgpu-rel32-lo) @bar + 4, implicit-def $scc
      $vcc_hi = S_ADDC_U32 internal $vcc_hi, target-flags(amdgpu-rel32-hi) @bar + 12, implicit-def $scc, implicit internal $scc
    }