Index: ELF/InputSection.h =================================================================== --- ELF/InputSection.h +++ ELF/InputSection.h @@ -46,6 +46,7 @@ R_PPC_OPD, R_PPC_PLT_OPD, R_PPC_TOC, + R_RELAX_GOT, R_RELAX_TLS_GD_TO_IE, R_RELAX_TLS_GD_TO_LE, R_RELAX_TLS_IE_TO_LE, @@ -63,7 +64,7 @@ return Expr == R_GOT || Expr == R_GOT_OFF || Expr == R_MIPS_GOT_LOCAL || Expr == R_MIPS_GOT_LOCAL_PAGE || Expr == R_GOT_PAGE_PC || Expr == R_GOT_PC || Expr == R_GOT_FROM_END || Expr == R_TLSGD || - Expr == R_TLSGD_PC; + Expr == R_TLSGD_PC || Expr == R_RELAX_GOT; } struct Relocation { Index: ELF/InputSection.cpp =================================================================== --- ELF/InputSection.cpp +++ ELF/InputSection.cpp @@ -249,6 +249,7 @@ return SymVA - P; } case R_PC: + case R_RELAX_GOT: return Body.getVA(A) - P; case R_PAGE_PC: return getAArch64Page(Body.getVA(A)) - getAArch64Page(P); @@ -323,6 +324,9 @@ } switch (Expr) { + case R_RELAX_GOT: + Target->relaxGot(BufLoc, SymVA); + break; case R_RELAX_TLS_IE_TO_LE: Target->relaxTlsIeToLe(BufLoc, Type, SymVA); break; Index: ELF/Target.h =================================================================== --- ELF/Target.h +++ ELF/Target.h @@ -88,10 +88,17 @@ uint32_t ThunkSize = 0; + virtual bool canRelaxGot(uint32_t Type, const SymbolBody &S, + const uint8_t *Data, uint64_t Offset) const; + virtual void relaxGot(uint8_t *Loc, uint64_t Val) const; + virtual void relaxTlsGdToIe(uint8_t *Loc, uint32_t Type, uint64_t Val) const; virtual void relaxTlsGdToLe(uint8_t *Loc, uint32_t Type, uint64_t Val) const; virtual void relaxTlsIeToLe(uint8_t *Loc, uint32_t Type, uint64_t Val) const; virtual void relaxTlsLdToLe(uint8_t *Loc, uint32_t Type, uint64_t Val) const; + +protected: + bool isRelaxable(const SymbolBody &S) const; }; uint64_t getPPC64TocBase(); Index: ELF/Target.cpp =================================================================== --- ELF/Target.cpp +++ ELF/Target.cpp @@ -113,6 +113,10 @@ int32_t Index, unsigned RelOff) 
const override; void relocateOne(uint8_t *Loc, uint32_t Type, uint64_t Val) const override; + bool canRelaxGot(uint32_t Type, const SymbolBody &S, const uint8_t *Data, + uint64_t Offset) const override; + void relaxGot(uint8_t *Loc, uint64_t Val) const override; + void relaxTlsGdToIe(uint8_t *Loc, uint32_t Type, uint64_t Val) const override; void relaxTlsGdToLe(uint8_t *Loc, uint32_t Type, uint64_t Val) const override; void relaxTlsIeToLe(uint8_t *Loc, uint32_t Type, uint64_t Val) const override; @@ -232,6 +236,23 @@ return false; } +bool TargetInfo::isRelaxable(const SymbolBody &S) const { + if (S.isUndefined() || S.isPreemptible()) + return false; + if (S.isGnuIFunc()) + return false; + return (S.getName() != "_DYNAMIC"); +} + +bool TargetInfo::canRelaxGot(uint32_t Type, const SymbolBody &S, + const uint8_t *Data, uint64_t Offset) const { + return false; +} + +void TargetInfo::relaxGot(uint8_t *Loc, uint64_t Val) const { + llvm_unreachable("Should not have claimed to be relaxable"); +} + void TargetInfo::relaxTlsGdToLe(uint8_t *Loc, uint32_t Type, uint64_t Val) const { llvm_unreachable("Should not have claimed to be relaxable"); @@ -727,6 +748,23 @@ } } +bool X86_64TargetInfo::canRelaxGot(uint32_t Type, const SymbolBody &S, + const uint8_t *Data, uint64_t Offset) const { + if (Type != R_X86_64_REX_GOTPCRELX && Type != R_X86_64_GOTPCRELX) + return false; + // Convert mov foo@GOTPCREL(%rip), %reg to lea foo(%rip), %reg. + if (Offset < 2 || Data[Offset - 2] != 0x8b) + return false; + return isRelaxable(S); +} + +void X86_64TargetInfo::relaxGot(uint8_t *Loc, uint64_t Val) const { + if (Val + 0x80000000 > 0xFFFFFFFF) + fatal("Relaxation overflow"); + Loc[-2] = 0x8d; + relocateOne(Loc, R_X86_64_PC32, Val); +} + // Relocation masks following the #lo(value), #hi(value), #ha(value), // #higher(value), #highera(value), #highest(value), and #highesta(value) // macros defined in section 4.5.1. 
Relocation Types of the PPC-elf64abi Index: ELF/Writer.cpp =================================================================== --- ELF/Writer.cpp +++ ELF/Writer.cpp @@ -70,7 +70,8 @@ void scanRelocs(InputSection &C); void scanRelocs(InputSectionBase &S, const Elf_Shdr &RelSec); RelExpr adjustExpr(const elf::ObjectFile &File, SymbolBody &S, - bool IsWrite, RelExpr Expr, uint32_t Type); + bool IsWrite, RelExpr Expr, uint32_t Type, + const uint8_t *Data, uintX_t Offset); template uintX_t computeAddend(const elf::ObjectFile &File, const uint8_t *SectionData, const RelTy *End, @@ -457,7 +458,7 @@ if (E == R_SIZE || E == R_GOT_FROM_END || E == R_GOT_OFF || E == R_MIPS_GOT_LOCAL || E == R_MIPS_GOT_LOCAL_PAGE || E == R_GOT_PAGE_PC || E == R_GOT_PC || E == R_PLT_PC || E == R_TLSGD_PC || - E == R_TLSGD || E == R_PPC_PLT_OPD) + E == R_TLSGD || E == R_PPC_PLT_OPD || E == R_RELAX_GOT) return true; // These never do, except if the entire file is position dependent or if @@ -520,7 +521,8 @@ template RelExpr Writer::adjustExpr(const elf::ObjectFile &File, SymbolBody &Body, bool IsWrite, RelExpr Expr, - uint32_t Type) { + uint32_t Type, const uint8_t *Data, + uintX_t Offset) { if (Target->needsThunk(Type, File, Body)) return R_THUNK; bool Preemptible = Body.isPreemptible(); @@ -529,6 +531,9 @@ else if (needsPlt(Expr) && !Preemptible) Expr = fromPlt(Expr); + if (Target->canRelaxGot(Type, Body, Data, Offset)) + return R_RELAX_GOT; + if (IsWrite || isStaticLinkTimeConstant(Expr, Type, Body)) return Expr; @@ -655,7 +660,8 @@ continue; bool Preemptible = Body.isPreemptible(); - Expr = adjustExpr(File, Body, IsWrite, Expr, Type); + Expr = adjustExpr(File, Body, IsWrite, Expr, Type, + C.getSectionData().data(), Offset); if (HasError) continue; @@ -740,6 +746,8 @@ } if (refersToGotEntry(Expr)) { + if (Expr == R_RELAX_GOT) + continue; if (Body.isInGot()) continue; Out::Got->addEntry(Body); Index: test/ELF/Inputs/gotpc-relax-und-dso.s 
=================================================================== --- test/ELF/Inputs/gotpc-relax-und-dso.s +++ test/ELF/Inputs/gotpc-relax-und-dso.s @@ -0,0 +1,4 @@ +.globl dsofoo +.type dsofoo, @function +dsofoo: + nop Index: test/ELF/gotpc-relax-und-dso.s =================================================================== --- test/ELF/gotpc-relax-und-dso.s +++ test/ELF/gotpc-relax-und-dso.s @@ -0,0 +1,82 @@ +# REQUIRES: x86 +# RUN: llvm-mc -filetype=obj -relax-relocations -triple=x86_64-unknown-linux %s -o %t.o +# RUN: llvm-mc -filetype=obj -relax-relocations -triple=x86_64-pc-linux %S/Inputs/gotpc-relax-und-dso.s -o %tdso.o +# RUN: ld.lld -shared %tdso.o -o %t.so +# RUN: ld.lld -shared %t.o %t.so -o %tout +# RUN: llvm-readobj -r -s %tout | FileCheck --check-prefix=RELOC %s +# RUN: llvm-objdump -d %tout | FileCheck --check-prefix=DISASM %s + +# RELOC: Relocations [ +# RELOC-NEXT: Section ({{.*}}) .rela.dyn { +# RELOC-NEXT: 0x20B8 R_X86_64_RELATIVE - 0x2000 +# RELOC-NEXT: 0x20A8 R_X86_64_GLOB_DAT dsofoo 0x0 +# RELOC-NEXT: 0x20B0 R_X86_64_GLOB_DAT foo 0x0 +# RELOC-NEXT: 0x20A0 R_X86_64_GLOB_DAT und 0x0 +# RELOC-NEXT: } +# RELOC-NEXT: ] + +# 0x101e + 7 - 36 = 0x1001 +# 0x1025 + 7 - 43 = 0x1001 +# DISASM: Disassembly of section .text: +# DISASM-NEXT: foo: +# DISASM-NEXT: 1000: 90 nop +# DISASM: hid: +# DISASM-NEXT: 1001: 90 nop +# DISASM: _start: +# DISASM-NEXT: 1002: 48 8b 05 97 10 00 00 movq 4247(%rip), %rax +# DISASM-NEXT: 1009: 48 8b 05 90 10 00 00 movq 4240(%rip), %rax +# DISASM-NEXT: 1010: 48 8b 05 91 10 00 00 movq 4241(%rip), %rax +# DISASM-NEXT: 1017: 48 8b 05 8a 10 00 00 movq 4234(%rip), %rax +# DISASM-NEXT: 101e: 48 8d 05 dc ff ff ff leaq -36(%rip), %rax +# DISASM-NEXT: 1025: 48 8d 05 d5 ff ff ff leaq -43(%rip), %rax +# DISASM-NEXT: 102c: 48 8b 05 7d 10 00 00 movq 4221(%rip), %rax +# DISASM-NEXT: 1033: 48 8b 05 76 10 00 00 movq 4214(%rip), %rax +# DISASM-NEXT: 103a: 48 8b 05 77 10 00 00 movq 4215(%rip), %rax +# DISASM-NEXT: 1041: 48 8b 05 70 10 00 00 
movq 4208(%rip), %rax +# DISASM-NEXT: 1048: 8b 05 52 10 00 00 movl 4178(%rip), %eax +# DISASM-NEXT: 104e: 8b 05 4c 10 00 00 movl 4172(%rip), %eax +# DISASM-NEXT: 1054: 8b 05 4e 10 00 00 movl 4174(%rip), %eax +# DISASM-NEXT: 105a: 8b 05 48 10 00 00 movl 4168(%rip), %eax +# DISASM-NEXT: 1060: 8d 05 9b ff ff ff leal -101(%rip), %eax +# DISASM-NEXT: 1066: 8d 05 95 ff ff ff leal -107(%rip), %eax +# DISASM-NEXT: 106c: 8b 05 3e 10 00 00 movl 4158(%rip), %eax +# DISASM-NEXT: 1072: 8b 05 38 10 00 00 movl 4152(%rip), %eax +# DISASM-NEXT: 1078: 8b 05 3a 10 00 00 movl 4154(%rip), %eax +# DISASM-NEXT: 107e: 8b 05 34 10 00 00 movl 4148(%rip), %eax + +.text +.globl foo +.type foo, @function +foo: + nop + +.globl hid +.hidden hid +.type hid, @function +hid: + nop + +.globl _start +.type _start, @function +_start: + movq und@GOTPCREL(%rip), %rax + movq und@GOTPCREL(%rip), %rax + movq dsofoo@GOTPCREL(%rip), %rax + movq dsofoo@GOTPCREL(%rip), %rax + movq hid@GOTPCREL(%rip), %rax + movq hid@GOTPCREL(%rip), %rax + movq foo@GOTPCREL(%rip), %rax + movq foo@GOTPCREL(%rip), %rax + movq _DYNAMIC@GOTPCREL(%rip), %rax + movq _DYNAMIC@GOTPCREL(%rip), %rax + + movl und@GOTPCREL(%rip), %eax + movl und@GOTPCREL(%rip), %eax + movl dsofoo@GOTPCREL(%rip), %eax + movl dsofoo@GOTPCREL(%rip), %eax + movl hid@GOTPCREL(%rip), %eax + movl hid@GOTPCREL(%rip), %eax + movl foo@GOTPCREL(%rip), %eax + movl foo@GOTPCREL(%rip), %eax + movl _DYNAMIC@GOTPCREL(%rip), %eax + movl _DYNAMIC@GOTPCREL(%rip), %eax Index: test/ELF/gotpc-relax.s =================================================================== --- test/ELF/gotpc-relax.s +++ test/ELF/gotpc-relax.s @@ -0,0 +1,69 @@ +# REQUIRES: x86 +# RUN: llvm-mc -filetype=obj -relax-relocations -triple=x86_64-unknown-linux %s -o %t.o +# RUN: ld.lld %t.o -o %t1 +# RUN: llvm-readobj -r %t1 | FileCheck --check-prefix=RELOC %s +# RUN: llvm-objdump -d %t1 | FileCheck --check-prefix=DISASM %s + +## There are no relocations. 
+# RELOC: Relocations [ +# RELOC: ] + +# 0x11003 + 7 - 10 = 0x11000 +# 0x1100a + 7 - 17 = 0x11000 +# 0x11011 + 7 - 23 = 0x11001 +# 0x11018 + 7 - 30 = 0x11001 +# DISASM: Disassembly of section .text: +# DISASM-NEXT: foo: +# DISASM-NEXT: 11000: 90 nop +# DISASM: hid: +# DISASM-NEXT: 11001: 90 nop +# DISASM: ifunc: +# DISASM-NEXT: 11002: c3 retq +# DISASM: _start: +# DISASM-NEXT: 11003: 48 8d 05 f6 ff ff ff leaq -10(%rip), %rax +# DISASM-NEXT: 1100a: 48 8d 05 ef ff ff ff leaq -17(%rip), %rax +# DISASM-NEXT: 11011: 48 8d 05 e9 ff ff ff leaq -23(%rip), %rax +# DISASM-NEXT: 11018: 48 8d 05 e2 ff ff ff leaq -30(%rip), %rax +# DISASM-NEXT: 1101f: 48 8b 05 da 0f 00 00 movq 4058(%rip), %rax +# DISASM-NEXT: 11026: 48 8b 05 d3 0f 00 00 movq 4051(%rip), %rax +# DISASM-NEXT: 1102d: 8d 05 cd ff ff ff leal -51(%rip), %eax +# DISASM-NEXT: 11033: 8d 05 c7 ff ff ff leal -57(%rip), %eax +# DISASM-NEXT: 11039: 8d 05 c2 ff ff ff leal -62(%rip), %eax +# DISASM-NEXT: 1103f: 8d 05 bc ff ff ff leal -68(%rip), %eax +# DISASM-NEXT: 11045: 8b 05 b5 0f 00 00 movl 4021(%rip), %eax +# DISASM-NEXT: 1104b: 8b 05 af 0f 00 00 movl 4015(%rip), %eax + +.text +.globl foo +.type foo, @function +foo: + nop + +.globl hid +.hidden hid +.type hid, @function +hid: + nop + +.text +.type ifunc STT_GNU_IFUNC +.globl ifunc +.type ifunc, @function +ifunc: + ret + +.globl _start +.type _start, @function +_start: + movq foo@GOTPCREL(%rip), %rax + movq foo@GOTPCREL(%rip), %rax + movq hid@GOTPCREL(%rip), %rax + movq hid@GOTPCREL(%rip), %rax + movq ifunc@GOTPCREL(%rip), %rax + movq ifunc@GOTPCREL(%rip), %rax + movl foo@GOTPCREL(%rip), %eax + movl foo@GOTPCREL(%rip), %eax + movl hid@GOTPCREL(%rip), %eax + movl hid@GOTPCREL(%rip), %eax + movl ifunc@GOTPCREL(%rip), %eax + movl ifunc@GOTPCREL(%rip), %eax