Index: ELF/Symbols.h =================================================================== --- ELF/Symbols.h +++ ELF/Symbols.h @@ -335,6 +335,12 @@ // output file's symbol table. It has weak binding and can be substituted. static Elf_Sym Ignored; + // The content for _etext and etext symbols. + static Elf_Sym Etext; + + // The content for _edata and edata symbols. + static Elf_Sym Edata; + // The content for _end and end symbols. static Elf_Sym End; @@ -348,6 +354,8 @@ }; template typename ElfSym::Elf_Sym ElfSym::Ignored; +template typename ElfSym::Elf_Sym ElfSym::Etext; +template typename ElfSym::Elf_Sym ElfSym::Edata; template typename ElfSym::Elf_Sym ElfSym::End; template typename ElfSym::Elf_Sym ElfSym::MipsGp; template Index: ELF/Symbols.cpp =================================================================== --- ELF/Symbols.cpp +++ ELF/Symbols.cpp @@ -213,6 +213,8 @@ } template static void doInitSymbols() { + ElfSym::Etext.setBinding(STB_GLOBAL); + ElfSym::Edata.setBinding(STB_GLOBAL); ElfSym::End.setBinding(STB_GLOBAL); ElfSym::Ignored.setBinding(STB_WEAK); ElfSym::Ignored.setVisibility(STV_HIDDEN); Index: ELF/Writer.cpp =================================================================== --- ELF/Writer.cpp +++ ELF/Writer.cpp @@ -903,20 +903,27 @@ if (!isOutputDynamic()) Symtab.addIgnored("__tls_get_addr"); + auto defineWithAlias = [this](StringRef Name, StringRef Alias, Elf_Sym &Sym) { + if (Symtab.find(Name)) + Symtab.addAbsolute(Name, Sym); + if (SymbolBody *B = Symtab.find(Alias)) + if (B->isUndefined()) + Symtab.addAbsolute(Alias, Sym); + }; + // If the "_end" symbol is referenced, it is expected to point to the address // right after the data segment. Usually, this symbol points to the end // of .bss section or to the end of .data section if .bss section is absent. // We don't know the final address of _end yet, so just add a symbol here, // and fix ElfSym::End.st_value later. - if (Symtab.find("_end")) - Symtab.addAbsolute("_end", ElfSym::End); - // Define "end" as an alias to "_end" if it is used but not defined. // We don't want to define that unconditionally because we don't want to // break programs that uses "end" as a regular symbol. - if (SymbolBody *B = Symtab.find("end")) - if (B->isUndefined()) - Symtab.addAbsolute("end", ElfSym::End); + defineWithAlias("_end", "end", ElfSym::End); + + // _etext and _edata are very similar to _end. + defineWithAlias("_etext", "etext", ElfSym::Etext); + defineWithAlias("_edata", "edata", ElfSym::Edata); } // Sort input sections by section name suffixes for @@ -1347,10 +1354,11 @@ if (PageAlign.count(Sec)) Align = std::max(Align, Target->PageSize); - if (Sec->getType() != SHT_NOBITS) + const bool HasBits = Sec->getType() != SHT_NOBITS; + if (HasBits) FileOff = alignTo(FileOff, Align); Sec->setFileOffset(FileOff); - if (Sec->getType() != SHT_NOBITS) + if (HasBits) FileOff += Sec->getSize(); // We only assign VAs to allocated sections. @@ -1364,6 +1372,14 @@ Sec->setVA(TVA); ThreadBssOffset = TVA - VA + Sec->getSize(); } + + const bool Alloc = Sec->getFlags() & SHF_ALLOC; + // _etext points to location after the last read-only loadable segment. + // _edata points to the end of the last non SHT_NOBITS section. + if (Alloc && !(Sec->getFlags() & SHF_WRITE)) + ElfSym::Etext.st_value = VA; + if (Alloc && HasBits) + ElfSym::Edata.st_value = VA; } // Add space for section headers. Index: test/ELF/edata-etext.s =================================================================== --- test/ELF/edata-etext.s +++ test/ELF/edata-etext.s @@ -0,0 +1,117 @@ +# REQUIRES: x86 +# RUN: llvm-mc -filetype=obj -triple=x86_64-pc-linux %s -o %t.o +# RUN: ld.lld %t.o -o %t +# RUN: llvm-readobj -sections -symbols %t | FileCheck %s + +## This checks that: +## 1) Address of _etext is the first location after the last read-only loadable segment. +## 2) Address of _edata points to the end of the last non SHT_NOBITS section. +## That is how gold/bfd do. At the same time specs says: "If the address of _edata is +## greater than the address of _etext, the address of _end is same as the address +## of _edata." (https://docs.oracle.com/cd/E53394_01/html/E54766/u-etext-3c.html). +## 3) Address of _end is different from _edata because of 2. +# CHECK: Section { +# CHECK: Index: 1 +# CHECK: Name: .text +# CHECK-NEXT: Type: SHT_PROGBITS +# CHECK-NEXT: Flags [ +# CHECK-NEXT: SHF_ALLOC +# CHECK-NEXT: SHF_EXECINSTR +# CHECK-NEXT: ] +# CHECK-NEXT: Address: 0x11000 +# CHECK-NEXT: Offset: 0x1000 +# CHECK-NEXT: Size: 1 +# CHECK-NEXT: Link: +# CHECK-NEXT: Info: +# CHECK-NEXT: AddressAlignment: +# CHECK-NEXT: EntrySize: 0 +# CHECK-NEXT: } +# CHECK-NEXT: Section { +# CHECK-NEXT: Index: 2 +# CHECK-NEXT: Name: .data +# CHECK-NEXT: Type: SHT_PROGBITS +# CHECK-NEXT: Flags [ +# CHECK-NEXT: SHF_ALLOC +# CHECK-NEXT: SHF_WRITE +# CHECK-NEXT: ] +# CHECK-NEXT: Address: 0x12000 +# CHECK-NEXT: Offset: 0x2000 +# CHECK-NEXT: Size: 2 +# CHECK-NEXT: Link: +# CHECK-NEXT: Info: +# CHECK-NEXT: AddressAlignment: +# CHECK-NEXT: EntrySize: +# CHECK-NEXT: } +# CHECK-NEXT: Section { +# CHECK-NEXT: Index: 3 +# CHECK-NEXT: Name: .bss +# CHECK-NEXT: Type: SHT_NOBITS +# CHECK-NEXT: Flags [ +# CHECK-NEXT: SHF_ALLOC +# CHECK-NEXT: SHF_WRITE +# CHECK-NEXT: ] +# CHECK-NEXT: Address: 0x12004 +# CHECK-NEXT: Offset: 0x2002 +# CHECK-NEXT: Size: 6 +# CHECK-NEXT: Link: +# CHECK-NEXT: Info: +# CHECK-NEXT: AddressAlignment: +# CHECK-NEXT: EntrySize: +# CHECK-NEXT: } +# CHECK: Symbols [ +# CHECK-NEXT: Symbol { +# CHECK-NEXT: Name: +# CHECK-NEXT: Value: 0x0 +# CHECK-NEXT: Size: 0 +# CHECK-NEXT: Binding: Local +# CHECK-NEXT: Type: None +# CHECK-NEXT: Other: 0 +# CHECK-NEXT: Section: Undefined +# CHECK-NEXT: } +# CHECK-NEXT: Symbol { +# CHECK-NEXT: Name: _start +# CHECK-NEXT: Value: 0x11000 +# CHECK-NEXT: Size: 0 +# CHECK-NEXT: Binding: Global +# CHECK-NEXT: Type: None +# CHECK-NEXT: Other: 0 +# CHECK-NEXT: Section: .text +# CHECK-NEXT: } +# CHECK-NEXT: Symbol { +# CHECK-NEXT: Name: _edata +# CHECK-NEXT: Value: 0x12002 +# CHECK-NEXT: Size: 0 +# CHECK-NEXT: Binding: Global +# CHECK-NEXT: Type: None +# CHECK-NEXT: Other: 0 +# CHECK-NEXT: Section: Absolute +# CHECK-NEXT: } +# CHECK-NEXT: Symbol { +# CHECK-NEXT: Name: _end +# CHECK-NEXT: Value: 0x1200A +# CHECK-NEXT: Size: 0 +# CHECK-NEXT: Binding: Global +# CHECK-NEXT: Type: None +# CHECK-NEXT: Other: 0 +# CHECK-NEXT: Section: Absolute +# CHECK-NEXT: } +# CHECK-NEXT: Symbol { +# CHECK-NEXT: Name: _etext +# CHECK-NEXT: Value: 0x11001 +# CHECK-NEXT: Size: 0 +# CHECK-NEXT: Binding: Global +# CHECK-NEXT: Type: None +# CHECK-NEXT: Other: 0 +# CHECK-NEXT: Section: Absolute +# CHECK-NEXT: } +# CHECK-NEXT: ] + +.global _start,_end,_etext,_edata +.text +_start: + nop +.data + .word 1 +.bss + .align 4 + .space 6