//===- LinkerScript.h -------------------------------------------*- C++ -*-===// // // The LLVM Linker // // This file is distributed under the University of Illinois Open Source // License. See LICENSE.TXT for details. // //===----------------------------------------------------------------------===// #ifndef LLD_ELF_LINKER_SCRIPT_H #define LLD_ELF_LINKER_SCRIPT_H #include "Config.h" #include "Strings.h" #include "Writer.h" #include "lld/Core/LLVM.h" #include "llvm/ADT/DenseMap.h" #include "llvm/ADT/DenseSet.h" #include "llvm/ADT/MapVector.h" #include "llvm/Support/Allocator.h" #include "llvm/Support/MemoryBuffer.h" #include "llvm/Support/Regex.h" #include namespace lld { namespace elf { class DefinedCommon; class ScriptParser; class SymbolBody; template class InputSectionBase; template class InputSection; template class OutputSectionBase; template class OutputSectionFactory; class InputSectionData; // This represents an expression in the linker script. // ScriptParser::readExpr reads an expression and returns an Expr. // Later, we evaluate the expression by calling the function // with the value of special context variable ".". typedef std::function Expr; // Parses a linker script. Calling this function updates // Config and ScriptConfig. void readLinkerScript(MemoryBufferRef MB); // Parses a version script. void readVersionScript(MemoryBufferRef MB); // This enum is used to implement linker script SECTIONS command. // https://sourceware.org/binutils/docs/ld/SECTIONS.html#SECTIONS enum SectionsCommandKind { AssignmentKind, // . = expr or = expr OutputSectionKind, InputSectionKind, AssertKind, // ASSERT(expr) BytesDataKind // BYTE(expr), SHORT(expr), LONG(expr) or QUAD(expr) }; struct BaseCommand { BaseCommand(int K) : Kind(K) {} virtual ~BaseCommand() {} int Kind; }; // This represents ". = " or " = ". struct SymbolAssignment : BaseCommand { SymbolAssignment(StringRef Name, Expr E, bool IsAbsolute) : BaseCommand(AssignmentKind), Name(Name), Expression(E), IsAbsolute(IsAbsolute) {} static bool classof(const BaseCommand *C); // The LHS of an expression. Name is either a symbol name or ".". StringRef Name; SymbolBody *Sym = nullptr; // The RHS of an expression. Expr Expression; // Command attributes for PROVIDE, HIDDEN and PROVIDE_HIDDEN. bool Provide = false; bool Hidden = false; bool IsAbsolute; }; // Linker scripts allow additional constraints to be put on ouput sections. // If an output section is marked as ONLY_IF_RO, the section is created // only if its input sections are read-only. Likewise, an output section // with ONLY_IF_RW is created if all input sections are RW. enum class ConstraintKind { NoConstraint, ReadOnly, ReadWrite }; struct OutputSectionCommand : BaseCommand { OutputSectionCommand(StringRef Name) : BaseCommand(OutputSectionKind), Name(Name) {} static bool classof(const BaseCommand *C); StringRef Name; Expr AddrExpr; Expr AlignExpr; Expr LMAExpr; Expr SubalignExpr; std::vector> Commands; std::vector Phdrs; std::vector Filler; ConstraintKind Constraint = ConstraintKind::NoConstraint; }; // This struct represents one section match pattern in SECTIONS() command. // It can optionally have negative match pattern for EXCLUDED_FILE command. // Also it may be surrounded with SORT() command, so contains sorting rules. struct SectionPattern { SectionPattern(llvm::Regex &&Re1, llvm::Regex &&Re2) : ExcludedFileRe(std::forward(Re1)), SectionRe(std::forward(Re2)) {} SectionPattern(SectionPattern &&Other) { std::swap(ExcludedFileRe, Other.ExcludedFileRe); std::swap(SectionRe, Other.SectionRe); std::swap(SortOuter, Other.SortOuter); std::swap(SortInner, Other.SortInner); } llvm::Regex ExcludedFileRe; llvm::Regex SectionRe; SortSectionPolicy SortOuter; SortSectionPolicy SortInner; }; struct InputSectionDescription : BaseCommand { InputSectionDescription(StringRef FilePattern) : BaseCommand(InputSectionKind), FileRe(compileGlobPatterns({FilePattern})) {} static bool classof(const BaseCommand *C); llvm::Regex FileRe; // Input sections that matches at least one of SectionPatterns // will be associated with this InputSectionDescription. std::vector SectionPatterns; std::vector Sections; }; // Represents an ASSERT(). struct AssertCommand : BaseCommand { AssertCommand(Expr E) : BaseCommand(AssertKind), Expression(E) {} static bool classof(const BaseCommand *C); Expr Expression; }; // Represents BYTE(), SHORT(), LONG(), or QUAD(). struct BytesDataCommand : BaseCommand { BytesDataCommand(uint64_t Data, unsigned Size) : BaseCommand(BytesDataKind), Data(Data), Size(Size) {} static bool classof(const BaseCommand *C); uint64_t Data; unsigned Offset; unsigned Size; }; struct PhdrsCommand { StringRef Name; unsigned Type; bool HasFilehdr; bool HasPhdrs; unsigned Flags; Expr LMAExpr; }; class LinkerScriptBase { protected: ~LinkerScriptBase() = default; public: virtual uint64_t getOutputSectionAddress(StringRef Name) = 0; virtual uint64_t getOutputSectionSize(StringRef Name) = 0; virtual uint64_t getOutputSectionAlign(StringRef Name) = 0; virtual uint64_t getOutputSectionLMA(StringRef Name) = 0; virtual uint64_t getHeaderSize() = 0; virtual uint64_t getSymbolValue(StringRef S) = 0; virtual bool isDefined(StringRef S) = 0; }; // ScriptConfiguration holds linker script parse results. struct ScriptConfiguration { // Used to assign addresses to sections. std::vector> Commands; // Used to assign sections to headers. std::vector PhdrsCommands; bool HasSections = false; llvm::BumpPtrAllocator Alloc; // List of section patterns specified with KEEP commands. They will // be kept even if they are unused and --gc-sections is specified. std::vector KeptSections; }; extern ScriptConfiguration *ScriptConfig; // This is a runner of the linker script. template class LinkerScript final : public LinkerScriptBase { typedef typename ELFT::uint uintX_t; public: LinkerScript(); ~LinkerScript(); void processCommands(OutputSectionFactory &Factory); void createSections(OutputSectionFactory &Factory); void adjustSectionsBeforeSorting(); std::vector> createPhdrs(); bool ignoreInterpSection(); ArrayRef getFiller(StringRef Name); void writeDataBytes(StringRef Name, uint8_t *Buf); bool hasLMA(StringRef Name); bool shouldKeep(InputSectionBase *S); void assignOffsets(OutputSectionCommand *Cmd); void assignAddresses(std::vector> &Phdrs); bool hasPhdrsCommands(); uint64_t getOutputSectionAddress(StringRef Name) override; uint64_t getOutputSectionSize(StringRef Name) override; uint64_t getOutputSectionAlign(StringRef Name) override; uint64_t getOutputSectionLMA(StringRef Name) override; uint64_t getHeaderSize() override; uint64_t getSymbolValue(StringRef S) override; bool isDefined(StringRef S) override; std::vector *> *OutputSections; int getSectionIndex(StringRef Name); private: void computeInputSections(InputSectionDescription *); void addSection(OutputSectionFactory &Factory, InputSectionBase *Sec, StringRef Name); void discard(ArrayRef *> V); std::vector *> createInputSectionList(OutputSectionCommand &Cmd); // "ScriptConfig" is a bit too long, so define a short name for it. ScriptConfiguration &Opt = *ScriptConfig; std::vector getPhdrIndices(StringRef SectionName); size_t getPhdrIndex(StringRef PhdrName); uintX_t Dot; uintX_t LMAOffset = 0; OutputSectionBase *CurOutSec = nullptr; uintX_t ThreadBssOffset = 0; void switchTo(OutputSectionBase *Sec); void flush(); void output(InputSection *Sec); void process(BaseCommand &Base); llvm::DenseSet *> AlreadyOutputOS; llvm::DenseSet AlreadyOutputIS; }; // Variable template is a C++14 feature, so we can't template // a global variable. Use a struct to workaround. template struct Script { static LinkerScript *X; }; template LinkerScript *Script::X; extern LinkerScriptBase *ScriptBase; } // namespace elf } // namespace lld #endif