// Mirror of https://github.com/rui314/mold.git (synced 2025-01-07 18:02:15 +03:00).
// Listing metadata: 1335 lines, 29 KiB, C++.
#pragma once
|
|
|
|
#ifndef _GNU_SOURCE
|
|
#define _GNU_SOURCE
|
|
#endif
|
|
|
|
#include "elf.h"

#include <algorithm>
#include <atomic>
#include <cassert>
#include <cstdint>
#include <cstring>
#include <functional>
#include <iostream>
#include <map>
#include <mutex>
#include <set>
#include <span>
#include <sstream>
#include <string>
#include <string_view>
#include <tbb/concurrent_hash_map.h>
#include <tbb/enumerable_thread_specific.h>
#include <tbb/spin_mutex.h>
#include <tuple>
#include <unistd.h>
#include <unordered_map>
#include <utility>
#include <vector>
|
|
|
|
// Fixed-width integer aliases used throughout this header. They are declared
// ahead of the constants below so that the constants do not depend on some
// other header having introduced `i64` first.
typedef uint8_t u8;
typedef uint16_t u16;
typedef uint32_t u32;
typedef uint64_t u64;

typedef int8_t i8;
typedef int16_t i16;
typedef int32_t i32;
typedef int64_t i64;

// Size constants, in bytes. GOT_SIZE and PLT_SIZE are the per-entry strides
// used by the Symbol::get_*_addr() helpers further down in this file.
static constexpr i64 SECTOR_SIZE = 512;
static constexpr i64 PAGE_SIZE = 4096;
static constexpr i64 GOT_SIZE = 8;
static constexpr i64 PLT_SIZE = 16;
static constexpr i64 SHA256_SIZE = 32;
|
|
|
|
class InputChunk;
|
|
class InputFile;
|
|
class InputSection;
|
|
class MergeableSection;
|
|
class MergedSection;
|
|
class ObjectFile;
|
|
class OutputChunk;
|
|
class OutputSection;
|
|
class SharedFile;
|
|
class Symbol;
|
|
|
|
// Kinds of build ID; Config::build_id defaults to NONE.
enum class BuildIdKind : u8 { NONE, MD5, SHA1, SHA256, UUID };

// Process-wide option set. Each field carries its default as an in-class
// initializer; the single shared instance is `config`, defined right after
// the struct.
struct Config {
  BuildIdKind build_id{BuildIdKind::NONE};

  // Boolean switches.
  bool allow_multiple_definition{false};
  bool discard_all{false};
  bool discard_locals{false};
  bool eh_frame_hdr{true};
  bool export_dynamic{false};
  bool fork{true};
  bool gc_sections{false};
  bool hash_style_gnu{false};
  bool hash_style_sysv{true};
  bool icf{false};
  bool is_static{false};
  bool perf{false};
  bool pie{false};
  bool preload{false};
  bool print_gc_sections{false};
  bool print_icf_sections{false};
  bool print_map{false};
  bool quick_exit{true};
  bool relax{true};
  bool stat{false};
  bool strip_all{false};
  bool trace{false};
  bool z_now{false};

  // Numeric options; -1 is the initial value for both.
  i64 filler{-1};
  i64 thread_count{-1};

  // String options.
  std::string dynamic_linker{"/lib64/ld-linux-x86-64.so.2"};
  std::string entry{"_start"};
  std::string output;
  std::string rpaths;
  std::string sysroot;

  // List options. The string_view lists do not own their character data.
  std::vector<std::string> globals;
  std::vector<std::string_view> library_paths;
  std::vector<std::string_view> trace_symbol;
  std::vector<std::string_view> version_script;

  u64 image_base{0x200000};
};

inline Config config;
|
|
|
|
void cleanup();
|
|
|
|
// Collects streamed values in a private buffer and writes them, followed by
// a newline, to the target stream when the object is destroyed. The final
// write is done while holding a function-local static mutex.
class SyncOut {
public:
  SyncOut(std::ostream &out = std::cout) : out(out) {}

  ~SyncOut() {
    const std::string line = ss.str();
    static std::mutex mu;
    std::lock_guard<std::mutex> guard(mu);
    out << line << "\n";
  }

  // Appends `val` to the pending message.
  template <class T> SyncOut &operator<<(T &&val) {
    ss << std::forward<T>(val);
    return *this;
  }

private:
  std::ostream &out;
  std::stringstream ss;
};
|
|
|
|
class Error {
|
|
public:
|
|
Error() {
|
|
has_error = true;
|
|
}
|
|
|
|
template <class T> Error &operator<<(T &&val) {
|
|
out << std::forward<T>(val);
|
|
return *this;
|
|
}
|
|
|
|
static void checkpoint() {
|
|
if (!has_error)
|
|
return;
|
|
cleanup();
|
|
_exit(1);
|
|
}
|
|
|
|
private:
|
|
static inline std::atomic_bool has_error = false;
|
|
SyncOut out{std::cerr};
|
|
};
|
|
|
|
class Fatal {
|
|
public:
|
|
[[noreturn]] ~Fatal() {
|
|
out.~SyncOut();
|
|
cleanup();
|
|
_exit(1);
|
|
}
|
|
|
|
template <class T> Fatal &operator<<(T &&val) {
|
|
out << std::forward<T>(val);
|
|
return *this;
|
|
}
|
|
|
|
private:
|
|
SyncOut out{std::cerr};
|
|
};
|
|
|
|
// Reports an internal error through Fatal, naming the source file and line
// of the macro expansion.
#define unreachable()                                                    \
  do {                                                                   \
    Fatal() << "internal error at " << __FILE__ << ":" << __LINE__;      \
  } while (0)
|
|
|
|
std::ostream &operator<<(std::ostream &out, const InputFile &file);
|
|
|
|
//
|
|
// Interned string
|
|
//
|
|
|
|
namespace tbb {
|
|
template<> struct tbb_hash_compare<std::string_view> {
|
|
static size_t hash(const std::string_view &k) {
|
|
return std::hash<std::string_view>()(k);
|
|
}
|
|
|
|
static bool equal(const std::string_view &k1, const std::string_view &k2) {
|
|
return k1 == k2;
|
|
}
|
|
};
|
|
}
|
|
|
|
template<typename ValueT> class ConcurrentMap {
|
|
public:
|
|
ValueT *insert(std::string_view key, const ValueT &val) {
|
|
typename decltype(map)::const_accessor acc;
|
|
map.insert(acc, std::make_pair(key, val));
|
|
return const_cast<ValueT *>(&acc->second);
|
|
}
|
|
|
|
tbb::concurrent_hash_map<std::string_view, ValueT> map;
|
|
};
|
|
|
|
//
|
|
// Symbol
|
|
//
|
|
|
|
struct SectionFragment {
|
|
SectionFragment(std::string_view data) : data(data) {}
|
|
|
|
SectionFragment(const SectionFragment &other)
|
|
: isec(other.isec.load()), data(other.data), offset(other.offset) {}
|
|
|
|
inline u64 get_addr() const;
|
|
|
|
std::atomic<MergeableSection *> isec = nullptr;
|
|
std::string_view data;
|
|
u32 offset = -1;
|
|
u16 alignment = 1;
|
|
std::atomic_bool is_alive = !config.gc_sections;
|
|
};
|
|
|
|
struct SectionFragmentRef {
|
|
SectionFragment *frag = nullptr;
|
|
i32 addend = 0;
|
|
};
|
|
|
|
// Lookup key for a section fragment: the fragment bytes plus an alignment.
// Plain aggregate, initialized as SectionFragmentKey{data, alignment}.
struct SectionFragmentKey {
  std::string_view data;
  u32 alignment;
};
|
|
|
|
namespace tbb {
|
|
template<> struct tbb_hash_compare<SectionFragmentKey> {
|
|
static size_t hash(const SectionFragmentKey &k) {
|
|
return std::hash<std::string_view>()(k.data) ^ std::hash<u32>()(k.alignment);
|
|
}
|
|
|
|
static bool equal(const SectionFragmentKey &k1, const SectionFragmentKey &k2) {
|
|
return k1.data == k2.data && k1.alignment == k2.alignment;
|
|
}
|
|
};
|
|
}
|
|
|
|
// Single-bit flags, one bit per enumerator, so values can be OR-ed together.
enum {
  NEEDS_GOT      = 0x01,
  NEEDS_PLT      = 0x02,
  NEEDS_GOTTPOFF = 0x04,
  NEEDS_TLSGD    = 0x08,
  NEEDS_TLSLD    = 0x10,
  NEEDS_COPYREL  = 0x20,
  NEEDS_DYNSYM   = 0x40,
};
|
|
|
|
class Symbol {
|
|
public:
|
|
Symbol() = default;
|
|
Symbol(std::string_view name) : name(name) {}
|
|
Symbol(const Symbol &other) : name(other.name) {}
|
|
|
|
static Symbol *intern(std::string_view name) {
|
|
static ConcurrentMap<Symbol> map;
|
|
return map.insert(name, {name});
|
|
}
|
|
|
|
inline u64 get_addr() const;
|
|
inline u64 get_got_addr() const;
|
|
inline u64 get_gotplt_addr() const;
|
|
inline u64 get_gottpoff_addr() const;
|
|
inline u64 get_tlsgd_addr() const;
|
|
inline u64 get_plt_addr() const;
|
|
|
|
inline bool is_alive() const;
|
|
inline bool is_absolute() const;
|
|
inline bool is_relative() const { return !is_absolute(); }
|
|
|
|
std::string_view name;
|
|
InputFile *file = nullptr;
|
|
const ElfSym *esym = nullptr;
|
|
InputSection *input_section = nullptr;
|
|
SectionFragment *frag = nullptr;
|
|
|
|
u64 value = -1;
|
|
u32 got_idx = -1;
|
|
u32 gotplt_idx = -1;
|
|
u32 gottpoff_idx = -1;
|
|
u32 tlsgd_idx = -1;
|
|
u32 plt_idx = -1;
|
|
u32 dynsym_idx = -1;
|
|
u16 shndx = 0;
|
|
u16 ver_idx = 0;
|
|
|
|
std::atomic_uint8_t flags = 0;
|
|
u8 st_type = STT_NOTYPE;
|
|
|
|
tbb::spin_mutex mu;
|
|
|
|
u8 is_placeholder : 1 = false;
|
|
u8 is_imported : 1 = false;
|
|
u8 is_weak : 1 = false;
|
|
u8 is_undef_weak : 1 = false;
|
|
u8 write_symtab : 1 = false;
|
|
u8 traced : 1 = false;
|
|
u8 has_relplt : 1 = false;
|
|
u8 has_copyrel : 1 = false;
|
|
};
|
|
|
|
//
|
|
// input_sections.cc
|
|
//
|
|
|
|
class InputChunk {
|
|
public:
|
|
virtual void copy_buf() {}
|
|
inline u64 get_addr() const;
|
|
std::string_view get_contents() const;
|
|
|
|
ObjectFile *file;
|
|
const ElfShdr &shdr;
|
|
OutputSection *output_section = nullptr;
|
|
|
|
std::string_view name;
|
|
u32 offset = -1;
|
|
|
|
protected:
|
|
InputChunk(ObjectFile *file, const ElfShdr &shdr, std::string_view name);
|
|
};
|
|
|
|
// Relocation categories stored per relocation in InputSection::rel_types.
// Numbering starts at 1 and increases by one per enumerator.
enum RelType : u8 {
  R_NONE           = 1,
  R_ABS            = 2,
  R_ABS_DYN        = 3,
  R_DYN            = 4,
  R_PC             = 5,
  R_GOT            = 6,
  R_GOTPC          = 7,
  R_GOTPCREL       = 8,
  R_TLSGD          = 9,
  R_TLSGD_RELAX_LE = 10,
  R_TLSLD          = 11,
  R_TLSLD_RELAX_LE = 12,
  R_DTPOFF         = 13,
  R_TPOFF          = 14,
  R_GOTTPOFF       = 15,
};
|
|
|
|
struct EhReloc {
|
|
Symbol &sym;
|
|
u32 type;
|
|
u32 offset;
|
|
i64 addend;
|
|
};
|
|
|
|
// Two relocations are equal when they reference the same Symbol object
// (compared by address) and agree on type, offset and addend.
inline bool operator==(const EhReloc &a, const EhReloc &b) {
  if (&a.sym != &b.sym)
    return false;
  if (a.type != b.type)
    return false;
  if (a.offset != b.offset)
    return false;
  return a.addend == b.addend;
}
|
|
|
|
struct CieRecord;
|
|
|
|
struct FdeRecord {
|
|
FdeRecord(std::string_view contents, std::vector<EhReloc> &&rels,
|
|
u32 cie_idx)
|
|
: contents(contents), rels(std::move(rels)), cie_idx(cie_idx) {}
|
|
|
|
FdeRecord(const FdeRecord &&other)
|
|
: contents(other.contents), rels(std::move(other.rels)),
|
|
cie_idx(other.cie_idx), offset(other.offset),
|
|
is_alive(other.is_alive.load()) {}
|
|
|
|
std::string_view contents;
|
|
std::vector<EhReloc> rels;
|
|
u32 cie_idx = -1;
|
|
u32 offset = -1;
|
|
std::atomic_bool is_alive = true;
|
|
};
|
|
|
|
struct CieRecord {
|
|
bool should_merge(const CieRecord &other) const;
|
|
|
|
std::string_view contents;
|
|
std::vector<EhReloc> rels;
|
|
std::vector<FdeRecord> fdes;
|
|
|
|
// For .eh_frame
|
|
u32 offset = -1;
|
|
u32 leader_offset = -1;
|
|
u32 fde_size = -1;
|
|
|
|
// For .eh_frame_hdr
|
|
u32 num_fdes = 0;
|
|
u32 fde_idx = -1;
|
|
};
|
|
|
|
class InputSection : public InputChunk {
|
|
public:
|
|
InputSection(ObjectFile *file, const ElfShdr &shdr, std::string_view name,
|
|
i64 section_idx)
|
|
: InputChunk(file, shdr, name), section_idx(section_idx) {}
|
|
|
|
void copy_buf() override;
|
|
void scan_relocations();
|
|
void report_undefined_symbols();
|
|
void apply_reloc_alloc(u8 *base);
|
|
void apply_reloc_nonalloc(u8 *base);
|
|
void kill();
|
|
inline i64 get_priority() const;
|
|
|
|
std::span<ElfRela> rels;
|
|
std::vector<bool> has_fragments;
|
|
std::vector<SectionFragmentRef> rel_fragments;
|
|
std::vector<RelType> rel_types;
|
|
std::span<FdeRecord> fdes;
|
|
u64 reldyn_offset = 0;
|
|
u32 section_idx = -1;
|
|
bool is_comdat_member = false;
|
|
bool is_ehframe = false;
|
|
|
|
// For COMDAT de-duplication and garbage collection
|
|
bool is_alive = true;
|
|
|
|
// For garbage collection
|
|
std::atomic_bool is_visited = false;
|
|
|
|
// For ICF
|
|
bool icf_eligible = false;
|
|
bool icf_leaf = false;
|
|
InputSection *leader = nullptr;
|
|
u32 icf_idx = -1;
|
|
};
|
|
|
|
class MergeableSection : public InputChunk {
|
|
public:
|
|
MergeableSection(InputSection *isec);
|
|
|
|
MergedSection &parent;
|
|
std::vector<SectionFragment *> fragments;
|
|
std::vector<u32> frag_offsets;
|
|
u32 size = 0;
|
|
u32 padding = 0;
|
|
};
|
|
|
|
//
|
|
// output_chunks.cc
|
|
//
|
|
|
|
class OutputChunk {
|
|
public:
|
|
enum Kind : u8 { HEADER, REGULAR, SYNTHETIC };
|
|
|
|
virtual void copy_buf() {}
|
|
virtual void update_shdr() {}
|
|
|
|
std::string_view name;
|
|
i64 shndx = 0;
|
|
Kind kind;
|
|
bool starts_new_ptload = false;
|
|
ElfShdr shdr = { .sh_addralign = 1 };
|
|
|
|
protected:
|
|
OutputChunk(Kind kind) : kind(kind) {}
|
|
};
|
|
|
|
// ELF header
|
|
class OutputEhdr : public OutputChunk {
|
|
public:
|
|
OutputEhdr() : OutputChunk(HEADER) {
|
|
shdr.sh_flags = SHF_ALLOC;
|
|
shdr.sh_size = sizeof(ElfEhdr);
|
|
}
|
|
|
|
void copy_buf() override;
|
|
};
|
|
|
|
// Section header
|
|
class OutputShdr : public OutputChunk {
|
|
public:
|
|
OutputShdr() : OutputChunk(HEADER) {
|
|
shdr.sh_flags = SHF_ALLOC;
|
|
}
|
|
|
|
void update_shdr() override;
|
|
void copy_buf() override;
|
|
};
|
|
|
|
// Program header
|
|
class OutputPhdr : public OutputChunk {
|
|
public:
|
|
OutputPhdr() : OutputChunk(HEADER) {
|
|
shdr.sh_flags = SHF_ALLOC;
|
|
}
|
|
|
|
void update_shdr() override;
|
|
void copy_buf() override;
|
|
};
|
|
|
|
class InterpSection : public OutputChunk {
|
|
public:
|
|
InterpSection() : OutputChunk(SYNTHETIC) {
|
|
name = ".interp";
|
|
shdr.sh_type = SHT_PROGBITS;
|
|
shdr.sh_flags = SHF_ALLOC;
|
|
shdr.sh_size = config.dynamic_linker.size() + 1;
|
|
}
|
|
|
|
void copy_buf() override;
|
|
};
|
|
|
|
// Sections
|
|
class OutputSection : public OutputChunk {
|
|
public:
|
|
static OutputSection *get_instance(std::string_view name, u64 type, u64 flags);
|
|
|
|
OutputSection(std::string_view name, u32 type, u64 flags)
|
|
: OutputChunk(REGULAR) {
|
|
this->name = name;
|
|
shdr.sh_type = type;
|
|
shdr.sh_flags = flags;
|
|
idx = instances.size();
|
|
instances.push_back(this);
|
|
}
|
|
|
|
void copy_buf() override;
|
|
|
|
static inline std::vector<OutputSection *> instances;
|
|
|
|
std::vector<InputSection *> members;
|
|
u32 idx;
|
|
};
|
|
|
|
class GotSection : public OutputChunk {
|
|
public:
|
|
GotSection() : OutputChunk(SYNTHETIC) {
|
|
name = ".got";
|
|
shdr.sh_type = SHT_PROGBITS;
|
|
shdr.sh_flags = SHF_ALLOC | SHF_WRITE;
|
|
shdr.sh_addralign = GOT_SIZE;
|
|
}
|
|
|
|
void add_got_symbol(Symbol *sym);
|
|
void add_gottpoff_symbol(Symbol *sym);
|
|
void add_tlsgd_symbol(Symbol *sym);
|
|
void add_tlsld();
|
|
|
|
u64 get_tlsld_addr() const {
|
|
assert(tlsld_idx != -1);
|
|
return shdr.sh_addr + tlsld_idx * GOT_SIZE;
|
|
}
|
|
|
|
void copy_buf() override;
|
|
|
|
std::vector<Symbol *> got_syms;
|
|
std::vector<Symbol *> gottpoff_syms;
|
|
std::vector<Symbol *> tlsgd_syms;
|
|
u32 tlsld_idx = -1;
|
|
};
|
|
|
|
class GotPltSection : public OutputChunk {
|
|
public:
|
|
GotPltSection() : OutputChunk(SYNTHETIC) {
|
|
name = ".got.plt";
|
|
shdr.sh_type = SHT_PROGBITS;
|
|
shdr.sh_flags = SHF_ALLOC | SHF_WRITE;
|
|
shdr.sh_addralign = GOT_SIZE;
|
|
shdr.sh_size = GOT_SIZE * 3;
|
|
}
|
|
|
|
void copy_buf() override;
|
|
};
|
|
|
|
class PltSection : public OutputChunk {
|
|
public:
|
|
PltSection() : OutputChunk(SYNTHETIC) {
|
|
name = ".plt";
|
|
shdr.sh_type = SHT_PROGBITS;
|
|
shdr.sh_flags = SHF_ALLOC | SHF_EXECINSTR;
|
|
shdr.sh_addralign = 8;
|
|
shdr.sh_size = PLT_SIZE;
|
|
}
|
|
|
|
void add_symbol(Symbol *sym);
|
|
void copy_buf() override;
|
|
|
|
std::vector<Symbol *> symbols;
|
|
};
|
|
|
|
class RelPltSection : public OutputChunk {
|
|
public:
|
|
RelPltSection() : OutputChunk(SYNTHETIC) {
|
|
name = ".rela.plt";
|
|
shdr.sh_type = SHT_RELA;
|
|
shdr.sh_flags = SHF_ALLOC;
|
|
shdr.sh_entsize = sizeof(ElfRela);
|
|
shdr.sh_addralign = 8;
|
|
}
|
|
|
|
void update_shdr() override;
|
|
void copy_buf() override;
|
|
};
|
|
|
|
class RelDynSection : public OutputChunk {
|
|
public:
|
|
RelDynSection() : OutputChunk(SYNTHETIC) {
|
|
name = ".rela.dyn";
|
|
shdr.sh_type = SHT_RELA;
|
|
shdr.sh_flags = SHF_ALLOC;
|
|
shdr.sh_entsize = sizeof(ElfRela);
|
|
shdr.sh_addralign = 8;
|
|
}
|
|
|
|
void update_shdr() override;
|
|
void copy_buf() override;
|
|
};
|
|
|
|
class StrtabSection : public OutputChunk {
|
|
public:
|
|
StrtabSection() : OutputChunk(SYNTHETIC) {
|
|
name = ".strtab";
|
|
shdr.sh_type = SHT_STRTAB;
|
|
shdr.sh_size = 1;
|
|
}
|
|
|
|
void update_shdr() override;
|
|
};
|
|
|
|
class ShstrtabSection : public OutputChunk {
|
|
public:
|
|
ShstrtabSection() : OutputChunk(SYNTHETIC) {
|
|
name = ".shstrtab";
|
|
shdr.sh_type = SHT_STRTAB;
|
|
}
|
|
|
|
void update_shdr() override;
|
|
void copy_buf() override;
|
|
};
|
|
|
|
class DynstrSection : public OutputChunk {
|
|
public:
|
|
DynstrSection() : OutputChunk(SYNTHETIC) {
|
|
name = ".dynstr";
|
|
shdr.sh_type = SHT_STRTAB;
|
|
shdr.sh_flags = SHF_ALLOC;
|
|
shdr.sh_size = 1;
|
|
}
|
|
|
|
i64 add_string(std::string_view str);
|
|
i64 find_string(std::string_view str);
|
|
void copy_buf() override;
|
|
|
|
private:
|
|
std::unordered_map<std::string_view, i64> strings;
|
|
};
|
|
|
|
class DynamicSection : public OutputChunk {
|
|
public:
|
|
DynamicSection() : OutputChunk(SYNTHETIC) {
|
|
name = ".dynamic";
|
|
shdr.sh_type = SHT_DYNAMIC;
|
|
shdr.sh_flags = SHF_ALLOC | SHF_WRITE;
|
|
shdr.sh_addralign = 8;
|
|
shdr.sh_entsize = sizeof(ElfDyn);
|
|
}
|
|
|
|
void update_shdr() override;
|
|
void copy_buf() override;
|
|
};
|
|
|
|
class SymtabSection : public OutputChunk {
|
|
public:
|
|
SymtabSection() : OutputChunk(SYNTHETIC) {
|
|
name = ".symtab";
|
|
shdr.sh_type = SHT_SYMTAB;
|
|
shdr.sh_entsize = sizeof(ElfSym);
|
|
shdr.sh_addralign = 8;
|
|
shdr.sh_size = sizeof(ElfSym);
|
|
}
|
|
|
|
void update_shdr() override;
|
|
void copy_buf() override;
|
|
};
|
|
|
|
class DynsymSection : public OutputChunk {
|
|
public:
|
|
DynsymSection() : OutputChunk(SYNTHETIC) {
|
|
name = ".dynsym";
|
|
shdr.sh_type = SHT_DYNSYM;
|
|
shdr.sh_flags = SHF_ALLOC;
|
|
shdr.sh_entsize = sizeof(ElfSym);
|
|
shdr.sh_addralign = 8;
|
|
shdr.sh_size = sizeof(ElfSym);
|
|
}
|
|
|
|
void add_symbol(Symbol *sym);
|
|
void sort_symbols();
|
|
void update_shdr() override;
|
|
void copy_buf() override;
|
|
|
|
std::vector<Symbol *> symbols = {nullptr};
|
|
std::vector<u32> name_indices = {(u32)-1};
|
|
};
|
|
|
|
class HashSection : public OutputChunk {
|
|
public:
|
|
HashSection() : OutputChunk(SYNTHETIC) {
|
|
name = ".hash";
|
|
shdr.sh_type = SHT_HASH;
|
|
shdr.sh_flags = SHF_ALLOC;
|
|
shdr.sh_entsize = 4;
|
|
shdr.sh_addralign = 4;
|
|
}
|
|
|
|
void update_shdr() override;
|
|
void copy_buf() override;
|
|
};
|
|
|
|
class GnuHashSection : public OutputChunk {
|
|
public:
|
|
GnuHashSection() : OutputChunk(SYNTHETIC) {
|
|
name = ".gnu.hash";
|
|
shdr.sh_type = SHT_GNU_HASH;
|
|
shdr.sh_flags = SHF_ALLOC;
|
|
shdr.sh_addralign = 8;
|
|
}
|
|
|
|
void update_shdr() override;
|
|
void copy_buf() override;
|
|
|
|
static constexpr i64 LOAD_FACTOR = 8;
|
|
static constexpr i64 HEADER_SIZE = 16;
|
|
static constexpr i64 BLOOM_SHIFT = 26;
|
|
static constexpr i64 ELFCLASS_BITS = 64;
|
|
|
|
u32 num_buckets = -1;
|
|
u32 symoffset = -1;
|
|
u32 num_bloom = 1;
|
|
};
|
|
|
|
class MergedSection : public OutputChunk {
|
|
public:
|
|
static MergedSection *get_instance(std::string_view name, u64 type, u64 flags);
|
|
|
|
static inline std::vector<MergedSection *> instances;
|
|
|
|
SectionFragment *insert(std::string_view data, u32 alignment) {
|
|
typename decltype(map)::const_accessor acc;
|
|
map.insert(acc, std::pair(SectionFragmentKey{data, alignment},
|
|
SectionFragment(data)));
|
|
return const_cast<SectionFragment *>(&acc->second);
|
|
}
|
|
|
|
void copy_buf() override;
|
|
|
|
private:
|
|
MergedSection(std::string_view name, u64 flags, u32 type)
|
|
: OutputChunk(SYNTHETIC) {
|
|
this->name = name;
|
|
shdr.sh_flags = flags;
|
|
shdr.sh_type = type;
|
|
}
|
|
|
|
tbb::concurrent_hash_map<SectionFragmentKey, SectionFragment> map;
|
|
};
|
|
|
|
class EhFrameSection : public OutputChunk {
|
|
public:
|
|
EhFrameSection() : OutputChunk(SYNTHETIC) {
|
|
name = ".eh_frame";
|
|
shdr.sh_type = SHT_X86_64_UNWIND;
|
|
shdr.sh_flags = SHF_ALLOC;
|
|
shdr.sh_addralign = 8;
|
|
}
|
|
|
|
void construct();
|
|
void copy_buf() override;
|
|
u64 get_addr(const Symbol &sym);
|
|
|
|
std::vector<CieRecord *> cies;
|
|
u32 num_fdes = 0;
|
|
};
|
|
|
|
class EhFrameHdrSection : public OutputChunk {
|
|
public:
|
|
EhFrameHdrSection() : OutputChunk(SYNTHETIC) {
|
|
name = ".eh_frame_hdr";
|
|
shdr.sh_type = SHT_PROGBITS;
|
|
shdr.sh_flags = SHF_ALLOC;
|
|
shdr.sh_addralign = 4;
|
|
shdr.sh_size = HEADER_SIZE;
|
|
}
|
|
|
|
static constexpr i64 HEADER_SIZE = 12;
|
|
};
|
|
|
|
class CopyrelSection : public OutputChunk {
|
|
public:
|
|
CopyrelSection() : OutputChunk(SYNTHETIC) {
|
|
name = ".bss";
|
|
shdr.sh_type = SHT_NOBITS;
|
|
shdr.sh_flags = SHF_ALLOC | SHF_WRITE;
|
|
shdr.sh_addralign = 32;
|
|
}
|
|
|
|
void add_symbol(Symbol *sym);
|
|
|
|
std::vector<Symbol *> symbols;
|
|
};
|
|
|
|
class VersymSection : public OutputChunk {
|
|
public:
|
|
VersymSection() : OutputChunk(SYNTHETIC) {
|
|
name = ".gnu.version";
|
|
shdr.sh_type = SHT_GNU_VERSYM;
|
|
shdr.sh_flags = SHF_ALLOC;
|
|
shdr.sh_entsize = 2;
|
|
shdr.sh_addralign = 2;
|
|
}
|
|
|
|
void update_shdr() override;
|
|
void copy_buf() override;
|
|
|
|
std::vector<u16> contents;
|
|
};
|
|
|
|
class VerneedSection : public OutputChunk {
|
|
public:
|
|
VerneedSection() : OutputChunk(SYNTHETIC) {
|
|
name = ".gnu.version_r";
|
|
shdr.sh_type = SHT_GNU_VERNEED;
|
|
shdr.sh_flags = SHF_ALLOC;
|
|
shdr.sh_addralign = 8;
|
|
}
|
|
|
|
void update_shdr() override;
|
|
void copy_buf() override;
|
|
|
|
std::vector<u8> contents;
|
|
};
|
|
|
|
class BuildIdSection : public OutputChunk {
|
|
public:
|
|
BuildIdSection() : OutputChunk(SYNTHETIC) {
|
|
name = ".note.gnu.build-id";
|
|
shdr.sh_type = SHT_NOTE;
|
|
shdr.sh_flags = SHF_ALLOC;
|
|
shdr.sh_addralign = 4;
|
|
shdr.sh_size = 1;
|
|
}
|
|
|
|
void update_shdr() override;
|
|
void copy_buf() override;
|
|
void write_buildid(i64 filesize);
|
|
|
|
static constexpr i64 HEADER_SIZE = 16;
|
|
};
|
|
|
|
bool is_c_identifier(std::string_view name);
|
|
std::vector<ElfPhdr> create_phdr();
|
|
|
|
//
|
|
// object_file.cc
|
|
//
|
|
|
|
struct ComdatGroup {
|
|
ComdatGroup() = default;
|
|
ComdatGroup(const ComdatGroup &other)
|
|
: owner(other.owner.load()), section_idx(other.section_idx) {}
|
|
|
|
std::atomic<ObjectFile *> owner = nullptr;
|
|
u32 section_idx = -1;
|
|
};
|
|
|
|
// A named byte range backing an input file. Instances are created by
// open()/must_open() or carved out of another instance with slice().
class MemoryMappedFile {
public:
  static MemoryMappedFile *open(std::string path);
  static MemoryMappedFile *must_open(std::string path);

  // Initializers are listed in member declaration order. `name` is moved
  // rather than copied, and `parent` starts out null through its in-class
  // initializer instead of being left indeterminate.
  MemoryMappedFile(std::string name, u8 *data, u64 size, u64 mtime = 0)
    : name(std::move(name)), mtime(mtime), data_(data), size_(size) {}
  MemoryMappedFile() = delete;

  MemoryMappedFile *slice(std::string name, u64 start, u64 size);

  u8 *data();
  i64 size() const { return size_; }

  // Non-owning view of the whole byte range.
  std::string_view get_contents() {
    return std::string_view((char *)data(), size());
  }

  std::string name;
  i64 mtime = 0;

private:
  std::mutex mu;
  MemoryMappedFile *parent = nullptr;
  std::atomic<u8 *> data_;
  i64 size_ = 0;
};
|
|
|
|
class InputFile {
|
|
public:
|
|
InputFile(MemoryMappedFile *mb);
|
|
InputFile() : name("<internal>") {}
|
|
|
|
MemoryMappedFile *mb;
|
|
std::span<ElfShdr> elf_sections;
|
|
std::vector<Symbol *> symbols;
|
|
|
|
std::string name;
|
|
bool is_dso = false;
|
|
u32 priority;
|
|
std::atomic_bool is_alive = false;
|
|
|
|
std::string_view get_string(const ElfShdr &shdr);
|
|
std::string_view get_string(i64 idx);
|
|
|
|
protected:
|
|
template<typename T> std::span<T> get_data(const ElfShdr &shdr);
|
|
template<typename T> std::span<T> get_data(i64 idx);
|
|
ElfShdr *find_section(i64 type);
|
|
|
|
std::string_view shstrtab;
|
|
};
|
|
|
|
class ObjectFile : public InputFile {
|
|
public:
|
|
ObjectFile(MemoryMappedFile *mb, std::string archive_name);
|
|
ObjectFile();
|
|
|
|
void parse();
|
|
void resolve_symbols();
|
|
void mark_live_objects(std::function<void(ObjectFile *)> feeder);
|
|
void handle_undefined_weak_symbols();
|
|
void resolve_comdat_groups();
|
|
void eliminate_duplicate_comdat_groups();
|
|
void scan_relocations();
|
|
void convert_common_symbols();
|
|
void compute_symtab();
|
|
void write_symtab();
|
|
|
|
static ObjectFile *create_internal_file();
|
|
|
|
std::string archive_name;
|
|
std::vector<InputSection *> sections;
|
|
std::span<ElfSym> elf_syms;
|
|
i64 first_global = 0;
|
|
const bool is_in_archive = false;
|
|
std::vector<CieRecord> cies;
|
|
|
|
u64 num_dynrel = 0;
|
|
u64 reldyn_offset = 0;
|
|
|
|
u64 local_symtab_offset = 0;
|
|
u64 global_symtab_offset = 0;
|
|
u64 num_local_symtab = 0;
|
|
u64 num_global_symtab = 0;
|
|
u64 strtab_offset = 0;
|
|
u64 strtab_size = 0;
|
|
|
|
std::vector<MergeableSection *> mergeable_sections;
|
|
|
|
private:
|
|
void initialize_sections();
|
|
void initialize_symbols();
|
|
void initialize_mergeable_sections();
|
|
void initialize_ehframe_sections();
|
|
void read_ehframe(InputSection &isec);
|
|
void maybe_override_symbol(Symbol &sym, i64 symidx);
|
|
|
|
std::vector<std::pair<ComdatGroup *, std::span<u32>>> comdat_groups;
|
|
std::vector<SectionFragmentRef> sym_fragments;
|
|
bool has_common_symbol;
|
|
|
|
std::string_view symbol_strtab;
|
|
const ElfShdr *symtab_sec;
|
|
};
|
|
|
|
class SharedFile : public InputFile {
|
|
public:
|
|
SharedFile(MemoryMappedFile *mb, bool as_needed) : InputFile(mb) {
|
|
is_alive = !as_needed;
|
|
}
|
|
|
|
void parse();
|
|
void resolve_symbols();
|
|
std::span<Symbol *> find_aliases(Symbol *sym);
|
|
|
|
std::string_view soname;
|
|
std::vector<std::string_view> version_strings;
|
|
|
|
private:
|
|
std::string_view get_soname();
|
|
void maybe_override_symbol(Symbol &sym, const ElfSym &esym);
|
|
std::vector<std::string_view> read_verdef();
|
|
|
|
std::vector<const ElfSym *> elf_syms;
|
|
std::vector<u16> versyms;
|
|
std::string_view symbol_strtab;
|
|
const ElfShdr *symtab_sec;
|
|
};
|
|
|
|
inline std::ostream &operator<<(std::ostream &out, const InputChunk &isec) {
|
|
out << *isec.file << ":(" << isec.name << ")";
|
|
return out;
|
|
}
|
|
|
|
//
|
|
// archive_file.cc
|
|
//
|
|
|
|
std::vector<MemoryMappedFile *> read_archive_members(MemoryMappedFile *mb);
|
|
std::vector<MemoryMappedFile *> read_fat_archive_members(MemoryMappedFile *mb);
|
|
std::vector<MemoryMappedFile *> read_thin_archive_members(MemoryMappedFile *mb);
|
|
|
|
//
|
|
// linker_script.cc
|
|
//
|
|
|
|
void parse_linker_script(MemoryMappedFile *mb, bool as_needed);
|
|
void parse_version_script(std::string path);
|
|
|
|
//
|
|
// output_file.cc
|
|
//
|
|
|
|
// Abstract handle to the output file. Concrete instances are obtained
// through open(); close() is implemented by the derived class.
class OutputFile {
public:
  static OutputFile *open(std::string path, u64 filesize);

  // Instances are handed out as OutputFile pointers, so destruction through
  // the base must be well defined.
  virtual ~OutputFile() = default;
  virtual void close() = 0;

  // Null until a derived class assigns it, rather than indeterminate.
  u8 *buf = nullptr;
  static inline char *tmpfile;

protected:
  OutputFile(std::string path, u64 filesize)
    : path(std::move(path)), filesize(filesize) {}

  std::string path;
  u64 filesize;
};
|
|
|
|
//
|
|
// perf.cc
|
|
//
|
|
|
|
class Counter {
|
|
public:
|
|
Counter(std::string_view name, i64 value = 0) : name(name), values(value) {
|
|
static std::mutex mu;
|
|
std::lock_guard lock(mu);
|
|
instances.push_back(this);
|
|
}
|
|
|
|
void inc(i64 delta = 1) {
|
|
if (enabled)
|
|
values.local() += delta;
|
|
}
|
|
|
|
static void print();
|
|
static inline bool enabled = false;
|
|
|
|
private:
|
|
i64 get_value();
|
|
|
|
std::string_view name;
|
|
tbb::enumerable_thread_specific<i64> values;
|
|
|
|
static inline std::vector<Counter *> instances;
|
|
};
|
|
|
|
struct TimerRecord {
|
|
TimerRecord(std::string name);
|
|
void stop();
|
|
|
|
std::string name;
|
|
i64 start;
|
|
i64 end;
|
|
i64 user;
|
|
i64 sys;
|
|
bool stopped = false;
|
|
};
|
|
|
|
class Timer {
|
|
public:
|
|
Timer(std::string name);
|
|
~Timer();
|
|
void stop();
|
|
static void print();
|
|
|
|
private:
|
|
static inline std::vector<TimerRecord *> records;
|
|
TimerRecord *record;
|
|
};
|
|
|
|
//
|
|
// gc_sections.cc
|
|
//
|
|
|
|
void gc_sections();
|
|
|
|
//
|
|
// icf_sections.cc
|
|
//
|
|
|
|
void icf_sections();
|
|
|
|
//
|
|
// icf.cc
|
|
//
|
|
|
|
void icf_sections();
|
|
|
|
//
|
|
// mapfile.cc
|
|
//
|
|
|
|
void print_map();
|
|
|
|
//
|
|
// subprocess.cc
|
|
//
|
|
|
|
inline char *socket_tmpfile;
|
|
|
|
std::function<void()> fork_child();
|
|
bool resume_daemon(char **argv, i64 *code);
|
|
void daemonize(char **argv, std::function<void()> *wait_for_client,
|
|
std::function<void()> *on_complete);
|
|
|
|
//
|
|
// main.cc
|
|
//
|
|
|
|
MemoryMappedFile *find_library(std::string path, std::span<std::string_view> lib_paths);
|
|
void read_file(MemoryMappedFile *mb, bool as_needed);
|
|
|
|
//
|
|
// Inline objects and functions
|
|
//
|
|
|
|
namespace out {
|
|
inline std::vector<ObjectFile *> objs;
|
|
inline std::vector<SharedFile *> dsos;
|
|
inline std::vector<OutputChunk *> chunks;
|
|
inline u8 *buf;
|
|
|
|
inline ObjectFile *internal_file;
|
|
|
|
inline OutputEhdr *ehdr;
|
|
inline OutputShdr *shdr;
|
|
inline OutputPhdr *phdr;
|
|
inline InterpSection *interp;
|
|
inline GotSection *got;
|
|
inline GotPltSection *gotplt;
|
|
inline RelPltSection *relplt;
|
|
inline RelDynSection *reldyn;
|
|
inline DynamicSection *dynamic;
|
|
inline StrtabSection *strtab;
|
|
inline DynstrSection *dynstr;
|
|
inline HashSection *hash;
|
|
inline GnuHashSection *gnu_hash;
|
|
inline ShstrtabSection *shstrtab;
|
|
inline PltSection *plt;
|
|
inline SymtabSection *symtab;
|
|
inline DynsymSection *dynsym;
|
|
inline EhFrameSection *eh_frame;
|
|
inline EhFrameHdrSection *eh_frame_hdr;
|
|
inline CopyrelSection *copyrel;
|
|
inline VersymSection *versym;
|
|
inline VerneedSection *verneed;
|
|
inline BuildIdSection *buildid;
|
|
|
|
inline u64 tls_begin;
|
|
inline u64 tls_end;
|
|
|
|
inline Symbol *__bss_start;
|
|
inline Symbol *__ehdr_start;
|
|
inline Symbol *__rela_iplt_start;
|
|
inline Symbol *__rela_iplt_end;
|
|
inline Symbol *__init_array_start;
|
|
inline Symbol *__init_array_end;
|
|
inline Symbol *__fini_array_start;
|
|
inline Symbol *__fini_array_end;
|
|
inline Symbol *__preinit_array_start;
|
|
inline Symbol *__preinit_array_end;
|
|
inline Symbol *_DYNAMIC;
|
|
inline Symbol *_GLOBAL_OFFSET_TABLE_;
|
|
inline Symbol *_end;
|
|
inline Symbol *_etext;
|
|
inline Symbol *_edata;
|
|
}
|
|
|
|
// Rounds `val` up to the next multiple of `align`. `align` must be zero
// (meaning "no alignment", `val` is returned unchanged) or a power of two.
inline u64 align_to(u64 val, u64 align) {
  if (align == 0)
    return val;
  // Power-of-two check on the full 64-bit value. __builtin_popcount() takes
  // an unsigned int, so it would only look at the low 32 bits of `align`.
  assert((align & (align - 1)) == 0);
  return (val + align - 1) & ~(align - 1);
}
|
|
|
|
// Returns the smallest power of two that is >= `val`; zero maps to 1.
inline u64 next_power_of_two(u64 val) {
  if (val == 0)
    return 1;

  // Smear the highest set bit of (val - 1) into every lower position, then
  // add one to reach the next power of two.
  val -= 1;
  for (int shift = 1; shift <= 32; shift *= 2)
    val |= val >> shift;
  return val + 1;
}
|
|
|
|
inline bool Symbol::is_alive() const {
|
|
if (frag)
|
|
return frag->is_alive;
|
|
if (input_section)
|
|
return input_section->is_alive;
|
|
return true;
|
|
}
|
|
|
|
inline bool Symbol::is_absolute() const {
|
|
return input_section == nullptr && file != out::internal_file;
|
|
}
|
|
|
|
// Computes the symbol's address. The cases are tried in this order:
// fragment, copy relocation, input section, shared-object symbol, and
// finally the raw `value`.
inline u64 Symbol::get_addr() const {
  if (frag)
    return frag->is_alive ? frag->get_addr() + value
                          : 0; // todo: do not return 0

  if (has_copyrel)
    return out::copyrel->shdr.sh_addr + value;

  if (!input_section) {
    // Symbols from a shared object resolve to their PLT entry.
    const bool from_dso = file && file->is_dso;
    return from_dso ? get_plt_addr() : value;
  }

  if (input_section->is_ehframe)
    return out::eh_frame->get_addr(*this);

  if (!input_section->is_alive) {
    // The control can reach here if there's a relocation that refers
    // a local symbol belonging to a comdat group section. This is a
    // violation of the spec, as all relocations should use only global
    // symbols of comdat members. However, .eh_frame tends to have such
    // relocations.
    return 0;
  }

  return input_section->get_addr() + value;
}
|
|
|
|
// Address of slot `got_idx` in out::got; the index must have been assigned.
inline u64 Symbol::get_got_addr() const {
  assert(got_idx != -1);
  const i64 slot_offset = got_idx * GOT_SIZE;
  return out::got->shdr.sh_addr + slot_offset;
}
|
|
|
|
// Address of slot `gotplt_idx` in out::gotplt; the index must have been
// assigned.
inline u64 Symbol::get_gotplt_addr() const {
  assert(gotplt_idx != -1);
  const i64 slot_offset = gotplt_idx * GOT_SIZE;
  return out::gotplt->shdr.sh_addr + slot_offset;
}
|
|
|
|
// Address of slot `gottpoff_idx` in out::got; the index must have been
// assigned.
inline u64 Symbol::get_gottpoff_addr() const {
  assert(gottpoff_idx != -1);
  const i64 slot_offset = gottpoff_idx * GOT_SIZE;
  return out::got->shdr.sh_addr + slot_offset;
}
|
|
|
|
// Address of slot `tlsgd_idx` in out::got; the index must have been
// assigned.
inline u64 Symbol::get_tlsgd_addr() const {
  assert(tlsgd_idx != -1);
  const i64 slot_offset = tlsgd_idx * GOT_SIZE;
  return out::got->shdr.sh_addr + slot_offset;
}
|
|
|
|
// Address of entry `plt_idx` in out::plt; the index must have been
// assigned.
inline u64 Symbol::get_plt_addr() const {
  assert(plt_idx != -1);
  const i64 entry_offset = plt_idx * PLT_SIZE;
  return out::plt->shdr.sh_addr + entry_offset;
}
|
|
|
|
// Address of the fragment: the merged section's sh_addr, plus the owning
// mergeable section's offset, plus this fragment's offset. Dead fragments
// yield 0.
inline u64 SectionFragment::get_addr() const {
  if (!is_alive)
    return 0; // todo: remove

  const MergeableSection *owner = isec.load();
  const u64 section_base = owner->parent.shdr.sh_addr;
  return section_base + owner->offset + offset;
}
|
|
|
|
// Address of the chunk: the output section's sh_addr plus `offset`.
inline u64 InputChunk::get_addr() const {
  const auto &out_shdr = output_section->shdr;
  return out_shdr.sh_addr + offset;
}
|
|
|
|
// Packs the file priority into the upper 32 bits and the section index into
// the lower 32 bits of one i64.
inline i64 InputSection::get_priority() const {
  const i64 file_part = (i64)file->priority << 32;
  return file_part | section_idx;
}
|
|
|
|
// Hashes `name` four bits at a time; whenever the top four bits of the
// running value become non-zero they are folded back in and cleared.
inline u32 elf_hash(std::string_view name) {
  u32 h = 0;
  for (size_t i = 0; i < name.size(); i++) {
    h = (h << 4) + static_cast<u8>(name[i]);
    const u32 top = h & 0xf0000000;
    // When `top` is zero both operations leave `h` unchanged.
    h = (h ^ (top >> 24)) & ~top;
  }
  return h;
}
|
|
|
|
// Hashes `name` starting from 5381 and computing h = h * 33 + c for every
// byte, with 32-bit wrap-around.
inline u32 gnu_hash(std::string_view name) {
  u32 h = 5381;
  for (size_t i = 0; i < name.size(); i++)
    h = h * 33 + static_cast<u8>(name[i]);
  return h;
}
|
|
|
|
// Copies the bytes of `str` to `buf` and appends a terminating NUL, so
// `buf` must have room for str.size() + 1 bytes.
inline void write_string(u8 *buf, std::string_view str) {
  const size_t len = str.size();
  memcpy(buf, str.data(), len);
  buf[len] = '\0';
}
|
|
|
|
// Copies the raw element storage of `vec` to `buf`
// (vec.size() * sizeof(T) bytes).
template <typename T>
inline void write_vector(u8 *buf, const std::vector<T> &vec) {
  const size_t nbytes = vec.size() * sizeof(T);
  memcpy(buf, vec.data(), nbytes);
}
|
|
|
|
// Appends every element of `vec2` to the end of `vec1`.
//
// `vec2` is taken by const reference so that calling this does not copy the
// whole source vector first. Appending a vector to itself is still
// supported: that one case works from a temporary copy, because inserting a
// vector's own iterator range into it is not allowed.
template <typename T, typename U>
inline void append(std::vector<T> &vec1, const std::vector<U> &vec2) {
  if (static_cast<const void *>(&vec1) == static_cast<const void *>(&vec2)) {
    const std::vector<U> snapshot(vec2);
    vec1.insert(vec1.end(), snapshot.begin(), snapshot.end());
    return;
  }
  vec1.insert(vec1.end(), vec2.begin(), vec2.end());
}
|
|
|
|
template <typename T>
|
|
inline std::vector<T> flatten(std::vector<std::vector<T>> &vec) {
|
|
std::vector<T> ret;
|
|
for (std::vector<T> &v : vec)
|
|
append(ret, v);
|
|
return ret;
|
|
}
|
|
|
|
// Removes every element of `vec` for which `pred` returns true, keeping the
// remaining elements in their original order.
template <typename T, typename U>
inline void erase(std::vector<T> &vec, U pred) {
  auto new_end = std::remove_if(vec.begin(), vec.end(), pred);
  vec.erase(new_end, vec.end());
}
|
|
|
|
// Stable-sorts the whole container with the comparison `less`; elements
// that compare equal keep their relative order.
template <typename T, typename U>
inline void sort(T &vec, U less) {
  auto first = vec.begin();
  auto last = vec.end();
  std::stable_sort(first, last, less);
}
|