1
1
mirror of https://github.com/rui314/mold.git synced 2024-09-22 18:40:59 +03:00
mold/output_chunks.cc

522 lines
15 KiB
C++
Raw Normal View History

2020-10-20 08:54:35 +03:00
#include "mold.h"
2020-10-13 14:35:35 +03:00
2020-11-03 14:47:39 +03:00
#include <shared_mutex>
2020-10-16 10:38:03 +03:00
using namespace llvm::ELF;
2020-11-17 07:56:40 +03:00
void OutputEhdr::copy_buf() {
auto &hdr = *(ELF64LE::Ehdr *)(out::buf + shdr.sh_offset);
2020-11-16 18:17:01 +03:00
memset(&hdr, 0, sizeof(hdr));
memcpy(&hdr.e_ident, "\177ELF", 4);
hdr.e_ident[EI_CLASS] = ELFCLASS64;
hdr.e_ident[EI_DATA] = ELFDATA2LSB;
hdr.e_ident[EI_VERSION] = EV_CURRENT;
hdr.e_ident[EI_OSABI] = 0;
hdr.e_ident[EI_ABIVERSION] = 0;
hdr.e_type = ET_EXEC;
hdr.e_machine = EM_X86_64;
hdr.e_version = EV_CURRENT;
hdr.e_entry = Symbol::intern("_start")->get_addr();
hdr.e_phoff = out::phdr->shdr.sh_offset;
hdr.e_shoff = out::shdr->shdr.sh_offset;
hdr.e_flags = 0;
hdr.e_ehsize = sizeof(ELF64LE::Ehdr);
hdr.e_phentsize = sizeof(ELF64LE::Phdr);
hdr.e_phnum = out::phdr->shdr.sh_size / sizeof(ELF64LE::Phdr);
hdr.e_shentsize = sizeof(ELF64LE::Shdr);
hdr.e_shnum = out::shdr->shdr.sh_size / sizeof(ELF64LE::Shdr);
hdr.e_shstrndx = out::shstrtab->shndx;
}
2020-11-16 18:23:51 +03:00
void OutputShdr::update_shdr() {
int i = 1;
for (OutputChunk *chunk : out::chunks)
if (chunk->kind != OutputChunk::HEADER)
i++;
shdr.sh_size = i * sizeof(ELF64LE::Shdr);
}
2020-11-17 07:56:40 +03:00
void OutputShdr::copy_buf() {
u8 *base = out::buf + shdr.sh_offset;
2020-11-16 18:23:51 +03:00
memset(base, 0, sizeof(ELF64LE::Shdr));
auto *ptr = (ELF64LE::Shdr *)(base + sizeof(ELF64LE::Shdr));
for (OutputChunk *chunk : out::chunks)
if (chunk->kind != OutputChunk::HEADER)
*ptr++ = chunk->shdr;
}
2020-11-16 18:33:41 +03:00
static u32 to_phdr_flags(OutputChunk *chunk) {
u32 ret = PF_R;
if (chunk->shdr.sh_flags & SHF_WRITE)
ret |= PF_W;
if (chunk->shdr.sh_flags & SHF_EXECINSTR)
ret |= PF_X;
return ret;
}
static std::vector<ELF64LE::Phdr> create_phdr() {
std::vector<ELF64LE::Phdr> vec;
auto define = [&](u32 type, u32 flags, u32 align, OutputChunk *chunk) {
vec.push_back({});
ELF64LE::Phdr &phdr = vec.back();
phdr.p_type = type;
phdr.p_flags = flags;
phdr.p_align = std::max<u64>(align, chunk->shdr.sh_addralign);
phdr.p_offset = chunk->shdr.sh_offset;
phdr.p_filesz = (chunk->shdr.sh_type == SHT_NOBITS) ? 0 : chunk->shdr.sh_size;
phdr.p_vaddr = chunk->shdr.sh_addr;
phdr.p_memsz = chunk->shdr.sh_size;
if (type == PT_LOAD)
chunk->starts_new_ptload = true;
};
auto append = [&](OutputChunk *chunk) {
ELF64LE::Phdr &phdr = vec.back();
phdr.p_align = std::max<u64>(phdr.p_align, chunk->shdr.sh_addralign);
phdr.p_filesz = (chunk->shdr.sh_type == SHT_NOBITS)
? chunk->shdr.sh_offset - phdr.p_offset
: chunk->shdr.sh_offset + chunk->shdr.sh_size - phdr.p_offset;
phdr.p_memsz = chunk->shdr.sh_addr + chunk->shdr.sh_size - phdr.p_vaddr;
};
auto is_bss = [](OutputChunk *chunk) {
return chunk->shdr.sh_type == SHT_NOBITS && !(chunk->shdr.sh_flags & SHF_TLS);
};
// Create a PT_PHDR for the program header itself.
define(PT_PHDR, PF_R, 8, out::phdr);
// Create an PT_INTERP.
if (out::interp)
define(PT_INTERP, PF_R, 1, out::interp);
// Create PT_LOAD segments.
for (int i = 0, end = out::chunks.size(); i < end;) {
OutputChunk *first = out::chunks[i++];
if (!(first->shdr.sh_flags & SHF_ALLOC))
break;
u32 flags = to_phdr_flags(first);
define(PT_LOAD, flags, PAGE_SIZE, first);
if (!is_bss(first))
while (i < end && !is_bss(out::chunks[i]) &&
to_phdr_flags(out::chunks[i]) == flags)
append(out::chunks[i++]);
while (i < end && is_bss(out::chunks[i]) &&
to_phdr_flags(out::chunks[i]) == flags)
append(out::chunks[i++]);
}
// Create a PT_TLS.
for (int i = 0; i < out::chunks.size(); i++) {
if (out::chunks[i]->shdr.sh_flags & SHF_TLS) {
define(PT_TLS, to_phdr_flags(out::chunks[i]), 1, out::chunks[i]);
i++;
while (i < out::chunks.size() && (out::chunks[i]->shdr.sh_flags & SHF_TLS))
append(out::chunks[i++]);
}
}
// Add PT_DYNAMIC
if (out::dynamic)
define(PT_DYNAMIC, PF_R | PF_W, out::dynamic->shdr.sh_addralign, out::dynamic);
return vec;
}
void OutputPhdr::update_shdr() {
shdr.sh_size = create_phdr().size() * sizeof(ELF64LE::Phdr);
}
2020-11-17 07:56:40 +03:00
void OutputPhdr::copy_buf() {
write_vector(out::buf + shdr.sh_offset, create_phdr());
2020-11-16 18:43:32 +03:00
}
2020-11-17 07:56:40 +03:00
void InterpSection::copy_buf() {
write_string(out::buf + shdr.sh_offset, config.dynamic_linker);
2020-11-16 19:05:01 +03:00
}
2020-11-16 18:43:32 +03:00
static std::vector<u64> create_dynamic_section() {
std::vector<u64> vec;
auto define = [&](u64 tag, u64 val) {
vec.push_back(tag);
vec.push_back(val);
};
int i = 1;
for (ObjectFile *file : out::files) {
if (!file->soname.empty()) {
define(DT_NEEDED, i);
i += file->soname.size() + 1;
}
}
define(DT_RELA, out::reldyn->shdr.sh_addr);
define(DT_RELASZ, out::reldyn->shdr.sh_size);
define(DT_RELAENT, sizeof(ELF64LE::Rela));
define(DT_JMPREL, out::relplt->shdr.sh_addr);
define(DT_PLTRELSZ, out::relplt->shdr.sh_size);
define(DT_PLTGOT, out::gotplt->shdr.sh_addr);
define(DT_PLTREL, DT_RELA);
define(DT_SYMTAB, out::dynsym->shdr.sh_addr);
define(DT_SYMENT, sizeof(ELF64LE::Sym));
define(DT_STRTAB, out::dynstr->shdr.sh_addr);
define(DT_STRSZ, out::dynstr->shdr.sh_size);
define(DT_HASH, out::hash->shdr.sh_addr);
define(DT_INIT_ARRAY, out::__init_array_start->value);
define(DT_INIT_ARRAYSZ, out::__init_array_end->value - out::__init_array_start->value);
define(DT_FINI_ARRAY, out::__fini_array_start->value);
define(DT_FINI_ARRAYSZ, out::__fini_array_end->value - out::__fini_array_start->value);
define(DT_NULL, 0);
return vec;
}
2020-11-17 07:34:02 +03:00
void RelPltSection::update_shdr() {
shdr.sh_link = out::dynsym->shndx;
}
2020-11-17 07:30:33 +03:00
void RelDynSection::update_shdr() {
shdr.sh_link = out::dynsym->shndx;
}
2020-11-17 07:51:44 +03:00
void StrtabSection::initialize_buf() {
out::buf[shdr.sh_offset] = '\0';
}
2020-11-17 06:20:56 +03:00
void ShstrtabSection::update_shdr() {
shdr.sh_size = 1;
for (OutputChunk *chunk : out::chunks) {
if (!chunk->name.empty()) {
chunk->shdr.sh_name = shdr.sh_size;
shdr.sh_size += chunk->name.size() + 1;
}
}
}
2020-11-17 07:56:40 +03:00
void ShstrtabSection::copy_buf() {
u8 *base = out::buf + shdr.sh_offset;
2020-11-17 06:20:56 +03:00
base[0] = '\0';
2020-11-17 07:19:54 +03:00
int i = 1;
2020-11-17 06:20:56 +03:00
for (OutputChunk *chunk : out::chunks) {
if (!chunk->name.empty()) {
2020-11-17 07:19:54 +03:00
write_string(base + i, chunk->name);
i += chunk->name.size() + 1;
2020-11-17 06:20:56 +03:00
}
}
}
2020-11-17 07:19:54 +03:00
u32 DynstrSection::add_string(StringRef str) {
u32 ret = shdr.sh_size;
shdr.sh_size += str.size() + 1;
contents.push_back(str);
return ret;
}
2020-11-17 07:56:40 +03:00
void DynstrSection::copy_buf() {
u8 *base = out::buf + shdr.sh_offset;
2020-11-17 07:19:54 +03:00
base[0] = '\0';
int i = 1;
for (StringRef s : contents) {
write_string(base + i, s);
i += s.size() + 1;
}
}
2020-11-17 07:32:22 +03:00
void SymtabSection::update_shdr() {
2020-11-17 08:47:43 +03:00
shdr.sh_link = out::strtab->shndx;
2020-11-17 08:40:24 +03:00
tbb::parallel_for_each(out::files,
[](ObjectFile *file) { file->compute_symtab(); });
2020-11-17 08:28:53 +03:00
local_symtab_off.resize(out::files.size() + 1);
local_strtab_off.resize(out::files.size() + 1);
global_symtab_off.resize(out::files.size() + 1);
global_strtab_off.resize(out::files.size() + 1);
local_symtab_off[0] = sizeof(ELF64LE::Sym);
local_strtab_off[0] = 1;
for (int i = 1; i < out::files.size() + 1; i++) {
local_symtab_off[i] = local_symtab_off[i - 1] + out::files[i - 1]->local_symtab_size;
local_strtab_off[i] = local_strtab_off[i - 1] + out::files[i - 1]->local_strtab_size;
}
shdr.sh_info = local_symtab_off.back() / sizeof(ELF64LE::Sym);
global_symtab_off[0] = local_symtab_off.back();
global_strtab_off[0] = local_strtab_off.back();
for (int i = 1; i < out::files.size() + 1; i++) {
global_symtab_off[i] =
global_symtab_off[i - 1] + out::files[i - 1]->global_symtab_size;
global_strtab_off[i] =
global_strtab_off[i - 1] + out::files[i - 1]->global_strtab_size;
}
2020-11-17 08:40:24 +03:00
shdr.sh_size = global_symtab_off.back();
out::strtab->shdr.sh_size = global_strtab_off.back();
2020-11-17 07:32:22 +03:00
}
2020-11-17 08:28:53 +03:00
void SymtabSection::copy_buf() {
2020-11-17 07:51:44 +03:00
memset(out::buf + shdr.sh_offset, 0, sizeof(ELF64LE::Sym));
2020-11-17 08:28:53 +03:00
tbb::parallel_for((size_t)0, out::files.size(), [&](size_t i) {
out::files[i]->write_local_symtab(local_symtab_off[i], local_strtab_off[i]);
out::files[i]->write_global_symtab(global_symtab_off[i], global_strtab_off[i]);
});
2020-11-17 07:51:44 +03:00
}
2020-11-16 18:43:32 +03:00
void DynamicSection::update_shdr() {
shdr.sh_size = create_dynamic_section().size() * 8;
shdr.sh_link = out::dynstr->shndx;
}
2020-11-17 07:56:40 +03:00
void DynamicSection::copy_buf() {
write_vector(out::buf + shdr.sh_offset, create_dynamic_section());
2020-11-16 18:33:41 +03:00
}
2020-10-22 10:35:17 +03:00
static StringRef get_output_name(StringRef name) {
static StringRef common_names[] = {
".text.", ".data.rel.ro.", ".data.", ".rodata.", ".bss.rel.ro.",
".bss.", ".init_array.", ".fini_array.", ".tbss.", ".tdata.",
};
for (StringRef s : common_names)
if (name.startswith(s) || name == s.drop_back())
return s.drop_back();
return name;
}
2020-10-27 06:45:59 +03:00
OutputSection *
OutputSection::get_instance(StringRef name, u64 flags, u32 type) {
2020-10-27 06:45:59 +03:00
name = get_output_name(name);
2020-11-07 04:13:19 +03:00
flags = flags & ~(u64)SHF_GROUP;
2020-10-22 10:35:17 +03:00
auto find = [&]() -> OutputSection * {
2020-10-28 08:06:35 +03:00
for (OutputSection *osec : OutputSection::instances)
2020-11-13 06:43:59 +03:00
if (name == osec->name && type == osec->shdr.sh_type &&
flags == (osec->shdr.sh_flags & ~SHF_GROUP))
2020-10-22 10:35:17 +03:00
return osec;
return nullptr;
};
// Search for an exiting output section.
static std::shared_mutex mu;
2020-11-07 04:13:19 +03:00
{
std::shared_lock lock(mu);
if (OutputSection *osec = find())
return osec;
}
2020-10-22 10:35:17 +03:00
// Create a new output section.
2020-11-07 04:13:19 +03:00
std::unique_lock lock(mu);
2020-10-22 10:35:17 +03:00
if (OutputSection *osec = find())
return osec;
2020-11-13 06:43:59 +03:00
return new OutputSection(name, type, flags);
2020-10-22 10:35:17 +03:00
}
2020-11-07 04:13:19 +03:00
2020-11-17 07:56:40 +03:00
void OutputSection::copy_buf() {
2020-11-09 16:25:17 +03:00
if (shdr.sh_type == llvm::ELF::SHT_NOBITS)
return;
2020-11-10 06:23:14 +03:00
int num_members = members.size();
tbb::parallel_for(0, num_members, [&](int i) {
if (members[i]->shdr.sh_type != SHT_NOBITS) {
// Copy section contents to an output file
2020-11-17 07:56:40 +03:00
members[i]->copy_buf();
2020-11-10 06:23:14 +03:00
// Zero-clear trailing padding
u64 this_end = members[i]->offset + members[i]->shdr.sh_size;
u64 next_start = (i == num_members - 1) ? shdr.sh_size : members[i + 1]->offset;
2020-11-17 07:56:40 +03:00
memset(out::buf + shdr.sh_offset + this_end, 0, next_start - this_end);
2020-11-10 06:23:14 +03:00
}
2020-11-09 16:25:17 +03:00
});
2020-11-09 15:32:13 +03:00
}
bool OutputSection::empty() const {
if (!members.empty())
for (InputChunk *mem : members)
if (mem->shdr.sh_size)
return false;
return true;
}
2020-11-17 07:51:44 +03:00
void GotPltSection::initialize_buf() {
u8 *base = out::buf + shdr.sh_offset;
2020-11-13 07:39:29 +03:00
memset(base, 0, shdr.sh_size);
if (out::dynamic)
*(u64 *)base = out::dynamic->shdr.sh_addr;
}
2020-11-17 07:51:44 +03:00
void PltSection::initialize_buf() {
2020-11-13 06:30:27 +03:00
const u8 data[] = {
0xff, 0x35, 0, 0, 0, 0, // pushq GOTPLT+8(%rip)
0xff, 0x25, 0, 0, 0, 0, // jmp *GOTPLT+16(%rip)
0x0f, 0x1f, 0x40, 0x00, // nop
};
2020-11-17 07:51:44 +03:00
u8 *base = out::buf + shdr.sh_offset;
2020-11-13 06:30:27 +03:00
memcpy(base, data, sizeof(data));
*(u32 *)(base + 2) = out::gotplt->shdr.sh_addr - shdr.sh_addr + 2;
*(u32 *)(base + 8) = out::gotplt->shdr.sh_addr - shdr.sh_addr + 4;
}
2020-11-17 07:57:53 +03:00
void PltSection::write_entry(Symbol *sym) {
2020-11-17 14:47:22 +03:00
u8 *base = out::buf + shdr.sh_offset + sym->plt_idx * PLT_SIZE;
2020-11-15 08:07:40 +03:00
2020-11-15 07:01:38 +03:00
if (sym->got_idx == -1) {
const u8 data[] = {
0xff, 0x25, 0, 0, 0, 0, // jmp *foo@GOTPLT
0x68, 0, 0, 0, 0, // push $index_in_relplt
0xe9, 0, 0, 0, 0, // jmp PLT[0]
};
memcpy(base, data, sizeof(data));
*(u32 *)(base + 2) = sym->get_gotplt_addr() - sym->get_plt_addr() - 6;
2020-11-17 14:47:22 +03:00
*(u32 *)(base + 7) = sym->relplt_idx;
2020-11-15 07:01:38 +03:00
*(u32 *)(base + 12) = shdr.sh_addr - sym->get_plt_addr() - 16;
} else {
const u8 data[] = {
2020-11-15 08:07:40 +03:00
0xff, 0x25, 0, 0, 0, 0, // jmp *foo@GOTPLT
2020-11-15 07:01:38 +03:00
0x66, 0x66, 0x66, 0x0f, 0x1f, 0x84, 0, 0, 0, 0, 0, // nop
};
memcpy(base, data, sizeof(data));
*(u32 *)(base + 2) = sym->get_got_addr() - sym->get_plt_addr() - 6;
}
2020-11-13 10:16:40 +03:00
}
2020-11-18 09:35:42 +03:00
void RelPltSection::write_entry(Symbol *sym) {
auto *rel = (ELF64LE::Rela *)(out::buf + out::relplt->shdr.sh_offset +
sym->relplt_idx * sizeof(ELF64LE::Rela));
memset(rel, 0, sizeof(*rel));
rel->setSymbol(sym->dynsym_idx, false);
rel->r_offset = sym->get_gotplt_addr();
if (sym->type == STT_GNU_IFUNC) {
rel->setType(R_X86_64_IRELATIVE, false);
rel->r_addend = sym->get_addr();
} else {
rel->setType(R_X86_64_JUMP_SLOT, false);
}
}
2020-11-17 14:22:52 +03:00
void DynsymSection::add_symbol(Symbol *sym) {
if (sym->dynsym_idx == -1) {
2020-11-16 17:48:20 +03:00
sym->dynsym_idx = symbols.size() + 1;
2020-11-17 07:19:54 +03:00
sym->dynstr_offset = out::dynstr->add_string(sym->name);
2020-11-16 17:48:20 +03:00
symbols.push_back(sym);
}
}
2020-11-16 19:30:24 +03:00
void DynsymSection::update_shdr() {
2020-11-16 17:40:01 +03:00
shdr.sh_link = out::dynstr->shndx;
2020-11-17 14:40:49 +03:00
shdr.sh_size = sizeof(ELF64LE::Sym) * (symbols.size() + 1);
2020-11-16 19:30:24 +03:00
}
2020-11-17 07:51:44 +03:00
void DynsymSection::initialize_buf() {
memset(out::buf + shdr.sh_offset, 0, sizeof(ELF64LE::Sym));
2020-11-16 17:40:01 +03:00
}
2020-11-17 07:56:40 +03:00
void DynsymSection::copy_buf() {
u8 *base = out::buf + shdr.sh_offset;
2020-11-16 17:48:20 +03:00
tbb::parallel_for_each(symbols, [&](Symbol *sym) {
2020-11-17 07:19:54 +03:00
auto &esym = *(ELF64LE::Sym *)(base + sym->dynsym_idx * sizeof(ELF64LE::Sym));
2020-11-16 17:48:20 +03:00
memset(&esym, 0, sizeof(esym));
esym.st_name = sym->dynstr_offset;
esym.setType(sym->type);
esym.setBinding(sym->esym->getBinding());
if (sym->file->is_dso || sym->esym->isUndefined()) {
esym.st_shndx = SHN_UNDEF;
} else if (!sym->input_section) {
esym.st_shndx = SHN_ABS;
esym.st_value = sym->get_addr();
} else {
esym.st_shndx = sym->input_section->output_section->shndx;
esym.st_value = sym->get_addr();
}
});
2020-11-16 17:58:40 +03:00
}
2020-11-16 18:10:38 +03:00
void HashSection::update_shdr() {
2020-11-16 17:58:40 +03:00
int header_size = 8;
int num_slots = out::dynsym->symbols.size() + 1;
shdr.sh_size = header_size + num_slots * 8;
2020-11-16 18:45:02 +03:00
shdr.sh_link = out::dynsym->shndx;
2020-11-16 17:58:40 +03:00
}
2020-11-17 07:56:40 +03:00
void HashSection::copy_buf() {
u8 *base = out::buf + shdr.sh_offset;
2020-11-16 17:58:40 +03:00
memset(base, 0, shdr.sh_size);
int num_slots = out::dynsym->symbols.size() + 1;
2020-11-16 18:08:53 +03:00
u32 *hdr = (u32 *)base;
2020-11-16 17:58:40 +03:00
u32 *buckets = (u32 *)(base + 8);
u32 *chains = buckets + num_slots;
hdr[0] = hdr[1] = num_slots;
2020-11-16 17:48:20 +03:00
2020-11-16 17:58:40 +03:00
for (Symbol *sym : out::dynsym->symbols) {
u32 i = hash(sym->name) % num_slots;
chains[sym->dynsym_idx] = buckets[i];
buckets[i] = sym->dynsym_idx;
}
2020-11-16 17:48:20 +03:00
}
2020-11-16 17:58:40 +03:00
u32 HashSection::hash(StringRef name) {
u32 h = 0;
for (char c : name) {
h = (h << 4) + c;
u32 g = h & 0xf0000000;
if (g != 0)
h ^= g >> 24;
h &= ~g;
}
return h;
2020-11-15 11:01:52 +03:00
}
2020-11-07 15:53:21 +03:00
MergedSection *
MergedSection::get_instance(StringRef name, u64 flags, u32 type) {
2020-11-07 04:13:19 +03:00
name = get_output_name(name);
flags = flags & ~(u64)SHF_MERGE & ~(u64)SHF_STRINGS;
2020-11-07 15:53:21 +03:00
auto find = [&]() -> MergedSection * {
for (MergedSection *osec : MergedSection::instances)
2020-11-07 04:13:19 +03:00
if (name == osec->name && flags == osec->shdr.sh_flags &&
type == osec->shdr.sh_type)
return osec;
return nullptr;
};
// Search for an exiting output section.
static std::shared_mutex mu;
{
std::shared_lock lock(mu);
2020-11-07 15:53:21 +03:00
if (MergedSection *osec = find())
2020-11-07 04:13:19 +03:00
return osec;
}
// Create a new output section.
std::unique_lock lock(mu);
2020-11-07 15:53:21 +03:00
if (MergedSection *osec = find())
2020-11-07 04:13:19 +03:00
return osec;
2020-11-07 15:53:21 +03:00
auto *osec = new MergedSection(name, flags, type);
MergedSection::instances.push_back(osec);
2020-11-07 04:13:19 +03:00
return osec;
}