2020-10-20 08:54:35 +03:00
|
|
|
#include "mold.h"
|
2020-10-02 07:28:26 +03:00
|
|
|
|
2020-12-13 15:07:50 +03:00
|
|
|
#include "tbb/global_control.h"
|
|
|
|
|
2020-11-09 05:58:48 +03:00
|
|
|
#include <fcntl.h>
|
2020-09-29 09:05:29 +03:00
|
|
|
#include <iostream>
|
2020-11-09 06:30:13 +03:00
|
|
|
#include <libgen.h>
|
2020-12-07 15:04:29 +03:00
|
|
|
#include <regex>
|
2020-11-09 05:58:48 +03:00
|
|
|
#include <sys/mman.h>
|
|
|
|
#include <sys/stat.h>
|
|
|
|
#include <sys/types.h>
|
|
|
|
#include <unistd.h>
|
2020-11-20 07:54:29 +03:00
|
|
|
#include <unordered_set>
|
2020-09-29 09:05:29 +03:00
|
|
|
|
2020-12-10 08:27:38 +03:00
|
|
|
// Maps the file at `path` into memory read-only and wraps the mapping
// in a heap-allocated MemoryMappedFile.
//
// Returns nullptr if the file cannot be opened. A failing fstat() or
// mmap() is reported through error().
MemoryMappedFile *open_input_file(std::string path) {
  const int descriptor = open(path.c_str(), O_RDONLY);
  if (descriptor == -1)
    return nullptr;

  struct stat info;
  if (fstat(descriptor, &info) == -1)
    error(path + ": stat failed");

  void *mapping =
    mmap(nullptr, info.st_size, PROT_READ, MAP_PRIVATE, descriptor, 0);
  if (mapping == MAP_FAILED)
    error(path + ": mmap failed: " + strerror(errno));

  // The descriptor is no longer needed once the mapping exists.
  close(descriptor);

  u8 *contents = (u8 *)mapping;
  return new MemoryMappedFile(path, contents, info.st_size);
}
|
|
|
|
|
2020-12-10 08:27:38 +03:00
|
|
|
// Same as open_input_file(), except that a file which cannot be opened
// is reported through error() instead of being signalled with a null
// pointer. The result is returned by value.
MemoryMappedFile must_open_input_file(std::string path) {
  if (MemoryMappedFile *file = open_input_file(path))
    return *file;
  error("cannot open " + path);
}
|
2020-11-09 05:58:48 +03:00
|
|
|
|
2020-12-12 07:08:40 +03:00
|
|
|
// Returns true if the file is at least four bytes long and each of its
// first four bytes is a printable character according to isprint().
static bool is_text_file(MemoryMappedFile mb) {
  if (mb.size < 4)
    return false;

  for (int i = 0; i < 4; i++)
    if (!isprint(mb.data[i]))
      return false;
  return true;
}
|
2020-12-10 16:51:38 +03:00
|
|
|
|
2020-12-19 12:08:15 +03:00
|
|
|
// Creates InputFile objects for the given file contents.
//
// The kind of file is detected from its leading bytes:
//   - "!<arch>\n": archive; one ObjectFile is created per member.
//   - "!<thin>\n": thin archive; every member path is opened and
//     wrapped in an ObjectFile. Members are opened in parallel.
//   - "\177ELF":   ET_REL yields an ObjectFile, ET_DYN a SharedFile.
//   - four printable leading bytes: the file is handed to
//     parse_linker_script().
// Anything else is reported through error().
//
// `as_needed` is forwarded to SharedFile and parse_linker_script().
std::vector<InputFile *> read_file(MemoryMappedFile mb, bool as_needed) {
  std::vector<InputFile *> vec;

  // Compare against a magic string only if the file is long enough to
  // contain it, so that a short file is never read past its end.
  auto has_magic = [&](const char *magic, size_t len) {
    return mb.size >= len && memcmp(mb.data, magic, len) == 0;
  };

  // .a
  if (has_magic("!<arch>\n", 8)) {
    for (MemoryMappedFile &child : read_fat_archive_members(mb))
      vec.push_back(new ObjectFile(child, mb.name));
    return vec;
  }

  // Thin .a
  if (has_magic("!<thin>\n", 8)) {
    std::vector<std::string> paths = read_thin_archive_members(mb);
    vec.resize(paths.size());

    // Each task writes to its own slot of `vec`.
    tbb::parallel_for(0, (int)paths.size(), [&](int i) {
      vec[i] = new ObjectFile(must_open_input_file(paths[i]), mb.name);
    });
    return vec;
  }

  if (has_magic("\177ELF", 4)) {
    // Reject truncated files before looking at any header field.
    if (mb.size < 20)
      error(mb.name + ": broken ELF file");

    ElfEhdr &ehdr = *(ElfEhdr *)mb.data;

    // .o
    if (ehdr.e_type == ET_REL) {
      vec.push_back(new ObjectFile(mb, ""));
      return vec;
    }

    // .so
    if (ehdr.e_type == ET_DYN) {
      vec.push_back(new SharedFile(mb, as_needed));
      return vec;
    }
  }

  // Linker script
  if (is_text_file(mb))
    return parse_linker_script(mb, as_needed);

  error(mb.name + ": unknown file type");
}
|
|
|
|
|
2020-10-28 07:42:05 +03:00
|
|
|
template <typename T>
|
2020-12-10 14:20:46 +03:00
|
|
|
static std::vector<std::span<T>> split(std::vector<T> &input, int unit) {
|
|
|
|
std::span<T> span(input);
|
|
|
|
std::vector<std::span<T>> vec;
|
2020-10-28 07:42:05 +03:00
|
|
|
|
2020-12-10 14:20:46 +03:00
|
|
|
while (span.size() >= unit) {
|
|
|
|
vec.push_back(span.subspan(0, unit));
|
|
|
|
span = span.subspan(unit);
|
2020-10-28 07:42:05 +03:00
|
|
|
}
|
2020-12-10 14:20:46 +03:00
|
|
|
if (!span.empty())
|
|
|
|
vec.push_back(span);
|
2020-10-28 07:42:05 +03:00
|
|
|
return vec;
|
|
|
|
}
|
|
|
|
|
2020-11-17 08:05:40 +03:00
|
|
|
static void resolve_symbols() {
|
2020-12-11 10:51:20 +03:00
|
|
|
ScopedTimer t("resolve_symbols");
|
2020-11-11 04:42:26 +03:00
|
|
|
|
2020-11-11 04:51:30 +03:00
|
|
|
// Register defined symbols
|
2020-11-24 08:31:05 +03:00
|
|
|
tbb::parallel_for_each(out::objs, [](ObjectFile *file) { file->resolve_symbols(); });
|
2020-11-24 10:22:32 +03:00
|
|
|
tbb::parallel_for_each(out::dsos, [](SharedFile *file) { file->resolve_symbols(); });
|
2020-11-11 04:42:26 +03:00
|
|
|
|
2020-11-30 10:43:47 +03:00
|
|
|
// Mark reachable objects and DSOs to decide which files to include
|
|
|
|
// into an output.
|
2020-11-11 04:42:26 +03:00
|
|
|
std::vector<ObjectFile *> root;
|
2020-11-24 07:56:14 +03:00
|
|
|
for (ObjectFile *file : out::objs)
|
2020-11-24 08:31:05 +03:00
|
|
|
if (file->is_alive)
|
2020-11-11 04:42:26 +03:00
|
|
|
root.push_back(file);
|
|
|
|
|
|
|
|
tbb::parallel_do(
|
|
|
|
root,
|
|
|
|
[&](ObjectFile *file, tbb::parallel_do_feeder<ObjectFile *> &feeder) {
|
2020-11-30 10:43:47 +03:00
|
|
|
file->mark_live_objects(feeder);
|
2020-11-11 04:42:26 +03:00
|
|
|
});
|
|
|
|
|
2020-11-30 10:43:47 +03:00
|
|
|
// Eliminate unused archive members and as-needed DSOs.
|
2020-12-13 16:31:50 +03:00
|
|
|
erase(out::objs, [](InputFile *file){ return !file->is_alive; });
|
|
|
|
erase(out::dsos, [](InputFile *file){ return !file->is_alive; });
|
2020-11-11 04:42:26 +03:00
|
|
|
}
|
|
|
|
|
2020-11-17 08:04:53 +03:00
|
|
|
static void eliminate_comdats() {
|
2020-12-11 10:51:20 +03:00
|
|
|
ScopedTimer t("comdat");
|
2020-11-11 04:42:26 +03:00
|
|
|
|
2020-11-24 07:56:14 +03:00
|
|
|
tbb::parallel_for_each(out::objs, [](ObjectFile *file) {
|
2020-11-08 12:17:24 +03:00
|
|
|
file->resolve_comdat_groups();
|
|
|
|
});
|
|
|
|
|
2020-11-24 07:56:14 +03:00
|
|
|
tbb::parallel_for_each(out::objs, [](ObjectFile *file) {
|
2020-11-08 12:17:24 +03:00
|
|
|
file->eliminate_duplicate_comdat_groups();
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
2020-11-17 08:04:53 +03:00
|
|
|
static void handle_mergeable_strings() {
|
2020-12-11 10:51:20 +03:00
|
|
|
ScopedTimer t("resolve_strings");
|
2020-11-11 04:42:26 +03:00
|
|
|
|
2020-11-07 15:53:21 +03:00
|
|
|
// Resolve mergeable string pieces
|
2020-11-24 07:56:14 +03:00
|
|
|
tbb::parallel_for_each(out::objs, [](ObjectFile *file) {
|
2020-12-13 19:18:25 +03:00
|
|
|
for (MergeableSection *m : file->mergeable_sections) {
|
|
|
|
for (StringPieceRef &ref : m->pieces) {
|
2020-11-08 08:13:59 +03:00
|
|
|
MergeableSection *cur = ref.piece->isec;
|
2020-12-13 19:18:25 +03:00
|
|
|
while (!cur || cur->file->priority > m->file->priority)
|
|
|
|
if (ref.piece->isec.compare_exchange_weak(cur, m))
|
2020-11-07 15:53:21 +03:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
});
|
|
|
|
|
|
|
|
// Calculate the total bytes of mergeable strings for each input section.
|
2020-11-24 07:56:14 +03:00
|
|
|
tbb::parallel_for_each(out::objs, [](ObjectFile *file) {
|
2020-12-13 19:18:25 +03:00
|
|
|
for (MergeableSection *m : file->mergeable_sections) {
|
2020-11-07 15:53:21 +03:00
|
|
|
u32 offset = 0;
|
2020-12-13 19:18:25 +03:00
|
|
|
for (StringPieceRef &ref : m->pieces) {
|
2020-11-10 11:18:10 +03:00
|
|
|
StringPiece &piece = *ref.piece;
|
2020-12-13 19:18:25 +03:00
|
|
|
if (piece.isec == m && piece.output_offset == -1) {
|
2020-11-07 15:53:21 +03:00
|
|
|
ref.piece->output_offset = offset;
|
2020-12-13 19:58:58 +03:00
|
|
|
offset += ref.piece->size;
|
2020-11-07 15:53:21 +03:00
|
|
|
}
|
|
|
|
}
|
2020-12-13 19:18:25 +03:00
|
|
|
m->size = offset;
|
2020-11-07 15:53:21 +03:00
|
|
|
}
|
|
|
|
});
|
|
|
|
|
|
|
|
// Assign each mergeable input section a unique index.
|
2020-11-24 07:56:14 +03:00
|
|
|
for (ObjectFile *file : out::objs) {
|
2020-12-13 19:18:25 +03:00
|
|
|
for (MergeableSection *m : file->mergeable_sections) {
|
2020-12-13 19:21:39 +03:00
|
|
|
m->offset = m->parent.shdr.sh_size;
|
|
|
|
m->parent.shdr.sh_size += m->size;
|
2020-11-07 15:53:21 +03:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-11-11 04:51:30 +03:00
|
|
|
// So far, each input section has a pointer to its corresponding
|
|
|
|
// output section, but there's no reverse edge to get a list of
|
|
|
|
// input sections from an output section. This function creates it.
|
|
|
|
//
|
|
|
|
// An output section may contain millions of input sections.
|
|
|
|
// So, we append input sections to output sections in parallel.
|
2020-11-17 08:04:53 +03:00
|
|
|
static void bin_sections() {
|
2020-12-11 10:51:20 +03:00
|
|
|
ScopedTimer t("bin_sections");
|
2020-11-11 04:42:26 +03:00
|
|
|
|
2020-11-24 07:56:14 +03:00
|
|
|
int unit = (out::objs.size() + 127) / 128;
|
2020-12-10 14:20:46 +03:00
|
|
|
std::vector<std::span<ObjectFile *>> slices = split(out::objs, unit);
|
2020-10-26 07:36:56 +03:00
|
|
|
|
2020-11-08 04:05:59 +03:00
|
|
|
int num_osec = OutputSection::instances.size();
|
|
|
|
|
2020-11-08 06:36:08 +03:00
|
|
|
std::vector<std::vector<std::vector<InputChunk *>>> groups(slices.size());
|
2020-10-28 08:22:25 +03:00
|
|
|
for (int i = 0; i < groups.size(); i++)
|
2020-11-08 04:05:59 +03:00
|
|
|
groups[i].resize(num_osec);
|
2020-10-28 08:06:35 +03:00
|
|
|
|
|
|
|
tbb::parallel_for(0, (int)slices.size(), [&](int i) {
|
|
|
|
for (ObjectFile *file : slices[i]) {
|
|
|
|
for (InputSection *isec : file->sections) {
|
|
|
|
if (!isec)
|
|
|
|
continue;
|
|
|
|
OutputSection *osec = isec->output_section;
|
2020-10-28 08:22:25 +03:00
|
|
|
groups[i][osec->idx].push_back(isec);
|
2020-10-28 08:06:35 +03:00
|
|
|
}
|
|
|
|
}
|
|
|
|
});
|
|
|
|
|
2020-11-08 04:05:59 +03:00
|
|
|
std::vector<int> sizes(num_osec);
|
2020-10-26 07:36:56 +03:00
|
|
|
|
2020-12-10 14:20:46 +03:00
|
|
|
for (std::span<std::vector<InputChunk *>> group : groups)
|
2020-10-28 08:22:25 +03:00
|
|
|
for (int i = 0; i < group.size(); i++)
|
|
|
|
sizes[i] += group[i].size();
|
2020-11-08 03:44:27 +03:00
|
|
|
|
2020-11-08 04:05:59 +03:00
|
|
|
tbb::parallel_for(0, num_osec, [&](int j) {
|
2020-11-08 06:42:40 +03:00
|
|
|
OutputSection::instances[j]->members.reserve(sizes[j]);
|
2020-11-08 04:06:36 +03:00
|
|
|
|
2020-11-08 04:05:59 +03:00
|
|
|
for (int i = 0; i < groups.size(); i++) {
|
2020-11-08 06:42:40 +03:00
|
|
|
std::vector<InputChunk *> §ions = OutputSection::instances[j]->members;
|
2020-11-08 04:05:59 +03:00
|
|
|
sections.insert(sections.end(), groups[i][j].begin(), groups[i][j].end());
|
2020-10-28 08:06:35 +03:00
|
|
|
}
|
2020-11-08 04:05:59 +03:00
|
|
|
});
|
2020-10-26 07:36:56 +03:00
|
|
|
}
|
2020-10-22 17:19:48 +03:00
|
|
|
|
2020-11-26 12:09:32 +03:00
|
|
|
static void check_duplicate_symbols() {
|
2020-12-11 10:51:20 +03:00
|
|
|
ScopedTimer t("check_undef_syms");
|
2020-11-20 11:12:45 +03:00
|
|
|
|
2020-11-30 12:19:33 +03:00
|
|
|
auto is_error = [](ObjectFile *file, int i) {
|
2020-12-10 09:10:18 +03:00
|
|
|
const ElfSym &esym = file->elf_syms[i];
|
2020-11-30 12:19:33 +03:00
|
|
|
Symbol &sym = *file->symbols[i];
|
2020-12-10 09:31:54 +03:00
|
|
|
bool is_weak = (esym.st_bind == STB_WEAK);
|
2020-12-01 15:07:00 +03:00
|
|
|
bool is_eliminated =
|
2020-12-10 09:31:54 +03:00
|
|
|
!esym.is_abs() && !esym.is_common() && !file->sections[esym.st_shndx];
|
|
|
|
return esym.is_defined() && !is_weak && !is_eliminated && sym.file != file;
|
2020-11-30 12:19:33 +03:00
|
|
|
};
|
|
|
|
|
|
|
|
tbb::parallel_for_each(out::objs, [&](ObjectFile *file) {
|
2020-11-26 12:09:32 +03:00
|
|
|
if (!file->is_alive)
|
2020-11-20 11:12:45 +03:00
|
|
|
return;
|
|
|
|
|
2020-11-26 12:09:32 +03:00
|
|
|
for (int i = file->first_global; i < file->elf_syms.size(); i++) {
|
2020-11-30 12:19:33 +03:00
|
|
|
if (is_error(file, i)) {
|
2020-11-26 12:09:32 +03:00
|
|
|
file->has_error = true;
|
2020-11-20 11:12:45 +03:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
});
|
|
|
|
|
2020-11-30 12:19:33 +03:00
|
|
|
for (ObjectFile *file : out::objs)
|
|
|
|
if (file->has_error)
|
|
|
|
for (int i = file->first_global; i < file->elf_syms.size(); i++)
|
|
|
|
if (is_error(file, i))
|
2020-12-11 03:15:08 +03:00
|
|
|
std::cerr << "duplicate symbol: " << to_string(file)
|
|
|
|
<< ": " << to_string(file->symbols[i]->file) << ": "
|
2020-12-10 16:33:28 +03:00
|
|
|
<< file->symbols[i]->name << "\n";
|
2020-11-20 11:12:45 +03:00
|
|
|
|
2020-11-26 12:09:32 +03:00
|
|
|
for (ObjectFile *file : out::objs)
|
|
|
|
if (file->has_error)
|
|
|
|
_exit(1);
|
2020-11-20 11:12:45 +03:00
|
|
|
}
|
|
|
|
|
2020-10-26 08:18:00 +03:00
|
|
|
static void set_isec_offsets() {
|
2020-12-11 10:51:20 +03:00
|
|
|
ScopedTimer t("isec_offsets");
|
2020-11-11 04:42:26 +03:00
|
|
|
|
2020-11-07 18:47:34 +03:00
|
|
|
tbb::parallel_for_each(OutputSection::instances, [&](OutputSection *osec) {
|
2020-11-08 06:42:40 +03:00
|
|
|
if (osec->members.empty())
|
2020-10-27 07:52:10 +03:00
|
|
|
return;
|
|
|
|
|
2020-12-10 14:20:46 +03:00
|
|
|
std::vector<std::span<InputChunk *>> slices = split(osec->members, 10000);
|
2020-10-29 10:27:11 +03:00
|
|
|
std::vector<u64> size(slices.size());
|
|
|
|
std::vector<u32> alignments(slices.size());
|
2020-10-26 08:18:00 +03:00
|
|
|
|
2020-10-28 07:42:05 +03:00
|
|
|
tbb::parallel_for(0, (int)slices.size(), [&](int i) {
|
2020-10-29 10:27:11 +03:00
|
|
|
u64 off = 0;
|
|
|
|
u32 align = 1;
|
2020-10-26 10:12:35 +03:00
|
|
|
|
2020-11-08 06:36:08 +03:00
|
|
|
for (InputChunk *isec : slices[i]) {
|
2020-10-26 10:12:35 +03:00
|
|
|
off = align_to(off, isec->shdr.sh_addralign);
|
|
|
|
isec->offset = off;
|
|
|
|
off += isec->shdr.sh_size;
|
2020-10-29 10:27:11 +03:00
|
|
|
align = std::max<u32>(align, isec->shdr.sh_addralign);
|
2020-10-26 10:12:35 +03:00
|
|
|
}
|
|
|
|
|
|
|
|
size[i] = off;
|
|
|
|
alignments[i] = align;
|
|
|
|
});
|
|
|
|
|
2020-10-29 10:27:11 +03:00
|
|
|
u32 align = *std::max_element(alignments.begin(), alignments.end());
|
2020-10-26 10:12:35 +03:00
|
|
|
|
2020-10-29 10:27:11 +03:00
|
|
|
std::vector<u64> start(slices.size());
|
2020-10-28 07:42:05 +03:00
|
|
|
for (int i = 1; i < slices.size(); i++)
|
2020-11-10 06:23:14 +03:00
|
|
|
start[i] = align_to(start[i - 1] + size[i - 1], align);
|
2020-10-26 10:58:49 +03:00
|
|
|
|
2020-10-28 07:42:05 +03:00
|
|
|
tbb::parallel_for(1, (int)slices.size(), [&](int i) {
|
2020-11-08 06:36:08 +03:00
|
|
|
for (InputChunk *isec : slices[i])
|
2020-10-26 10:12:35 +03:00
|
|
|
isec->offset += start[i];
|
|
|
|
});
|
|
|
|
|
|
|
|
osec->shdr.sh_size = start.back() + size.back();
|
2020-10-26 08:18:00 +03:00
|
|
|
osec->shdr.sh_addralign = align;
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
2020-11-29 05:10:33 +03:00
|
|
|
static void scan_rels() {
|
2020-12-11 10:51:20 +03:00
|
|
|
ScopedTimer t("scan_rels");
|
2020-11-15 10:19:21 +03:00
|
|
|
|
2020-11-29 05:10:33 +03:00
|
|
|
// Scan relocations to find dynamic symbols.
|
2020-11-24 07:56:14 +03:00
|
|
|
tbb::parallel_for_each(out::objs, [&](ObjectFile *file) {
|
2020-12-16 14:56:04 +03:00
|
|
|
for (InputSection *isec : file->sections) {
|
2020-11-15 10:19:21 +03:00
|
|
|
if (isec)
|
|
|
|
isec->scan_relocations();
|
2020-12-16 14:56:04 +03:00
|
|
|
}
|
2020-11-17 14:54:13 +03:00
|
|
|
});
|
2020-11-17 13:56:02 +03:00
|
|
|
|
2020-11-29 05:10:33 +03:00
|
|
|
// If there was a relocation that refers an undefined symbol,
|
|
|
|
// report an error.
|
2020-11-26 12:09:32 +03:00
|
|
|
for (ObjectFile *file : out::objs)
|
|
|
|
if (file->has_error)
|
|
|
|
for (InputSection *isec : file->sections)
|
|
|
|
if (isec)
|
|
|
|
isec->report_undefined_symbols();
|
|
|
|
|
|
|
|
for (ObjectFile *file : out::objs)
|
|
|
|
if (file->has_error)
|
|
|
|
_exit(1);
|
|
|
|
|
2020-11-29 05:10:33 +03:00
|
|
|
// Aggregate dynamic symbols to a single vector.
|
2020-11-24 10:22:32 +03:00
|
|
|
std::vector<InputFile *> files;
|
|
|
|
files.insert(files.end(), out::objs.begin(), out::objs.end());
|
|
|
|
files.insert(files.end(), out::dsos.begin(), out::dsos.end());
|
|
|
|
|
2020-11-24 08:31:05 +03:00
|
|
|
std::vector<std::vector<Symbol *>> vec(files.size());
|
2020-11-17 14:54:13 +03:00
|
|
|
|
2020-11-24 08:31:05 +03:00
|
|
|
tbb::parallel_for(0, (int)files.size(), [&](int i) {
|
|
|
|
for (Symbol *sym : files[i]->symbols)
|
2020-12-13 14:18:49 +03:00
|
|
|
if (sym->file == files[i])
|
2020-12-16 12:38:13 +03:00
|
|
|
if (sym->flags)
|
2020-12-13 14:18:49 +03:00
|
|
|
vec[i].push_back(sym);
|
2020-11-15 07:01:38 +03:00
|
|
|
});
|
2020-11-06 06:01:52 +03:00
|
|
|
|
2020-11-29 05:10:33 +03:00
|
|
|
// Assign offsets in additional tables for each dynamic symbol.
|
|
|
|
for (Symbol *sym : flatten(vec)) {
|
2020-12-16 14:56:04 +03:00
|
|
|
if (sym->is_imported || (sym->flags & NEEDS_DYNSYM))
|
2020-12-13 15:57:45 +03:00
|
|
|
out::dynsym->add_symbol(sym);
|
|
|
|
|
2020-12-16 12:38:13 +03:00
|
|
|
if (sym->flags & NEEDS_GOT)
|
2020-11-21 06:49:28 +03:00
|
|
|
out::got->add_got_symbol(sym);
|
2020-11-06 07:54:37 +03:00
|
|
|
|
2020-12-16 12:38:13 +03:00
|
|
|
if (sym->flags & NEEDS_PLT)
|
2020-11-18 15:45:49 +03:00
|
|
|
out::plt->add_symbol(sym);
|
2020-11-17 14:22:52 +03:00
|
|
|
|
2020-12-16 12:38:13 +03:00
|
|
|
if (sym->flags & NEEDS_GOTTPOFF)
|
2020-11-21 04:48:51 +03:00
|
|
|
out::got->add_gottpoff_symbol(sym);
|
2020-11-17 14:22:52 +03:00
|
|
|
|
2020-12-16 12:38:13 +03:00
|
|
|
if (sym->flags & NEEDS_TLSGD)
|
2020-11-21 04:48:23 +03:00
|
|
|
out::got->add_tlsgd_symbol(sym);
|
|
|
|
|
2020-12-16 12:38:13 +03:00
|
|
|
if (sym->flags & NEEDS_TLSLD)
|
2020-11-21 04:48:23 +03:00
|
|
|
out::got->add_tlsld_symbol(sym);
|
2020-11-25 11:20:48 +03:00
|
|
|
|
2020-12-16 12:38:13 +03:00
|
|
|
if (sym->flags & NEEDS_COPYREL) {
|
2020-11-25 11:20:48 +03:00
|
|
|
out::copyrel->add_symbol(sym);
|
2020-11-25 14:35:04 +03:00
|
|
|
assert(sym->file->is_dso);
|
|
|
|
|
|
|
|
for (Symbol *alias : ((SharedFile *)sym->file)->find_aliases(sym)) {
|
2020-11-29 05:06:11 +03:00
|
|
|
if (sym == alias)
|
|
|
|
continue;
|
|
|
|
assert(alias->copyrel_offset == -1);
|
2020-11-25 14:35:04 +03:00
|
|
|
alias->copyrel_offset = sym->copyrel_offset;
|
|
|
|
out::dynsym->add_symbol(alias);
|
|
|
|
}
|
|
|
|
}
|
2020-11-18 15:45:49 +03:00
|
|
|
}
|
2020-11-16 16:25:58 +03:00
|
|
|
}
|
2020-11-11 11:25:00 +03:00
|
|
|
|
2020-12-07 09:50:13 +03:00
|
|
|
static void export_dynamic() {
|
2020-12-11 10:51:20 +03:00
|
|
|
ScopedTimer t("export_dynamic");
|
2020-12-07 15:04:29 +03:00
|
|
|
|
|
|
|
tbb::parallel_for(0, (int)out::objs.size(), [&](int i) {
|
|
|
|
ObjectFile *file = out::objs[i];
|
2020-12-10 14:20:46 +03:00
|
|
|
for (Symbol *sym : std::span(file->symbols).subspan(file->first_global))
|
2020-12-07 16:13:42 +03:00
|
|
|
if (sym->file == file && config.export_dynamic)
|
2020-12-07 15:04:29 +03:00
|
|
|
sym->ver_idx = VER_NDX_GLOBAL;
|
|
|
|
});
|
2020-12-07 16:13:42 +03:00
|
|
|
|
2020-12-10 07:44:58 +03:00
|
|
|
for (std::string_view name : config.globals)
|
2020-12-07 16:13:42 +03:00
|
|
|
Symbol::intern(name)->ver_idx = VER_NDX_GLOBAL;
|
2020-12-07 15:04:29 +03:00
|
|
|
|
2020-12-07 09:50:13 +03:00
|
|
|
std::vector<std::vector<Symbol *>> vec(out::objs.size());
|
|
|
|
|
|
|
|
tbb::parallel_for(0, (int)out::objs.size(), [&](int i) {
|
2020-12-07 10:19:56 +03:00
|
|
|
ObjectFile *file = out::objs[i];
|
2020-12-10 14:20:46 +03:00
|
|
|
for (Symbol *sym : std::span(file->symbols).subspan(file->first_global))
|
2020-12-07 15:04:29 +03:00
|
|
|
if (sym->file == file && sym->ver_idx != VER_NDX_LOCAL)
|
2020-12-07 09:50:13 +03:00
|
|
|
vec[i].push_back(sym);
|
|
|
|
});
|
|
|
|
|
|
|
|
for (Symbol *sym : flatten(vec))
|
|
|
|
out::dynsym->add_symbol(sym);
|
|
|
|
}
|
|
|
|
|
2020-11-29 05:40:57 +03:00
|
|
|
static void fill_symbol_versions() {
|
2020-12-11 10:51:20 +03:00
|
|
|
ScopedTimer t("fill_symbol_versions");
|
2020-11-29 05:40:57 +03:00
|
|
|
|
2020-11-29 05:57:58 +03:00
|
|
|
// Create a list of versioned symbols and sort by file and version.
|
2020-11-29 05:40:57 +03:00
|
|
|
std::vector<Symbol *> syms = out::dynsym->symbols;
|
2020-12-13 16:31:50 +03:00
|
|
|
erase(syms, [](Symbol *sym){ return sym->ver_idx < 2; });
|
2020-11-29 05:40:57 +03:00
|
|
|
|
2020-11-29 05:57:58 +03:00
|
|
|
if (syms.empty())
|
|
|
|
return;
|
|
|
|
|
2020-11-29 05:40:57 +03:00
|
|
|
std::stable_sort(syms.begin(), syms.end(), [](Symbol *a, Symbol *b) {
|
|
|
|
SharedFile *x = (SharedFile *)a->file;
|
|
|
|
SharedFile *y = (SharedFile *)b->file;
|
2020-11-30 11:52:08 +03:00
|
|
|
return std::make_tuple(x->soname, a->ver_idx) <
|
|
|
|
std::make_tuple(y->soname, b->ver_idx);
|
2020-11-29 05:40:57 +03:00
|
|
|
});
|
|
|
|
|
2020-11-29 05:57:58 +03:00
|
|
|
// Compute sizes of .gnu.version and .gnu.version_r sections.
|
2020-11-29 07:02:51 +03:00
|
|
|
out::versym->contents.resize(out::dynsym->symbols.size() + 1, 1);
|
2020-11-29 05:57:58 +03:00
|
|
|
out::versym->contents[0] = 0;
|
|
|
|
|
2020-12-10 15:18:20 +03:00
|
|
|
int sz = sizeof(ElfVerneed) + sizeof(ElfVernaux);
|
2020-11-29 05:57:58 +03:00
|
|
|
for (int i = 1; i < syms.size(); i++) {
|
|
|
|
if (syms[i - 1]->file != syms[i]->file)
|
2020-12-10 15:18:20 +03:00
|
|
|
sz += sizeof(ElfVerneed) + sizeof(ElfVernaux);
|
2020-11-29 05:57:58 +03:00
|
|
|
else if (syms[i - 1]->ver_idx != syms[i]->ver_idx)
|
2020-12-10 15:18:20 +03:00
|
|
|
sz += sizeof(ElfVernaux);
|
2020-11-29 05:40:57 +03:00
|
|
|
}
|
2020-11-29 05:57:58 +03:00
|
|
|
out::verneed->contents.resize(sz);
|
|
|
|
|
|
|
|
// Fill .gnu.versoin_r.
|
|
|
|
u8 *buf = (u8 *)&out::verneed->contents[0];
|
2020-11-29 06:59:08 +03:00
|
|
|
u16 version = 1;
|
2020-12-10 15:18:20 +03:00
|
|
|
ElfVerneed *verneed = nullptr;
|
|
|
|
ElfVernaux *aux = nullptr;
|
2020-11-29 06:59:08 +03:00
|
|
|
|
2020-11-29 08:05:44 +03:00
|
|
|
auto add_aux = [&](Symbol *sym) {
|
2020-11-29 06:59:08 +03:00
|
|
|
SharedFile *file = (SharedFile *)sym->file;
|
2020-12-10 07:44:58 +03:00
|
|
|
std::string_view verstr = file->version_strings[sym->ver_idx];
|
2020-11-29 06:59:08 +03:00
|
|
|
|
2020-11-29 08:05:44 +03:00
|
|
|
verneed->vn_cnt += 1;
|
|
|
|
if (aux)
|
2020-12-10 15:18:20 +03:00
|
|
|
aux->vna_next = sizeof(ElfVernaux);
|
2020-11-29 08:05:44 +03:00
|
|
|
|
2020-12-10 15:18:20 +03:00
|
|
|
aux = (ElfVernaux *)buf;
|
2020-11-29 06:59:08 +03:00
|
|
|
buf += sizeof(*aux);
|
|
|
|
aux->vna_hash = elf_hash(verstr);
|
|
|
|
aux->vna_other = ++version;
|
|
|
|
aux->vna_name = out::dynstr->add_string(verstr);
|
|
|
|
};
|
|
|
|
|
2020-11-29 08:05:44 +03:00
|
|
|
auto add_verneed = [&](Symbol *sym) {
|
2020-11-29 06:59:08 +03:00
|
|
|
SharedFile *file = (SharedFile *)sym->file;
|
|
|
|
|
2020-11-29 08:05:44 +03:00
|
|
|
out::verneed->shdr.sh_info += 1;
|
|
|
|
if (verneed)
|
|
|
|
verneed->vn_next = buf - (u8 *)verneed;
|
|
|
|
|
2020-12-10 15:18:20 +03:00
|
|
|
verneed = (ElfVerneed *)buf;
|
2020-11-29 08:05:44 +03:00
|
|
|
buf += sizeof(*verneed);
|
|
|
|
verneed->vn_version = 1;
|
2020-11-30 11:52:08 +03:00
|
|
|
verneed->vn_file = out::dynstr->find_string(file->soname);
|
2020-12-10 15:18:20 +03:00
|
|
|
verneed->vn_aux = sizeof(ElfVerneed);
|
2020-11-29 08:05:44 +03:00
|
|
|
|
|
|
|
aux = nullptr;
|
|
|
|
add_aux(sym);
|
2020-11-29 06:59:08 +03:00
|
|
|
};
|
|
|
|
|
2020-11-29 08:05:44 +03:00
|
|
|
add_verneed(syms[0]);
|
2020-11-29 07:14:56 +03:00
|
|
|
out::versym->contents[syms[0]->dynsym_idx] = version;
|
|
|
|
|
2020-11-29 06:59:08 +03:00
|
|
|
for (int i = 1; i < syms.size(); i++) {
|
|
|
|
if (syms[i - 1]->file != syms[i]->file)
|
2020-11-29 08:05:44 +03:00
|
|
|
add_verneed(syms[i]);
|
2020-11-29 06:59:08 +03:00
|
|
|
else if (syms[i - 1]->ver_idx != syms[i]->ver_idx)
|
2020-11-29 08:05:44 +03:00
|
|
|
add_aux(syms[i]);
|
2020-11-29 06:59:08 +03:00
|
|
|
out::versym->contents[syms[i]->dynsym_idx] = version;
|
|
|
|
}
|
2020-11-29 05:40:57 +03:00
|
|
|
}
|
|
|
|
|
2020-11-17 07:59:24 +03:00
|
|
|
// Zero-fills the gaps in out::buf between consecutive output chunks,
// and the gap between the last chunk and `filesize`.
static void clear_padding(u64 filesize) {
  ScopedTimer t("clear_padding");

  // Clears the bytes from the end of `chunk` up to `gap_end`. The size
  // of an SHT_NOBITS chunk is not added, so its gap begins at its file
  // offset.
  auto zero_gap = [](OutputChunk *chunk, u64 gap_end) {
    u64 gap_begin = chunk->shdr.sh_offset;
    if (chunk->shdr.sh_type != SHT_NOBITS)
      gap_begin += chunk->shdr.sh_size;

    memset(out::buf + gap_begin, 0, gap_end - gap_begin);
  };

  for (int i = 0; i + 1 < out::chunks.size(); i++)
    zero_gap(out::chunks[i], out::chunks[i + 1]->shdr.sh_offset);

  zero_gap(out::chunks.back(), filesize);
}
|
|
|
|
|
2020-10-22 12:54:51 +03:00
|
|
|
// We want to sort output sections in the following order.
|
|
|
|
//
|
2020-10-22 17:19:48 +03:00
|
|
|
// alloc readonly data
|
|
|
|
// alloc readonly code
|
|
|
|
// alloc writable tdata
|
|
|
|
// alloc writable tbss
|
|
|
|
// alloc writable data
|
|
|
|
// alloc writable bss
|
|
|
|
// nonalloc
|
2020-12-10 09:59:24 +03:00
|
|
|
static int get_section_rank(const ElfShdr &shdr) {
|
2020-10-29 12:31:06 +03:00
|
|
|
bool alloc = shdr.sh_flags & SHF_ALLOC;
|
|
|
|
bool writable = shdr.sh_flags & SHF_WRITE;
|
|
|
|
bool exec = shdr.sh_flags & SHF_EXECINSTR;
|
|
|
|
bool tls = shdr.sh_flags & SHF_TLS;
|
2020-10-30 06:47:35 +03:00
|
|
|
bool nobits = shdr.sh_type == SHT_NOBITS;
|
2020-11-17 08:50:18 +03:00
|
|
|
return (!alloc << 5) | (writable << 4) | (exec << 3) | (!tls << 2) | nobits;
|
2020-10-22 12:54:51 +03:00
|
|
|
}
|
|
|
|
|
2020-12-10 14:20:46 +03:00
|
|
|
// Assigns a file offset to every chunk, and a virtual address to every
// chunk with SHF_ALLOC set, in the order given. Virtual addresses start
// at config.image_base. Returns the file offset following the last
// chunk.
static u64 set_osec_offsets(std::span<OutputChunk *> chunks) {
  ScopedTimer t("osec_offset");

  u64 fileoff = 0;
  u64 vaddr = config.image_base;

  for (OutputChunk *chunk : chunks) {
    auto &shdr = chunk->shdr;

    if (chunk->starts_new_ptload)
      vaddr = align_to(vaddr, PAGE_SIZE);

    // Advance the file offset until it has the same position within a
    // page as the virtual address.
    const u64 vaddr_rem = vaddr % PAGE_SIZE;
    const u64 file_rem = fileoff % PAGE_SIZE;

    if (vaddr_rem > file_rem)
      fileoff += vaddr_rem - file_rem;
    else if (vaddr_rem < file_rem)
      fileoff = align_to(fileoff, PAGE_SIZE) + vaddr_rem;

    fileoff = align_to(fileoff, shdr.sh_addralign);
    vaddr = align_to(vaddr, shdr.sh_addralign);

    shdr.sh_offset = fileoff;
    if (shdr.sh_flags & SHF_ALLOC)
      shdr.sh_addr = vaddr;

    // An SHT_NOBITS chunk does not advance the file offset, and one
    // that also has SHF_TLS set does not advance the address either.
    const bool is_bss = (shdr.sh_type == SHT_NOBITS);
    const bool is_tbss = is_bss && (shdr.sh_flags & SHF_TLS);

    if (!is_bss)
      fileoff += shdr.sh_size;
    if (!is_tbss)
      vaddr += shdr.sh_size;
  }

  return fileoff;
}
|
|
|
|
|
2020-12-10 14:20:46 +03:00
|
|
|
// Sets the section index and value of the linker-synthesized symbols
// from the addresses and sizes of the given output chunks.
static void fix_synthetic_symbols(std::span<OutputChunk *> chunks) {
  // Makes `sym` point to the beginning of `chunk`. A null symbol is
  // ignored.
  auto start = [](OutputChunk *chunk, Symbol *sym) {
    if (!sym)
      return;
    sym->shndx = chunk->shndx;
    sym->value = chunk->shdr.sh_addr;
  };

  // Makes `sym` point to the address right after `chunk`. A null symbol
  // is ignored.
  auto stop = [](OutputChunk *chunk, Symbol *sym) {
    if (!sym)
      return;
    sym->shndx = chunk->shndx;
    sym->value = chunk->shdr.sh_addr + chunk->shdr.sh_size;
  };

  // __bss_start: the first regular chunk named ".bss".
  for (OutputChunk *chunk : chunks) {
    if (chunk->kind != OutputChunk::REGULAR || chunk->name != ".bss")
      continue;
    start(chunk, out::__bss_start);
    break;
  }

  // __ehdr_start: set only if there is a chunk with section index 1.
  for (OutputChunk *chunk : chunks) {
    if (chunk->shndx != 1)
      continue;
    out::__ehdr_start->shndx = 1;
    out::__ehdr_start->value = out::ehdr->shdr.sh_addr;
    break;
  }

  // __rela_iplt_start and __rela_iplt_end
  start(out::relplt, out::__rela_iplt_start);
  stop(out::relplt, out::__rela_iplt_end);

  // __{init,fini}_array_{start,end}
  for (OutputChunk *chunk : chunks) {
    if (chunk->shdr.sh_type == SHT_INIT_ARRAY) {
      start(chunk, out::__init_array_start);
      stop(chunk, out::__init_array_end);
    } else if (chunk->shdr.sh_type == SHT_FINI_ARRAY) {
      start(chunk, out::__fini_array_start);
      stop(chunk, out::__fini_array_end);
    }
  }

  // _end, end, _etext, etext, _edata and edata. Every matching chunk
  // overwrites the symbol, so the last matching chunk wins.
  for (OutputChunk *chunk : chunks) {
    if (chunk->kind == OutputChunk::HEADER)
      continue;

    const bool is_alloc = (chunk->shdr.sh_flags & SHF_ALLOC);
    const bool is_exec = (chunk->shdr.sh_flags & SHF_EXECINSTR);
    const bool is_nobits = (chunk->shdr.sh_type == SHT_NOBITS);

    if (is_alloc)
      stop(chunk, out::_end);

    if (is_exec)
      stop(chunk, out::_etext);

    if (!is_nobits && is_alloc)
      stop(chunk, out::_edata);
  }

  // _DYNAMIC
  if (out::dynamic)
    start(out::dynamic, out::_DYNAMIC);

  // _GLOBAL_OFFSET_TABLE_
  if (out::gotplt)
    start(out::gotplt, out::_GLOBAL_OFFSET_TABLE_);

  // __start_ and __stop_ symbols for chunks whose name is a valid C
  // identifier.
  for (OutputChunk *chunk : chunks) {
    if (!is_c_identifier(chunk->name))
      continue;
    start(chunk, Symbol::intern("__start_" + std::string(chunk->name)));
    stop(chunk, Symbol::intern("__stop_" + std::string(chunk->name)));
  }
}
|
|
|
|
|
2020-11-20 09:35:47 +03:00
|
|
|
// Returns the current file mode creation mask of the process. umask()
// only reports the old mask when a new one is set, so the mask is
// set to 0 and then immediately restored.
static u32 get_umask() {
  const u32 saved = umask(0);
  umask(saved);
  return saved;
}
|
|
|
|
|
2020-11-09 11:38:12 +03:00
|
|
|
// Creates (or opens) the output file named by config.output, resizes it
// to `filesize` bytes and maps it into memory for reading and writing.
// Returns the address of the mapping. Every failure is reported through
// error().
static u8 *open_output_file(u64 filesize) {
  ScopedTimer t("open_file");

  const int fd =
    open(std::string(config.output).c_str(), O_RDWR | O_CREAT, 0777);
  if (fd == -1)
    error("cannot open " + config.output + ": " + strerror(errno));

  if (ftruncate(fd, filesize))
    error("ftruncate failed");

  // Set the permission bits to 0777 minus the bits in the umask.
  const u32 mode = 0777 & ~get_umask();
  if (fchmod(fd, mode) == -1)
    error("fchmod failed");

  void *mapping =
    mmap(nullptr, filesize, PROT_READ | PROT_WRITE, MAP_SHARED, fd, 0);
  if (mapping == MAP_FAILED)
    error(config.output + ": mmap failed: " + strerror(errno));

  // The descriptor is no longer needed once the mapping exists.
  close(fd);

  // A filler of -1 means that the buffer is not pre-filled.
  if (config.filler != -1)
    memset(mapping, config.filler, filesize);

  return (u8 *)mapping;
}
|
|
|
|
|
2020-12-10 08:27:38 +03:00
|
|
|
// Looks up the library `name` (as given to -l) in config.library_paths.
//
// For each directory, in order, the candidate "<dir>/lib<name>.so" is tried
// first unless config.is_static is set, then "<dir>/lib<name>.a". Directories
// that start with "/" are prefixed with config.sysroot. The first file that
// open_input_file() manages to open is returned; if none can be opened,
// error() is called.
MemoryMappedFile find_library(std::string name) {
  for (std::string_view dir : config.library_paths) {
    std::string stem;
    if (dir.starts_with("/"))
      stem = config.sysroot;
    stem += dir;
    stem += "/lib";
    stem += name;

    MemoryMappedFile *found = nullptr;
    if (!config.is_static)
      found = open_input_file(stem + ".so");
    if (!found)
      found = open_input_file(stem + ".a");
    if (found)
      return *found;
  }

  error("library not found: " + name);
}
|
|
|
|
|
2020-12-12 07:20:26 +03:00
|
|
|
// Returns the command line spellings accepted for the option `name`.
//
// An option may be written with either one or two leading dashes. The
// exception, following GNU ld, is a multi-letter option that starts with
// 'o': it is accepted only with two dashes, because "-oXYZ" is reserved
// for "-o XYZ" (write the output to XYZ). The bare name "o" keeps its
// single-dash spelling only.
static std::vector<std::string> add_dashes(std::string name) {
  const bool starts_with_o = !name.empty() && name.front() == 'o';

  if (starts_with_o && name.size() > 1)
    return {"--" + name};
  if (starts_with_o)
    return {"-" + name};
  return {"-" + name, "--" + name};
}
|
|
|
|
|
2020-12-18 13:58:52 +03:00
|
|
|
// Tries to consume an option that takes a value from the front of `args`.
//
// Single-letter options (`name.size() == 1`) are accepted as "-x VALUE" or
// "-xVALUE". Longer options are accepted, for each spelling returned by
// add_dashes(), as "OPT VALUE" or "OPT=VALUE".
//
// On a match, `arg` receives the value, the consumed elements are dropped
// from `args`, and true is returned. Otherwise both are left untouched and
// false is returned. An empty `args` never matches. If the option is the
// last element and its value is missing, error() is called.
static bool read_arg(std::span<std::string_view> &args, std::string_view &arg,
                     std::string name) {
  if (args.empty())
    return false;

  if (name.size() == 1) {
    const std::string opt = "-" + name;

    if (args[0] == opt) {
      if (args.size() == 1)
        error("option " + opt + ": argument missing");
      arg = args[1];
      args = args.subspan(2);
      return true;
    }

    if (args[0].starts_with(opt)) {
      arg = args[0].substr(opt.size());
      args = args.subspan(1);
      return true;
    }
    return false;
  }

  for (const std::string &opt : add_dashes(name)) {
    if (args[0] == opt) {
      if (args.size() == 1)
        error("option " + opt + ": argument missing");
      arg = args[1];
      args = args.subspan(2);
      return true;
    }

    if (args[0].starts_with(opt + "=")) {
      arg = args[0].substr(opt.size() + 1);
      args = args.subspan(1);
      return true;
    }
  }
  return false;
}
|
|
|
|
|
2020-12-18 13:58:52 +03:00
|
|
|
// Tries to consume a value-less option from the front of `args`.
//
// Returns true and drops the first element of `args` if it equals one of
// the spellings returned by add_dashes(name). Otherwise, or when `args` is
// empty, returns false and leaves `args` untouched.
static bool read_flag(std::span<std::string_view> &args, std::string name) {
  if (args.empty())
    return false;

  for (const std::string &opt : add_dashes(name)) {
    if (args[0] == opt) {
      args = args.subspan(1);
      return true;
    }
  }
  return false;
}
|
|
|
|
|
2020-12-18 13:58:52 +03:00
|
|
|
// Tries to consume a "-z" keyword option from the front of `args`.
//
// Both the two-element form ("-z", name) and the joined form ("-z" + name)
// are recognized. On a match the consumed elements are removed from `args`
// and true is returned; otherwise `args` is left untouched and false is
// returned.
static bool read_z_flag(std::span<std::string_view> &args, std::string name) {
  const bool separate =
    args.size() >= 2 && args[0] == "-z" && args[1] == name;
  const bool joined =
    !separate && !args.empty() && args[0] == "-z" + name;

  if (!separate && !joined)
    return false;

  args = args.subspan(separate ? 2 : 1);
  return true;
}
|
2020-10-04 12:00:33 +03:00
|
|
|
|
2020-12-18 13:58:52 +03:00
|
|
|
static bool read_equal(std::span<std::string_view> &args, std::string_view &arg,
|
2020-12-12 07:20:26 +03:00
|
|
|
std::string name, std::string default_) {
|
|
|
|
for (std::string opt : add_dashes(name)) {
|
2020-12-11 06:43:14 +03:00
|
|
|
if (args[0] == opt) {
|
2020-12-12 07:20:26 +03:00
|
|
|
arg = default_;
|
2020-12-11 06:43:14 +03:00
|
|
|
args = args.subspan(1);
|
|
|
|
return true;
|
|
|
|
}
|
2020-12-17 16:29:43 +03:00
|
|
|
}
|
2020-12-12 07:20:26 +03:00
|
|
|
|
|
|
|
for (std::string opt : add_dashes(name)) {
|
2020-12-18 13:58:52 +03:00
|
|
|
if (args[0].starts_with(opt + "=")) {
|
|
|
|
arg = args[0].substr(opt.size() + 1);
|
2020-12-12 07:20:26 +03:00
|
|
|
args = args.subspan(1);
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
}
|
2020-12-11 06:43:14 +03:00
|
|
|
return false;
|
|
|
|
}
|
2020-10-29 06:24:54 +03:00
|
|
|
|
2020-12-11 06:43:14 +03:00
|
|
|
// Parses `value` as a hexadecimal number written with a "0x" or "0X" prefix
// and returns it. `opt` is the option name used in diagnostics.
//
// error() is called if the prefix is missing, if no digits follow it, if a
// non-hexadecimal character is present, or if the number does not fit in
// 64 bits.
static u64 parse_hex(std::string opt, std::string_view value) {
  if (!value.starts_with("0x") && !value.starts_with("0X"))
    error("option -" + opt + ": not a hexadecimal number");
  value = value.substr(2);

  // A bare "0x" has to be rejected here; std::stoull would throw
  // std::invalid_argument on an empty digit string.
  if (value.empty() ||
      value.find_first_not_of("0123456789abcdefABCDEF") != std::string_view::npos)
    error("option -" + opt + ": not a hexadecimal number");

  // A 64-bit value has at most 16 significant hexadecimal digits. Checking
  // this up front keeps std::stoull from throwing std::out_of_range.
  size_t first = value.find_first_not_of('0');
  if (first != std::string_view::npos && value.size() - first > 16)
    error("option -" + opt + ": number out of range");

  return std::stoull(std::string(value), nullptr, 16);
}
|
2020-11-30 11:57:58 +03:00
|
|
|
|
2020-12-11 06:43:14 +03:00
|
|
|
// Parses `value` as an unsigned decimal number and returns it. `opt` is the
// option name used in diagnostics.
//
// error() is called if `value` is empty, contains a character other than
// 0-9, or denotes a number larger than 2^64 - 1.
static u64 parse_number(std::string opt, std::string_view value) {
  // An empty string has to be rejected here; std::stoull would throw
  // std::invalid_argument on it.
  if (value.empty() ||
      value.find_first_not_of("0123456789") != std::string_view::npos)
    error("option -" + opt + ": not a number");

  // Range-check on the text so that std::stoull cannot throw
  // std::out_of_range. Once leading zeros are dropped, a longer digit
  // string is a larger number, and digit strings of equal length order
  // the same way lexicographically as numerically.
  constexpr std::string_view max_u64 = "18446744073709551615";
  size_t first = value.find_first_not_of('0');
  std::string_view digits =
    (first == std::string_view::npos) ? std::string_view() : value.substr(first);
  if (digits.size() > max_u64.size() ||
      (digits.size() == max_u64.size() && digits > max_u64))
    error("option -" + opt + ": number out of range");

  return std::stoull(std::string(value));
}
|
2020-12-07 14:04:44 +03:00
|
|
|
|
2020-12-19 04:08:32 +03:00
|
|
|
// Exiting from a program with large memory usage is slow --
// it may take a few hundred milliseconds. To hide the latency,
// we fork a child and let it do the actual linking work.
//
// This function returns only in the child. The parent blocks until it can
// read one byte from a pipe shared with the child and then terminates with
// _exit(): status 0 if the byte arrived, status 1 otherwise (for example
// when the child exits without writing, which makes the read hit EOF).
//
// The returned callable writes that one byte; the child calls it once its
// work is complete. If pipe() or fork() fails, the error is printed with
// perror() and the process exits with status 1.
static std::function<void()> fork_child() {
  int pipefd[2];
  if (pipe(pipefd) == -1) {
    perror("pipe");
    exit(1);
  }

  pid_t pid = fork();
  if (pid == -1) {
    perror("fork");
    exit(1);
  }

  if (pid > 0) {
    // Parent
    close(pipefd[1]);

    // Retry when a signal interrupts the read; an interruption says
    // nothing about whether the child succeeded.
    char buf[1];
    ssize_t r;
    do {
      r = read(pipefd[0], buf, 1);
    } while (r == -1 && errno == EINTR);
    _exit(r != 1);
  }

  // Child
  close(pipefd[0]);

  const int fd = pipefd[1];
  return [fd]() {
    const char done = 1;
    ssize_t r;
    do {
      r = write(fd, &done, 1);
    } while (r == -1 && errno == EINTR);
  };
}
|
|
|
|
|
2020-12-11 06:43:14 +03:00
|
|
|
int main(int argc, char **argv) {
|
2020-12-19 04:08:32 +03:00
|
|
|
std::function<void()> on_complete = fork_child();
|
|
|
|
|
|
|
|
// Main
|
2020-12-11 10:51:20 +03:00
|
|
|
Timer t_all("all");
|
|
|
|
|
2020-12-11 06:43:14 +03:00
|
|
|
config.thread_count =
|
|
|
|
tbb::global_control::active_value(tbb::global_control::max_allowed_parallelism);
|
2020-11-05 02:31:32 +03:00
|
|
|
|
2020-12-11 06:43:14 +03:00
|
|
|
// Parse command line options
|
2020-12-18 13:58:52 +03:00
|
|
|
std::vector<std::string_view> arg_vector;
|
|
|
|
for (int i = 1; i < argc; i++)
|
|
|
|
arg_vector.push_back(argv[i]);
|
|
|
|
|
2020-12-19 11:45:11 +03:00
|
|
|
Timer t_open("open");
|
2020-12-19 12:08:15 +03:00
|
|
|
std::vector<std::pair<std::string, bool>> input_paths;
|
|
|
|
|
2020-12-18 13:58:52 +03:00
|
|
|
for (std::span<std::string_view> args = arg_vector; !args.empty();) {
|
2020-12-17 09:03:17 +03:00
|
|
|
std::string_view arg;
|
2020-12-11 06:43:14 +03:00
|
|
|
|
|
|
|
if (read_arg(args, arg, "o")) {
|
|
|
|
config.output = arg;
|
2020-12-12 07:20:26 +03:00
|
|
|
} else if (read_arg(args, arg, "dynamic-linker")) {
|
|
|
|
config.dynamic_linker = arg;
|
2020-12-14 11:01:07 +03:00
|
|
|
} else if (read_flag(args, "export-dynamic")) {
|
|
|
|
config.export_dynamic = true;
|
2020-12-14 04:07:14 +03:00
|
|
|
} else if (read_arg(args, arg, "e") || read_arg(args, arg, "entry")) {
|
|
|
|
config.entry = arg;
|
2020-12-11 06:43:14 +03:00
|
|
|
} else if (read_flag(args, "print-map")) {
|
|
|
|
config.print_map = true;
|
|
|
|
} else if (read_arg(args, arg, "thread-count")) {
|
|
|
|
config.thread_count = parse_number("thread-count", arg);
|
|
|
|
} else if (read_flag(args, "stat")) {
|
|
|
|
Counter::enabled = true;
|
|
|
|
} else if (read_flag(args, "static")) {
|
|
|
|
config.is_static = true;
|
|
|
|
} else if (read_arg(args, arg, "y") || read_arg(args, arg, "trace-symbol")) {
|
|
|
|
Symbol::intern(arg)->traced = true;
|
|
|
|
} else if (read_arg(args, arg, "filler")) {
|
|
|
|
config.filler = parse_hex("filler", arg);
|
|
|
|
} else if (read_arg(args, arg, "L") || read_arg(args, arg, "library-path")) {
|
2020-12-17 09:03:17 +03:00
|
|
|
config.library_paths.push_back(std::string(arg));
|
2020-12-11 06:43:14 +03:00
|
|
|
} else if (read_arg(args, arg, "sysroot")) {
|
|
|
|
config.sysroot = arg;
|
|
|
|
} else if (read_flag(args, "trace")) {
|
|
|
|
config.trace = true;
|
|
|
|
} else if (read_flag(args, "as-needed")) {
|
|
|
|
config.as_needed = true;
|
|
|
|
} else if (read_flag(args, "no-as-needed")) {
|
|
|
|
config.as_needed = false;
|
|
|
|
} else if (read_arg(args, arg, "rpath")) {
|
2020-12-17 09:03:17 +03:00
|
|
|
config.rpaths.push_back(std::string(arg));
|
2020-12-11 06:43:14 +03:00
|
|
|
} else if (read_arg(args, arg, "version-script")) {
|
2020-12-17 09:03:17 +03:00
|
|
|
parse_version_script(std::string(arg));
|
2020-12-16 15:16:34 +03:00
|
|
|
} else if (read_flag(args, "pie")) {
|
|
|
|
config.pie = true;
|
2020-12-17 15:36:38 +03:00
|
|
|
} else if (read_flag(args, "no-pie")) {
|
|
|
|
config.pie = false;
|
2020-12-13 16:41:50 +03:00
|
|
|
} else if (read_flag(args, "perf")) {
|
|
|
|
config.perf = true;
|
2020-12-11 06:43:14 +03:00
|
|
|
} else if (read_arg(args, arg, "l")) {
|
2020-12-19 12:08:15 +03:00
|
|
|
input_paths.push_back({"-l" + std::string(arg), config.as_needed});
|
2020-12-17 16:29:43 +03:00
|
|
|
} else if (read_z_flag(args, "now")) {
|
|
|
|
config.z_now = true;
|
2020-12-12 07:20:26 +03:00
|
|
|
} else if (read_arg(args, arg, "z")) {
|
|
|
|
} else if (read_arg(args, arg, "hash-style")) {
|
|
|
|
} else if (read_arg(args, arg, "m")) {
|
|
|
|
} else if (read_equal(args, arg, "build-id", "none")) {
|
|
|
|
} else if (read_flag(args, "eh-frame-hdr")) {
|
|
|
|
} else if (read_flag(args, "start-group")) {
|
|
|
|
} else if (read_flag(args, "end-group")) {
|
|
|
|
} else if (read_flag(args, "fatal-warnings")) {
|
|
|
|
} else if (read_flag(args, "disable-new-dtags")) {
|
2020-12-11 06:43:14 +03:00
|
|
|
} else if (args[0][0] == '-') {
|
|
|
|
error("unknown command line option: " + std::string(args[0]));
|
|
|
|
} else {
|
2020-12-19 12:08:15 +03:00
|
|
|
input_paths.push_back({std::string(args[0]), config.as_needed});
|
2020-12-11 06:43:14 +03:00
|
|
|
args = args.subspan(1);
|
2020-11-19 12:03:26 +03:00
|
|
|
}
|
2020-11-07 17:00:01 +03:00
|
|
|
}
|
2020-10-25 03:38:53 +03:00
|
|
|
|
2020-12-19 12:08:15 +03:00
|
|
|
std::vector<std::vector<InputFile *>> input_file_vectors(input_paths.size());
|
|
|
|
tbb::parallel_for(0, (int)input_paths.size(), [&](int i) {
|
|
|
|
std::string path = input_paths[i].first;
|
|
|
|
bool as_needed = input_paths[i].second;
|
|
|
|
|
|
|
|
if (path.starts_with("-l"))
|
|
|
|
input_file_vectors[i] = read_file(find_library(path.substr(2)), as_needed);
|
|
|
|
else
|
|
|
|
input_file_vectors[i] = read_file(must_open_input_file(path), as_needed);
|
|
|
|
});
|
|
|
|
|
|
|
|
std::vector<InputFile *> input_files = flatten(input_file_vectors);
|
|
|
|
|
2020-12-19 11:45:11 +03:00
|
|
|
t_open.stop();
|
|
|
|
|
2020-12-11 06:43:14 +03:00
|
|
|
if (config.output == "")
|
|
|
|
error("-o option is missing");
|
|
|
|
|
2020-12-17 15:36:38 +03:00
|
|
|
if (config.pie)
|
|
|
|
config.image_base = 0;
|
|
|
|
|
2020-12-11 06:43:14 +03:00
|
|
|
tbb::global_control tbb_cont(tbb::global_control::max_allowed_parallelism,
|
|
|
|
config.thread_count);
|
|
|
|
|
2020-11-07 17:00:01 +03:00
|
|
|
// Parse input files
|
|
|
|
{
|
2020-12-11 10:51:20 +03:00
|
|
|
ScopedTimer t("parse");
|
2020-12-19 12:08:15 +03:00
|
|
|
tbb::parallel_for_each(input_files, [](InputFile *file) { file->parse(); });
|
|
|
|
}
|
|
|
|
|
|
|
|
for (InputFile *file : input_files) {
|
|
|
|
if (file->is_dso)
|
|
|
|
out::dsos.push_back((SharedFile *)file);
|
|
|
|
else
|
|
|
|
out::objs.push_back((ObjectFile *)file);
|
2020-10-25 03:38:53 +03:00
|
|
|
}
|
2020-10-18 13:17:44 +03:00
|
|
|
|
2020-11-20 07:54:29 +03:00
|
|
|
// Uniquify shared object files with soname
|
|
|
|
{
|
2020-11-29 16:05:34 +03:00
|
|
|
std::vector<SharedFile *> vec;
|
2020-12-11 06:46:03 +03:00
|
|
|
std::unordered_set<std::string_view> seen;
|
2020-11-29 16:05:34 +03:00
|
|
|
for (SharedFile *file : out::dsos)
|
|
|
|
if (seen.insert(file->soname).second)
|
|
|
|
vec.push_back(file);
|
|
|
|
out::dsos = vec;
|
2020-11-20 07:54:29 +03:00
|
|
|
}
|
|
|
|
|
2020-12-11 10:51:20 +03:00
|
|
|
Timer t_total("total");
|
|
|
|
Timer t_before_copy("before_copy");
|
2020-11-06 10:58:13 +03:00
|
|
|
|
2020-11-16 18:17:01 +03:00
|
|
|
out::ehdr = new OutputEhdr;
|
2020-11-16 18:23:51 +03:00
|
|
|
out::shdr = new OutputShdr;
|
2020-11-16 18:33:41 +03:00
|
|
|
out::phdr = new OutputPhdr;
|
2020-11-18 11:11:58 +03:00
|
|
|
out::got = new GotSection;
|
2020-11-13 06:43:59 +03:00
|
|
|
out::gotplt = new GotPltSection;
|
2020-11-17 07:34:02 +03:00
|
|
|
out::relplt = new RelPltSection;
|
2020-11-19 10:13:19 +03:00
|
|
|
out::strtab = new StrtabSection;
|
2020-11-17 06:20:56 +03:00
|
|
|
out::shstrtab = new ShstrtabSection;
|
2020-11-11 15:32:41 +03:00
|
|
|
out::plt = new PltSection;
|
2020-11-17 07:32:22 +03:00
|
|
|
out::symtab = new SymtabSection;
|
2020-11-16 17:40:01 +03:00
|
|
|
out::dynsym = new DynsymSection;
|
2020-11-17 07:19:54 +03:00
|
|
|
out::dynstr = new DynstrSection;
|
2020-11-25 11:20:48 +03:00
|
|
|
out::copyrel = new CopyrelSection;
|
2020-11-12 08:40:39 +03:00
|
|
|
|
2020-11-10 13:33:27 +03:00
|
|
|
if (!config.is_static) {
|
2020-11-16 19:05:01 +03:00
|
|
|
out::interp = new InterpSection;
|
2020-11-16 18:43:32 +03:00
|
|
|
out::dynamic = new DynamicSection;
|
2020-11-17 07:30:33 +03:00
|
|
|
out::reldyn = new RelDynSection;
|
2020-11-11 15:32:41 +03:00
|
|
|
out::hash = new HashSection;
|
2020-11-29 05:57:58 +03:00
|
|
|
out::versym = new VersymSection;
|
|
|
|
out::verneed = new VerneedSection;
|
2020-11-10 13:33:27 +03:00
|
|
|
}
|
|
|
|
|
2020-11-20 06:44:02 +03:00
|
|
|
out::chunks.push_back(out::got);
|
|
|
|
out::chunks.push_back(out::plt);
|
|
|
|
out::chunks.push_back(out::gotplt);
|
|
|
|
out::chunks.push_back(out::relplt);
|
|
|
|
out::chunks.push_back(out::reldyn);
|
|
|
|
out::chunks.push_back(out::dynamic);
|
|
|
|
out::chunks.push_back(out::dynsym);
|
|
|
|
out::chunks.push_back(out::dynstr);
|
|
|
|
out::chunks.push_back(out::shstrtab);
|
|
|
|
out::chunks.push_back(out::symtab);
|
|
|
|
out::chunks.push_back(out::strtab);
|
|
|
|
out::chunks.push_back(out::hash);
|
2020-11-25 11:20:48 +03:00
|
|
|
out::chunks.push_back(out::copyrel);
|
2020-11-29 06:59:08 +03:00
|
|
|
out::chunks.push_back(out::versym);
|
|
|
|
out::chunks.push_back(out::verneed);
|
2020-11-20 06:44:02 +03:00
|
|
|
|
2020-11-22 05:10:38 +03:00
|
|
|
// Set priorities to files. File priority 1 is reserved for the internal file.
|
|
|
|
int priority = 2;
|
2020-11-24 07:56:14 +03:00
|
|
|
for (ObjectFile *file : out::objs)
|
2020-11-24 08:31:05 +03:00
|
|
|
if (!file->is_in_archive)
|
2020-10-28 04:15:05 +03:00
|
|
|
file->priority = priority++;
|
2020-11-24 07:56:14 +03:00
|
|
|
for (ObjectFile *file : out::objs)
|
2020-11-24 08:31:05 +03:00
|
|
|
if (file->is_in_archive)
|
2020-10-28 04:15:05 +03:00
|
|
|
file->priority = priority++;
|
2020-11-24 10:22:32 +03:00
|
|
|
for (SharedFile *file : out::dsos)
|
2020-11-24 08:31:05 +03:00
|
|
|
file->priority = priority++;
|
2020-10-18 13:05:28 +03:00
|
|
|
|
2020-11-11 04:42:26 +03:00
|
|
|
// Resolve symbols and fix the set of object files that are
|
|
|
|
// included to the final output.
|
2020-11-17 08:05:40 +03:00
|
|
|
resolve_symbols();
|
2020-10-19 15:50:33 +03:00
|
|
|
|
2020-12-11 06:43:14 +03:00
|
|
|
if (config.trace) {
|
2020-11-24 07:56:14 +03:00
|
|
|
for (ObjectFile *file : out::objs)
|
2020-12-11 03:15:08 +03:00
|
|
|
message(to_string(file));
|
2020-11-24 10:22:32 +03:00
|
|
|
for (SharedFile *file : out::dsos)
|
2020-12-11 03:15:08 +03:00
|
|
|
message(to_string(file));
|
2020-11-24 08:31:05 +03:00
|
|
|
}
|
2020-11-05 03:24:47 +03:00
|
|
|
|
2020-11-11 04:42:26 +03:00
|
|
|
// Remove redundant comdat sections (e.g. duplicate inline functions).
|
2020-11-17 08:04:53 +03:00
|
|
|
eliminate_comdats();
|
2020-10-10 06:47:12 +03:00
|
|
|
|
2020-11-11 04:42:26 +03:00
|
|
|
// Merge strings constants in SHF_MERGE sections.
|
2020-11-17 08:04:53 +03:00
|
|
|
handle_mergeable_strings();
|
2020-11-07 14:29:06 +03:00
|
|
|
|
2020-10-27 06:50:25 +03:00
|
|
|
// Create .bss sections for common symbols.
|
|
|
|
{
|
2020-12-11 10:51:20 +03:00
|
|
|
ScopedTimer t("common");
|
2020-12-13 16:23:30 +03:00
|
|
|
tbb::parallel_for_each(out::objs, [](ObjectFile *file) {
|
|
|
|
file->convert_common_symbols();
|
|
|
|
});
|
2020-10-27 06:50:25 +03:00
|
|
|
}
|
|
|
|
|
2020-10-26 05:34:26 +03:00
|
|
|
// Bin input sections into output sections
|
2020-11-17 08:04:53 +03:00
|
|
|
bin_sections();
|
2020-10-23 04:27:11 +03:00
|
|
|
|
2020-10-29 12:19:10 +03:00
|
|
|
// Assign offsets within an output section to input sections.
|
2020-11-11 04:42:26 +03:00
|
|
|
set_isec_offsets();
|
2020-10-22 10:35:17 +03:00
|
|
|
|
2020-11-12 10:09:17 +03:00
|
|
|
// Sections are added to the section lists in an arbitrary order because
|
2020-12-13 16:23:30 +03:00
|
|
|
// they are created in parallel. Sort them to to make the output deterministic.
|
2020-11-12 09:19:30 +03:00
|
|
|
auto section_compare = [](OutputChunk *x, OutputChunk *y) {
|
|
|
|
return std::make_tuple(x->name, (u32)x->shdr.sh_type, (u64)x->shdr.sh_flags) <
|
|
|
|
std::make_tuple(y->name, (u32)y->shdr.sh_type, (u64)y->shdr.sh_flags);
|
|
|
|
};
|
|
|
|
|
|
|
|
std::stable_sort(OutputSection::instances.begin(), OutputSection::instances.end(),
|
|
|
|
section_compare);
|
|
|
|
std::stable_sort(MergedSection::instances.begin(), MergedSection::instances.end(),
|
|
|
|
section_compare);
|
|
|
|
|
2020-11-12 10:09:17 +03:00
|
|
|
// Add sections to the section lists
|
2020-11-04 04:39:17 +03:00
|
|
|
for (OutputSection *osec : OutputSection::instances)
|
2020-11-11 16:14:12 +03:00
|
|
|
if (osec->shdr.sh_size)
|
2020-11-17 07:48:11 +03:00
|
|
|
out::chunks.push_back(osec);
|
2020-11-07 15:53:21 +03:00
|
|
|
for (MergedSection *osec : MergedSection::instances)
|
2020-11-11 16:14:12 +03:00
|
|
|
if (osec->shdr.sh_size)
|
2020-11-17 07:48:11 +03:00
|
|
|
out::chunks.push_back(osec);
|
2020-11-07 14:31:09 +03:00
|
|
|
|
2020-12-13 16:31:50 +03:00
|
|
|
erase(out::chunks, [](OutputChunk *c) { return !c; });
|
2020-11-20 06:44:02 +03:00
|
|
|
|
|
|
|
// Sort the sections by section flags so that we'll have to create
|
|
|
|
// as few segments as possible.
|
|
|
|
std::stable_sort(out::chunks.begin(), out::chunks.end(),
|
|
|
|
[](OutputChunk *a, OutputChunk *b) {
|
|
|
|
return get_section_rank(a->shdr) < get_section_rank(b->shdr);
|
|
|
|
});
|
|
|
|
|
2020-11-04 04:39:17 +03:00
|
|
|
// Create a dummy file containing linker-synthesized symbols
|
|
|
|
// (e.g. `__bss_start`).
|
2020-11-17 07:48:11 +03:00
|
|
|
ObjectFile *internal_file = ObjectFile::create_internal_file();
|
2020-11-22 05:10:38 +03:00
|
|
|
internal_file->priority = 1;
|
2020-11-20 06:44:02 +03:00
|
|
|
internal_file->resolve_symbols();
|
2020-11-24 07:56:14 +03:00
|
|
|
out::objs.push_back(internal_file);
|
2020-11-04 04:39:17 +03:00
|
|
|
|
2020-11-20 05:08:06 +03:00
|
|
|
// Convert weak symbols to absolute symbols with value 0.
|
2020-11-24 07:56:14 +03:00
|
|
|
tbb::parallel_for_each(out::objs, [](ObjectFile *file) {
|
2020-11-20 05:08:06 +03:00
|
|
|
file->handle_undefined_weak_symbols();
|
|
|
|
});
|
|
|
|
|
2020-11-09 05:31:00 +03:00
|
|
|
// Beyond this point, no new symbols will be added to the result.
|
|
|
|
|
2020-12-13 16:23:30 +03:00
|
|
|
// Copy shared object name strings to .dynstr.
|
2020-11-24 10:22:32 +03:00
|
|
|
for (SharedFile *file : out::dsos)
|
2020-11-30 11:52:08 +03:00
|
|
|
out::dynstr->add_string(file->soname);
|
2020-11-12 18:14:15 +03:00
|
|
|
|
2020-11-30 11:57:58 +03:00
|
|
|
// Copy DT_RUNPATH strings to .dynstr.
|
2020-12-10 07:44:58 +03:00
|
|
|
for (std::string_view path : config.rpaths)
|
2020-11-30 11:57:58 +03:00
|
|
|
out::dynstr->add_string(path);
|
|
|
|
|
2020-11-09 03:47:58 +03:00
|
|
|
// Add headers and sections that have to be at the beginning
|
|
|
|
// or the ending of a file.
|
2020-11-17 07:48:11 +03:00
|
|
|
out::chunks.insert(out::chunks.begin(), out::ehdr);
|
|
|
|
out::chunks.insert(out::chunks.begin() + 1, out::phdr);
|
2020-11-11 15:32:41 +03:00
|
|
|
if (out::interp)
|
2020-11-17 07:48:11 +03:00
|
|
|
out::chunks.insert(out::chunks.begin() + 2, out::interp);
|
|
|
|
out::chunks.push_back(out::shdr);
|
2020-10-27 11:36:55 +03:00
|
|
|
|
2020-11-26 12:09:32 +03:00
|
|
|
// Make sure that all symbols have been resolved.
|
|
|
|
check_duplicate_symbols();
|
|
|
|
|
2020-11-29 05:06:11 +03:00
|
|
|
// Scan relocations to find symbols that need entries in .got, .plt,
|
|
|
|
// .got.plt, .dynsym, .dynstr, etc.
|
2020-11-29 05:10:33 +03:00
|
|
|
scan_rels();
|
2020-11-20 06:44:02 +03:00
|
|
|
|
2020-12-07 09:50:13 +03:00
|
|
|
// Put symbols to .dynsym.
|
|
|
|
export_dynamic();
|
|
|
|
|
2020-11-29 05:40:57 +03:00
|
|
|
// Fill .gnu.version and .gnu.version_r section contents.
|
|
|
|
fill_symbol_versions();
|
|
|
|
|
2020-11-29 12:58:36 +03:00
|
|
|
// Compute .symtab and .strtab sizes for each file.
|
|
|
|
tbb::parallel_for_each(out::objs, [](ObjectFile *file) {
|
|
|
|
file->compute_symtab();
|
|
|
|
});
|
|
|
|
|
2020-11-19 10:20:09 +03:00
|
|
|
// Now that we have computed sizes for all sections and assigned
|
|
|
|
// section indices to them, so we can fix section header contents
|
|
|
|
// for all output sections.
|
2020-12-07 10:12:19 +03:00
|
|
|
for (OutputChunk *chunk : out::chunks)
|
|
|
|
chunk->update_shdr();
|
|
|
|
|
2020-12-13 16:31:50 +03:00
|
|
|
erase(out::chunks, [](OutputChunk *c) { return c->shdr.sh_size == 0; });
|
2020-12-07 10:12:19 +03:00
|
|
|
|
|
|
|
// Set section indices.
|
|
|
|
for (int i = 0, shndx = 1; i < out::chunks.size(); i++)
|
|
|
|
if (out::chunks[i]->kind != OutputChunk::HEADER)
|
|
|
|
out::chunks[i]->shndx = shndx++;
|
|
|
|
|
|
|
|
for (OutputChunk *chunk : out::chunks)
|
2020-12-07 09:50:13 +03:00
|
|
|
chunk->update_shdr();
|
2020-11-16 18:45:02 +03:00
|
|
|
|
2020-10-30 10:55:59 +03:00
|
|
|
// Assign offsets to output sections
|
2020-11-17 07:48:11 +03:00
|
|
|
u64 filesize = set_osec_offsets(out::chunks);
|
2020-10-19 17:37:29 +03:00
|
|
|
|
2020-11-03 10:51:28 +03:00
|
|
|
// Fix linker-synthesized symbol addresses.
|
2020-11-17 07:48:11 +03:00
|
|
|
fix_synthetic_symbols(out::chunks);
|
2020-11-01 07:05:51 +03:00
|
|
|
|
2020-11-09 03:58:35 +03:00
|
|
|
// At this point, file layout is fixed. Beyond this, you can assume
|
|
|
|
// that symbol addresses including their GOT/PLT/etc addresses have
|
|
|
|
// a correct final value.
|
|
|
|
|
2020-11-11 04:42:26 +03:00
|
|
|
// Some types of relocations for TLS symbols need the ending address
|
|
|
|
// of the TLS section. Find it out now.
|
2020-12-10 15:13:02 +03:00
|
|
|
for (ElfPhdr phdr : create_phdr())
|
2020-11-29 14:19:59 +03:00
|
|
|
if (phdr.p_type == PT_TLS)
|
|
|
|
out::tls_end = align_to(phdr.p_vaddr + phdr.p_memsz, phdr.p_align);
|
2020-10-26 08:38:43 +03:00
|
|
|
|
2020-12-11 10:51:20 +03:00
|
|
|
t_before_copy.stop();
|
|
|
|
|
2020-11-09 10:41:26 +03:00
|
|
|
// Create an output file
|
2020-11-17 08:03:32 +03:00
|
|
|
out::buf = open_output_file(filesize);
|
2020-11-09 10:41:26 +03:00
|
|
|
|
2020-12-11 10:51:20 +03:00
|
|
|
Timer t_copy("copy");
|
|
|
|
|
2020-11-17 08:49:07 +03:00
|
|
|
// Copy input sections to the output file
|
2020-11-12 16:06:47 +03:00
|
|
|
{
|
2020-12-11 10:51:20 +03:00
|
|
|
ScopedTimer t("copy_buf");
|
2020-11-17 07:48:11 +03:00
|
|
|
tbb::parallel_for_each(out::chunks, [&](OutputChunk *chunk) {
|
2020-11-17 07:56:40 +03:00
|
|
|
chunk->copy_buf();
|
2020-11-09 08:47:51 +03:00
|
|
|
});
|
2020-10-30 05:40:38 +03:00
|
|
|
}
|
2020-10-20 03:20:52 +03:00
|
|
|
|
2020-11-09 15:50:47 +03:00
|
|
|
// Zero-clear paddings between sections
|
2020-11-17 07:59:24 +03:00
|
|
|
clear_padding(filesize);
|
2020-11-09 15:50:47 +03:00
|
|
|
|
2020-11-09 10:41:26 +03:00
|
|
|
// Commit
|
2020-10-25 03:38:53 +03:00
|
|
|
{
|
2020-12-11 10:51:20 +03:00
|
|
|
ScopedTimer t("munmap");
|
2020-11-17 07:49:18 +03:00
|
|
|
munmap(out::buf, filesize);
|
2020-10-25 03:38:53 +03:00
|
|
|
}
|
2020-10-14 12:41:09 +03:00
|
|
|
|
2020-12-11 10:51:20 +03:00
|
|
|
t_copy.stop();
|
2020-12-11 11:04:19 +03:00
|
|
|
t_total.stop();
|
2020-12-11 10:51:20 +03:00
|
|
|
t_all.stop();
|
2020-11-06 10:58:13 +03:00
|
|
|
|
2020-12-11 10:51:20 +03:00
|
|
|
if (config.print_map)
|
2020-11-24 08:31:05 +03:00
|
|
|
print_map();
|
2020-10-29 06:24:54 +03:00
|
|
|
|
2020-12-12 06:57:56 +03:00
|
|
|
// Show stats numbers
|
2020-12-13 19:28:43 +03:00
|
|
|
if (Counter::enabled) {
|
|
|
|
for (ObjectFile *obj : out::objs) {
|
|
|
|
static Counter defined("defined_syms");
|
|
|
|
defined.inc(obj->first_global - 1);
|
2020-12-12 06:57:56 +03:00
|
|
|
|
2020-12-13 19:28:43 +03:00
|
|
|
static Counter undefined("undefined_syms");
|
|
|
|
undefined.inc(obj->symbols.size() - obj->first_global);
|
|
|
|
}
|
2020-12-12 06:57:56 +03:00
|
|
|
|
2020-12-13 19:28:43 +03:00
|
|
|
Counter num_input_sections("input_sections");
|
|
|
|
for (ObjectFile *file : out::objs)
|
|
|
|
num_input_sections.inc(file->sections.size());
|
|
|
|
|
|
|
|
static Counter merged_strings("merged_strings");
|
|
|
|
for (MergedSection *osec : MergedSection::instances)
|
|
|
|
merged_strings.inc(osec->map.size());
|
2020-11-03 11:36:43 +03:00
|
|
|
|
2020-12-13 19:28:43 +03:00
|
|
|
Counter num_output_chunks("output_out::chunks", out::chunks.size());
|
|
|
|
Counter num_objs("num_objs", out::objs.size());
|
|
|
|
Counter num_dsos("num_dsos", out::dsos.size());
|
|
|
|
Counter filesize_counter("filesize", filesize);
|
2020-11-03 11:36:43 +03:00
|
|
|
|
2020-12-13 16:41:50 +03:00
|
|
|
Counter::print();
|
2020-12-13 19:28:43 +03:00
|
|
|
}
|
|
|
|
|
2020-12-13 16:41:50 +03:00
|
|
|
if (config.perf)
|
|
|
|
Timer::print();
|
|
|
|
|
|
|
|
std::cout << std::flush;
|
|
|
|
std::cerr << std::flush;
|
2020-12-19 04:08:32 +03:00
|
|
|
on_complete();
|
2020-12-13 19:30:08 +03:00
|
|
|
std::quick_exit(0);
|
2020-09-29 09:05:29 +03:00
|
|
|
}
|