#include "mold.h" namespace mold::elf { using E = I386; template <> void GotPltSection::copy_buf(Context &ctx) { u32 *buf = (u32 *)(ctx.buf + this->shdr.sh_offset); // The first slot of .got.plt points to _DYNAMIC. buf[0] = ctx.dynamic ? ctx.dynamic->shdr.sh_addr : 0; buf[1] = 0; buf[2] = 0; for (Symbol *sym : ctx.plt->symbols) buf[sym->get_gotplt_idx(ctx)] = sym->get_plt_addr(ctx) + 6; } static void write_plt_header(Context &ctx, u8 *buf) { if (ctx.arg.pic) { static const u8 plt0[] = { 0xff, 0xb3, 0x04, 0, 0, 0, // pushl 4(%ebx) 0xff, 0xa3, 0x08, 0, 0, 0, // jmp *8(%ebx) 0x90, 0x90, 0x90, 0x90, // nop }; memcpy(buf, plt0, sizeof(plt0)); } else { static const u8 plt0[] = { 0xff, 0x35, 0, 0, 0, 0, // pushl (GOTPLT+4) 0xff, 0x25, 0, 0, 0, 0, // jmp *(GOTPLT+8) 0x90, 0x90, 0x90, 0x90, // nop }; memcpy(buf, plt0, sizeof(plt0)); *(u32 *)(buf + 2) = ctx.gotplt->shdr.sh_addr + 4; *(u32 *)(buf + 8) = ctx.gotplt->shdr.sh_addr + 8; } } static void write_plt_entry(Context &ctx, u8 *buf, Symbol &sym, i64 idx) { u8 *ent = buf + ctx.plt_hdr_size + sym.get_plt_idx(ctx) * ctx.plt_size; if (ctx.arg.pic) { static const u8 data[] = { 0xff, 0xa3, 0, 0, 0, 0, // jmp *foo@GOT(%ebx) 0x68, 0, 0, 0, 0, // pushl $reloc_offset 0xe9, 0, 0, 0, 0, // jmp .PLT0@PC }; memcpy(ent, data, sizeof(data)); *(u32 *)(ent + 2) = sym.get_gotplt_addr(ctx) - ctx.gotplt->shdr.sh_addr; } else { static const u8 data[] = { 0xff, 0x25, 0, 0, 0, 0, // jmp *foo@GOT 0x68, 0, 0, 0, 0, // pushl $reloc_offset 0xe9, 0, 0, 0, 0, // jmp .PLT0@PC }; memcpy(ent, data, sizeof(data)); *(u32 *)(ent + 2) = sym.get_gotplt_addr(ctx); } *(u32 *)(ent + 7) = idx * sizeof(ElfRel); *(u32 *)(ent + 12) = ctx.plt->shdr.sh_addr - sym.get_plt_addr(ctx) - 16; } template <> void PltSection::copy_buf(Context &ctx) { u8 *buf = ctx.buf + this->shdr.sh_offset; write_plt_header(ctx, buf); for (i64 i = 0; i < symbols.size(); i++) write_plt_entry(ctx, buf, *symbols[i], i); } template <> void PltGotSection::copy_buf(Context &ctx) { u8 *buf = ctx.buf + this->shdr.sh_offset; if (ctx.arg.pic) { static const u8 data[] = { 0xff, 0xa3, 0, 0, 0, 0, // jmp *foo@GOT(%ebx) 0x66, 0x90, // nop }; for (i64 i = 0; i < symbols.size(); i++) { u8 *ent = buf + i * sizeof(data); memcpy(ent, data, sizeof(data)); *(u32 *)(ent + 2) = symbols[i]->get_got_addr(ctx) - ctx.gotplt->shdr.sh_addr; } } else { static const u8 data[] = { 0xff, 0x25, 0, 0, 0, 0, // jmp *foo@GOT 0x66, 0x90, // nop }; for (i64 i = 0; i < symbols.size(); i++) { u8 *ent = buf + i * sizeof(data); memcpy(ent, data, sizeof(data)); *(u32 *)(ent + 2) = symbols[i]->get_got_addr(ctx); } } } template <> void EhFrameSection::apply_reloc(Context &ctx, ElfRel &rel, u64 loc, u64 val) { u8 *base = ctx.buf + this->shdr.sh_offset; switch (rel.r_type) { case R_386_NONE: return; case R_386_32: *(u32 *)(base + loc) = val; return; case R_386_PC32: *(u32 *)(base + loc) = val - this->shdr.sh_addr - loc; return; } unreachable(); } template <> void InputSection::apply_reloc_alloc(Context &ctx, u8 *base) { ElfRel *dynrel = nullptr; std::span> rels = get_rels(ctx); i64 frag_idx = 0; if (ctx.reldyn) dynrel = (ElfRel *)(ctx.buf + ctx.reldyn->shdr.sh_offset + file.reldyn_offset + this->reldyn_offset); for (i64 i = 0; i < rels.size(); i++) { const ElfRel &rel = rels[i]; if (rel.r_type == R_386_NONE) continue; Symbol &sym = *file.symbols[rel.r_sym]; u8 *loc = base + rel.r_offset; const SectionFragmentRef *frag_ref = nullptr; if (rel_fragments && rel_fragments[frag_idx].idx == i) frag_ref = &rel_fragments[frag_idx++]; auto overflow_check = [&](i64 val, i64 lo, i64 hi) { if (val < lo || hi <= val) Error(ctx) << *this << ": relocation " << rel << " against " << sym << " out of range: " << val << " is not in [" << lo << ", " << hi << ")"; }; auto write8 = [&](u64 val) { overflow_check(val, 0, 1 << 8); *loc = val; }; auto write8s = [&](u64 val) { overflow_check(val, -(1 << 7), 1 << 7); *loc = val; }; auto write16 = [&](u64 val) { overflow_check(val, 0, 1 << 16); *(u16 *)loc = val; }; auto write16s = [&](u64 val) { overflow_check(val, -(1 << 15), 1 << 15); *(u16 *)loc = val; }; auto write32 = [&](u64 val) { *(u32 *)loc = val; }; #define S (frag_ref ? frag_ref->frag->get_addr(ctx) : sym.get_addr(ctx)) #define A (frag_ref ? frag_ref->addend : this->get_addend(rel)) #define P (output_section->shdr.sh_addr + offset + rel.r_offset) #define G (sym.get_got_addr(ctx) - ctx.got->shdr.sh_addr) #define GOTPLT ctx.gotplt->shdr.sh_addr if (needs_dynrel[i]) { *dynrel++ = {P, R_386_32, (u32)sym.get_dynsym_idx(ctx)}; write32(A); continue; } if (needs_baserel[i]) { if (!is_relr_reloc(ctx, rel)) *dynrel++ = {P, R_386_RELATIVE, 0}; write32(S + A); continue; } switch (rel.r_type) { case R_386_8: write8(S + A); continue; case R_386_16: write16(S + A); continue; case R_386_32: write32(S + A); continue; case R_386_PC8: write8s(S + A); continue; case R_386_PC16: write16s(S + A); continue; case R_386_PC32: case R_386_PLT32: write32(S + A - P); continue; case R_386_GOT32: case R_386_GOT32X: write32(sym.get_got_addr(ctx) + A - GOTPLT); continue; case R_386_GOTOFF: write32(S + A - GOTPLT); continue; case R_386_GOTPC: write32(GOTPLT + A - P); continue; case R_386_TLS_GOTIE: write32(sym.get_gottp_addr(ctx) + A - GOTPLT); continue; case R_386_TLS_LE: write32(S + A - ctx.tls_end); continue; case R_386_TLS_IE: write32(sym.get_gottp_addr(ctx) + A); continue; case R_386_TLS_GD: write32(sym.get_tlsgd_addr(ctx) + A - GOTPLT); continue; case R_386_TLS_LDM: write32(ctx.got->get_tlsld_addr(ctx) + A - GOTPLT); continue; case R_386_TLS_LDO_32: write32(S + A - ctx.tls_begin); continue; case R_386_SIZE32: write32(sym.esym().st_size + A); continue; case R_386_TLS_GOTDESC: if (sym.get_tlsdesc_idx(ctx) == -1) { static const u8 insn[] = { 0x8d, 0x05, 0, 0, 0, 0, // lea 0, %eax }; memcpy(loc - 2, insn, sizeof(insn)); write32(S + A - ctx.tls_end); } else { write32(sym.get_tlsdesc_addr(ctx) + A - GOTPLT); } continue; case R_386_TLS_DESC_CALL: if (ctx.arg.relax && !ctx.arg.shared) { // call *(%rax) -> nop loc[0] = 0x66; loc[1] = 0x90; } continue; default: unreachable(); } #undef S #undef A #undef P #undef G #undef GOTPLT } } template <> void InputSection::apply_reloc_nonalloc(Context &ctx, u8 *base) { std::span> rels = get_rels(ctx); i64 frag_idx = 0; for (i64 i = 0; i < rels.size(); i++) { const ElfRel &rel = rels[i]; if (rel.r_type == R_386_NONE) continue; Symbol &sym = *file.symbols[rel.r_sym]; u8 *loc = base + rel.r_offset; if (!sym.file) { report_undef(ctx, sym); continue; } SectionFragment *frag; i64 addend; std::tie(frag, addend) = get_fragment(ctx, rel); auto overflow_check = [&](i64 val, i64 lo, i64 hi) { if (val < lo || hi <= val) Error(ctx) << *this << ": relocation " << rel << " against " << sym << " out of range: " << val << " is not in [" << lo << ", " << hi << ")"; }; auto write8 = [&](u64 val) { overflow_check(val, 0, 1 << 8); *loc = val; }; auto write8s = [&](u64 val) { overflow_check(val, -(1 << 7), 1 << 7); *loc = val; }; auto write16 = [&](u64 val) { overflow_check(val, 0, 1 << 16); *(u16 *)loc = val; }; auto write16s = [&](u64 val) { overflow_check(val, -(1 << 15), 1 << 15); *(u16 *)loc = val; }; #define S (frag ? frag->get_addr(ctx) : sym.get_addr(ctx)) #define A (frag ? addend : this->get_addend(rel)) #define G (sym.get_got_addr(ctx) - ctx.got->shdr.sh_addr) #define GOTPLT ctx.gotplt->shdr.sh_addr switch (rel.r_type) { case R_386_8: write8(S + A); continue; case R_386_16: write16(S + A); continue; case R_386_32: *(u32 *)loc = S + A; continue; case R_386_PC8: write8s(S + A); continue; case R_386_PC16: write16s(S + A); continue; case R_386_PC32: *(u32 *)loc = S + A; continue; case R_386_GOTPC: *(u32 *)loc = GOTPLT + A; continue; case R_386_GOTOFF: *(u32 *)loc = S + A - GOTPLT; continue; case R_386_TLS_LDO_32: *(u32 *)loc = S + A - ctx.tls_begin; continue; case R_386_SIZE32: *(u32 *)loc = sym.esym().st_size + A; continue; default: unreachable(); } #undef S #undef A #undef GOTPLT } } template <> void InputSection::scan_relocations(Context &ctx) { assert(shdr.sh_flags & SHF_ALLOC); this->reldyn_offset = file.num_dynrel * sizeof(ElfRel); std::span> rels = get_rels(ctx); // Scan relocations for (i64 i = 0; i < rels.size(); i++) { const ElfRel &rel = rels[i]; if (rel.r_type == R_386_NONE) continue; Symbol &sym = *file.symbols[rel.r_sym]; if (!sym.file) { report_undef(ctx, sym); continue; } if (sym.get_type() == STT_GNU_IFUNC) { sym.flags |= NEEDS_GOT; sym.flags |= NEEDS_PLT; } switch (rel.r_type) { case R_386_8: case R_386_16: { Action table[][4] = { // Absolute Local Imported data Imported code { NONE, ERROR, ERROR, ERROR }, // DSO { NONE, ERROR, ERROR, ERROR }, // PIE { NONE, NONE, COPYREL, PLT }, // PDE }; dispatch(ctx, table, i, rel, sym); break; } case R_386_32: { Action table[][4] = { // Absolute Local Imported data Imported code { NONE, BASEREL, DYNREL, DYNREL }, // DSO { NONE, BASEREL, DYNREL, DYNREL }, // PIE { NONE, NONE, COPYREL, PLT }, // PDE }; dispatch(ctx, table, i, rel, sym); break; } case R_386_PC8: case R_386_PC16: { Action table[][4] = { // Absolute Local Imported data Imported code { ERROR, NONE, ERROR, ERROR }, // DSO { ERROR, NONE, COPYREL, PLT }, // PIE { NONE, NONE, COPYREL, PLT }, // PDE }; dispatch(ctx, table, i, rel, sym); break; } case R_386_PC32: { Action table[][4] = { // Absolute Local Imported data Imported code { BASEREL, NONE, DYNREL, DYNREL }, // DSO { BASEREL, NONE, COPYREL, PLT }, // PIE { NONE, NONE, COPYREL, PLT }, // PDE }; dispatch(ctx, table, i, rel, sym); break; } case R_386_GOT32: case R_386_GOT32X: case R_386_GOTPC: sym.flags |= NEEDS_GOT; break; case R_386_PLT32: if (sym.is_imported) sym.flags |= NEEDS_PLT; break; case R_386_TLS_GOTIE: case R_386_TLS_LE: case R_386_TLS_IE: sym.flags |= NEEDS_GOTTP; break; case R_386_TLS_GD: sym.flags |= NEEDS_TLSGD; break; case R_386_TLS_LDM: sym.flags |= NEEDS_TLSLD; break; case R_386_TLS_GOTDESC: if (!ctx.arg.relax || ctx.arg.shared) sym.flags |= NEEDS_TLSDESC; break; case R_386_GOTOFF: case R_386_TLS_LDO_32: case R_386_SIZE32: case R_386_TLS_DESC_CALL: break; default: Error(ctx) << *this << ": unknown relocation: " << rel; } } } } // namespace mold::elf