1
1
mirror of https://github.com/rui314/mold.git synced 2024-10-05 00:57:08 +03:00
mold/tar.cc

110 lines
2.9 KiB
C++
Raw Normal View History

2021-04-08 18:29:01 +03:00
#include "mold.h"
namespace mold {
2021-04-08 18:29:01 +03:00
// A tar file consists of one or more Ustar headers, each followed by data.
// Each Ustar header represents a single file in an archive.
//
// tar is an old file format, and its `name` field is only 100 bytes long.
2021-04-08 19:38:25 +03:00
// If `name` is longer than 100 bytes, we can emit a PAX header before a
// Ustar header to store a long filename.
2021-04-08 18:29:01 +03:00
//
2021-04-08 19:38:25 +03:00
// For simplicity, we always emit a PAX header even for a short filename.
2021-04-08 18:29:01 +03:00
// In-memory image of one Ustar header block. The fields are plain char
// arrays whose sizes add up to 512 bytes, so an instance can be written
// to the archive verbatim.
//
// The constructor zero-fills the whole block. Callers set the fields they
// need and then call finalize() right before writing the header out.
struct UstarHeader {
  UstarHeader() {
    memset(this, 0, sizeof(*this));
  }

  // Fills in `magic`, `version` and `checksum`. Call this after every
  // other field has been set, because the checksum covers the entire
  // block.
  void finalize() {
    // The checksum is computed as if the checksum field itself were
    // filled with spaces.
    memset(checksum, ' ', sizeof(checksum));
    memcpy(magic, "ustar", 5);
    memcpy(version, "00", 2);

    // Compute checksum: the sum of all bytes of the block, each taken as
    // an unsigned value.
    const unsigned char *begin = reinterpret_cast<const unsigned char *>(this);
    const unsigned char *end = begin + sizeof(*this);
    int sum = 0;
    for (const unsigned char *p = begin; p != end; p++)
      sum += *p;

    // The field stores six octal digits, so the sum must be below
    // 01000000 (octal). snprintf writes the digits plus a NUL, leaving
    // the last byte of the field as a space, and can never write past
    // the end of the field.
    assert(sum < 01000000);
    snprintf(checksum, sizeof(checksum), "%06o", sum);
  }

  char name[100];
  char mode[8];
  char uid[8];
  char gid[8];
  char size[12];
  char mtime[12];
  char checksum[8];
  char typeflag[1];
  char linkname[100];
  char magic[6];
  char version[2];
  char uname[32];
  char gname[32];
  char devmajor[8];
  char devminor[8];
  char prefix[155];
  char pad[12];
};
static std::string encode_path(std::string basedir, std::string path) {
2021-09-27 11:37:23 +03:00
path = path_clean(basedir + "/" + path);
2021-04-08 19:59:13 +03:00
2021-04-08 19:38:25 +03:00
// Construct a string which contains something like
// "16 path=foo/bar\n" where 16 is the size of the string
// including the size string itself.
i64 len = std::string(" path=\n").size() + path.size();
2021-04-08 18:29:01 +03:00
i64 total = std::to_string(len).size() + len;
total = std::to_string(total).size() + len;
2021-05-02 13:21:24 +03:00
return std::to_string(total) + " path=" + path + "\n";
}
2021-04-08 18:29:01 +03:00
// Creates (or truncates) the file at `output_path` and returns a writer
// that emits a tar archive into it. Returns nullptr if the file cannot
// be opened. `basedir` is forwarded to the TarWriter constructor.
std::unique_ptr<TarWriter>
TarWriter::open(std::string output_path, std::string basedir) {
  // A tar archive is binary data, so open the stream in binary mode.
  // The "b" flag has no effect on POSIX systems but prevents newline
  // translation on platforms that distinguish text and binary streams.
  FILE *out = fopen(output_path.c_str(), "wb");
  if (!out)
    return nullptr;
  return std::unique_ptr<TarWriter>(new TarWriter(out, basedir));
}
// Closes the output stream. Nothing else is written here: append()
// already writes the end-of-archive terminator after each entry.
// The result of fclose() is not checked.
TarWriter::~TarWriter() {
fclose(out);
}
2021-05-02 13:21:24 +03:00
// Appends one file to the archive. Each file is stored as a PAX extended
// header carrying the pathname, followed by a Ustar header and the file
// contents given in `data`.
//
// After the contents, the end-of-archive terminator is written and the
// stream is moved back to just before it. The next call therefore
// overwrites the terminator with a new entry. Results of the stdio calls
// are not checked.
void TarWriter::append(std::string path, std::string_view data) {
  // Write PAX header
  static_assert(sizeof(UstarHeader) == BLOCK_SIZE);
  UstarHeader pax;

  std::string attr = encode_path(basedir, path);
  // The size field holds 11 octal digits plus a NUL. Bound the write so
  // that an oversized value can never spill into the following field.
  snprintf(pax.size, sizeof(pax.size), "%011zo", attr.size());
  pax.typeflag[0] = 'x';
  pax.finalize();
  fwrite(&pax, sizeof(pax), 1, out);

  // Write pathname, then skip ahead to the next block boundary
  fwrite(attr.data(), attr.size(), 1, out);
  fseek(out, align_to(ftell(out), BLOCK_SIZE), SEEK_SET);

  // Write Ustar header
  UstarHeader ustar;
  memcpy(ustar.mode, "0000664", 8);
  snprintf(ustar.size, sizeof(ustar.size), "%011zo", data.size());
  ustar.finalize();
  fwrite(&ustar, sizeof(ustar), 1, out);

  // Write file contents, then skip ahead to the next block boundary
  fwrite(data.data(), data.size(), 1, out);
  fseek(out, align_to(ftell(out), BLOCK_SIZE), SEEK_SET);

  // A tar file must end with two empty blocks, so write such a
  // terminator and seek back to its start.
  u8 terminator[BLOCK_SIZE * 2] = {};
  fwrite(&terminator, BLOCK_SIZE * 2, 1, out);
  fseek(out, -BLOCK_SIZE * 2, SEEK_END);
  assert(ftell(out) % BLOCK_SIZE == 0);
}
} // namespace mold