diff options
author | Yorick van Pelt <yorick@yorickvanpelt.nl> | 2019-12-07 22:35:14 +0700 |
---|---|---|
committer | Yorick van Pelt <yorick@yorickvanpelt.nl> | 2019-12-07 22:35:14 +0700 |
commit | 9ff5f6492f46b7f3342d47f138b590f09e939865 (patch) | |
tree | ececcaddac8cc3e95e530b53b6c39103c90dcbb0 /src/libutil | |
parent | 3b9c9d34e5ede028860e919d72cc5ae33dd95443 (diff) |
libarchive proof of concept
Diffstat (limited to 'src/libutil')
-rw-r--r-- | src/libutil/local.mk | 2 | ||||
-rw-r--r-- | src/libutil/tarfile.cc | 135 | ||||
-rw-r--r-- | src/libutil/tarfile.hh | 3 |
3 files changed, 118 insertions, 22 deletions
diff --git a/src/libutil/local.mk b/src/libutil/local.mk index 35c1f6c13..16c1fa03f 100644 --- a/src/libutil/local.mk +++ b/src/libutil/local.mk @@ -6,6 +6,6 @@ libutil_DIR := $(d) libutil_SOURCES := $(wildcard $(d)/*.cc) -libutil_LDFLAGS = $(LIBLZMA_LIBS) -lbz2 -pthread $(OPENSSL_LIBS) $(LIBBROTLI_LIBS) $(BOOST_LDFLAGS) -lboost_context +libutil_LDFLAGS = $(LIBLZMA_LIBS) -lbz2 -pthread $(OPENSSL_LIBS) $(LIBBROTLI_LIBS) $(LIBARCHIVE_LIBS) $(BOOST_LDFLAGS) -lboost_context libutil_LIBS = libnixrust diff --git a/src/libutil/tarfile.cc b/src/libutil/tarfile.cc index 2cc7793fd..ab30002dd 100644 --- a/src/libutil/tarfile.cc +++ b/src/libutil/tarfile.cc @@ -1,5 +1,8 @@ #include "rust-ffi.hh" #include "compression.hh" +#include <archive.h> +#include <archive_entry.h> +#include "finally.hh" extern "C" { rust::Result<std::tuple<>> * @@ -8,29 +11,123 @@ extern "C" { namespace nix { -void unpackTarfile(Source & source, const Path & destDir) -{ - rust::Source source2(source); - rust::CBox(unpack_tarfile(source2, destDir))->unwrap(); +std::shared_ptr<struct archive> archive_read_ptr() { + return std::shared_ptr<struct archive>(archive_read_new(), + [](auto p) { + archive_read_close(p); + archive_read_free(p); + }); } - -void unpackTarfile(const Path & tarFile, const Path & destDir, - std::optional<std::string> baseName) +void archive_read_open_source(std::shared_ptr<struct archive> a, Source& s, unsigned int bufsize = 1024) { + std::shared_ptr<unsigned char> buffer((unsigned char*)malloc(bufsize), [](auto p) { free(p); }); + typedef struct { + decltype(buffer) buf; + Source& src; + unsigned int bs; + } St; + St* state = new St({buffer, s, bufsize}); + if (archive_read_open(a.get(), state, + NULL /* open */, + ([] (struct archive*, void* sptr, const void** buf) -> long int { + St& s = *(static_cast<St*>(sptr)); + *buf = s.buf.get(); + try { + return s.src.read(s.buf.get(), s.bs); + } catch (EndOfFile &) { + return 0; + } + /* TODO: I don't know what happens if anything else is thrown here */ + }), [] (struct archive*, void* sptr) { + delete static_cast<St*>(sptr); + return ARCHIVE_OK; + })) { + throw Error("archive is corrupt (%s)", archive_error_string(a.get())); + } +} +std::shared_ptr<struct archive> archive_write_ptr() { + return std::shared_ptr<struct archive>(archive_write_disk_new(), + [](auto p) { + archive_write_close(p); + archive_write_free(p); + }); +} +static void copy_data(std::shared_ptr<struct archive> ar, std::shared_ptr<struct archive> aw) { - if (!baseName) baseName = baseNameOf(tarFile); + int r; + const void *buff; + size_t size; + la_int64_t offset; - auto source = sinkToSource([&](Sink & sink) { - // FIXME: look at first few bytes to determine compression type. - auto decompressor = - // FIXME: add .gz support - hasSuffix(*baseName, ".bz2") ? makeDecompressionSink("bzip2", sink) : - hasSuffix(*baseName, ".xz") ? makeDecompressionSink("xz", sink) : - makeDecompressionSink("none", sink); - readFile(tarFile, *decompressor); - decompressor->finish(); - }); + for (;;) { + r = archive_read_data_block(ar.get(), &buff, &size, &offset); + if (r == ARCHIVE_EOF) return; + if (r < ARCHIVE_OK) { + throw Error("archive is corrupt (%s)", archive_error_string(ar.get())); + } + r = archive_write_data_block(aw.get(), buff, size, offset); + if (r < ARCHIVE_OK) { + throw Error("could not write archive output (%s)", archive_error_string(aw.get())); + } + } +} - unpackTarfile(*source, destDir); +static void extract_archive(std::shared_ptr<struct archive> a, const Path & destDir) { + char * cwd = getcwd(0, 0); + if (!cwd) throw SysError("getting current directory"); + Finally freeCwd([&]() { free(cwd); }); + int r = chdir(destDir.c_str()); + if (r != 0) throw SysError("setting directory to tar output path"); + struct archive_entry *entry; + r = archive_read_next_header(a.get(), &entry); + if (r != ARCHIVE_OK) { + throw Error("archive is corrupt (%s)", archive_error_string(a.get())); + } + int flags = 0; + auto ext = archive_write_ptr(); + flags |= ARCHIVE_EXTRACT_PERM; + flags |= ARCHIVE_EXTRACT_FFLAGS; + archive_write_disk_set_options(ext.get(), flags); + archive_write_disk_set_standard_lookup(ext.get()); + for(;;) { + r = archive_read_next_header(a.get(), &entry); + if (r == ARCHIVE_EOF) break; + if (r == ARCHIVE_WARN) { + std::cerr << "warning: " << archive_error_string(a.get()); + } else if (r < ARCHIVE_WARN) { + throw Error("archive is corrupt (%s)", archive_error_string(a.get())); + } + r = archive_write_header(ext.get(), entry); + if (r != ARCHIVE_OK) { + throw Error("could not write archive output (%s)", archive_error_string(ext.get())); + } + if (archive_entry_size(entry) > 0) { + copy_data(a, ext); + } + archive_write_finish_entry(ext.get()); + } + r = chdir(cwd); + if (r != 0) throw SysError("resetting directory after archive extraction"); +} +void unpackTarfile(Source & source, const Path & destDir) +{ + auto a = archive_read_ptr(); + archive_read_support_filter_all(a.get()); + archive_read_support_format_all(a.get()); + archive_read_open_source(a, source); + createDirs(destDir); + extract_archive(a, destDir); +} +void unpackTarfile(const Path & tarFile, const Path & destDir) +{ + auto a = archive_read_ptr(); + archive_read_support_filter_all(a.get()); + archive_read_support_format_all(a.get()); + int r = archive_read_open_filename(a.get(), tarFile.c_str(), 16384); + if (r != ARCHIVE_OK) { + throw Error("archive is corrupt (%s)", archive_error_string(a.get())); + } + createDirs(destDir); + extract_archive(a, destDir); } } diff --git a/src/libutil/tarfile.hh b/src/libutil/tarfile.hh index ce0911e2a..89a024f1d 100644 --- a/src/libutil/tarfile.hh +++ b/src/libutil/tarfile.hh @@ -4,7 +4,6 @@ namespace nix { void unpackTarfile(Source & source, const Path & destDir); -void unpackTarfile(const Path & tarFile, const Path & destDir, - std::optional<std::string> baseName = {}); +void unpackTarfile(const Path & tarFile, const Path & destDir); } |