simonhf · October 28, 2023 05:30
diff --git a/_libarchive-read-blocking.md b/_libarchive-read-blocking.md
diff --git a/example.cpp b/example.cpp
 // libstd
 #include <iostream>
 #include <vector>
 #include <string>
 #include <unistd.h>
 #include <fcntl.h>

 // libarchive
 #include <archive.h>
 #include <archive_entry.h>

 // State shared with the libarchiveRead() callback through libarchive's
 // client_data pointer: one in-memory block holding the archive bytes.
 struct mydata
 {
    // Start of the archive bytes; the struct does not own this memory.
    char* data = nullptr;
    // Number of bytes available at `data`.
    la_ssize_t size = 0;
 };

 // libarchive read callback: hands the whole in-memory buffer described by
 // `client_data` (a mydata*) to libarchive exactly once.
 //
 // a            archive handle making the request (unused here)
 // client_data  the mydata* that was registered with archive_read_open()
 // block        receives the address of the bytes being handed over
 //
 // Returns the number of bytes made available through *block. Once the buffer
 // has been handed over, every later call returns 0, which is how a read
 // callback reports end-of-file. Without that, the same bytes would be offered
 // again on each call and the input would never end.
 la_ssize_t libarchiveRead(struct archive* a, void* client_data, const void** block)
 {
    (void)a;
    std::cout << "calling custom read().." << std::endl;
    mydata *current_data = static_cast<mydata*>(client_data);
    *block = current_data->data;

    const la_ssize_t handed_over = current_data->size;
    current_data->size = 0; // nothing left: the next call reports EOF
    return handed_over;
 }

 int main(int argc, char** argv) {

    if(argc < 3)
    {
        std::cout << argv[0] << "{-r | -w} file[s]" << std::endl;
        return 1;
    }

    std::vector<std::string> filenames;
    filenames.reserve(argc);

    while (*++argv != nullptr)
    {
        filenames.emplace_back(*argv);
    }

    bool modeRead = (filenames[0] == "-r");

    // archive related variables
    struct archive *archive;

    char buff_archive[1024 * 1024];

    // archive entry/file variables
    struct archive_entry *entry;
    struct stat st;

    char buff_entry[1024 * 1024];
    int len;
    int fd;

    if(modeRead)
    {
        std::cout << "Attempting to open " << filenames[1] << std::endl;

        fd = open(filenames[1].c_str(), O_RDONLY);
        len = read(fd, buff_archive, sizeof(buff_archive));

        archive = archive_read_new();
        archive_read_support_format_all(archive);
        archive_read_support_filter_all(archive);

        #ifdef FROM_STREAM

            mydata *client_data = new mydata();

            client_data->data = buff_archive;
            client_data->size = len;

            std::cout << "calling archive_read_open.." << std::endl;
            int res = archive_read_open(archive,
                                        client_data,
                                        nullptr,
                                        (archive_read_callback*)libarchiveRead,
                                        nullptr);

        #else
            std::cout << "calling archive_read_open_memory.." << std::endl;
            int res = archive_read_open_memory(archive, buff_archive, len);

        #endif

        int flags = 0;
        flags = ARCHIVE_EXTRACT_TIME;
        flags |= ARCHIVE_EXTRACT_PERM;
        flags |= ARCHIVE_EXTRACT_ACL;
        flags |= ARCHIVE_EXTRACT_FFLAGS;

        res = archive_read_next_header(archive, &(entry));

        while(res == ARCHIVE_OK) {
            std::cout << "Extracting " << archive_entry_pathname(entry) << "..." << std::endl;
            // extract current entry
            archive_read_extract(archive, entry, flags);
            // read next if available
            res = archive_read_next_header(archive, &(entry));
        }

        archive_read_close(archive);
        archive_read_free(archive);
        close(fd);
    }
    else
    {
        archive = archive_write_new(); // initializes a new archive
        archive_write_add_filter_gzip(archive); // gzips incoming data
        archive_write_set_format_pax_restricted(archive); // only use extensions when necessary
        archive_write_set_bytes_per_block(archive, 8192);
        archive_write_open_filename(archive, "test.tar.gz");

        for (auto const& value: filenames){
            std::cout << "Compressing " << value << "...\n";
            stat(value.c_str(), &st);
            if(entry == nullptr){
                entry = archive_entry_new();
            }
            else
            {
                archive_entry_clear(entry);
            }

            // the following attributes are mandatory
            archive_entry_set_pathname(entry, value.c_str());
            archive_entry_set_size(entry, st.st_size);
            archive_entry_set_filetype(entry, st.st_mode);

            archive_write_header(archive, entry);

            fd = open(value.c_str(), O_RDONLY);
            len = read(fd, buff_entry, sizeof(buff_entry));
            while ( len > 0 ) {
                archive_write_data(archive, buff_entry, len);
                len = read(fd, buff_entry, sizeof(buff_entry));
            }
            close(fd);
        }

        // done looping over files
        archive_entry_free(entry);

        archive_write_close(archive);
        archive_write_free(archive);
    }

    return 0;

 }
diff --git a/example2.cpp b/example2.cpp
 // libstd
 #include <iostream>
 #include <vector>
 #include <string>
 #include <unistd.h>
 #include <fcntl.h>

 // libarchive
 #include <archive.h>
 #include <archive_entry.h>

 // Converts between an integer id and a pointer by going through uintptr_t, so
 // a small id can travel in libarchive's void* client_data slot and be read back.
 #define CAST(TYPE, PTR) ((TYPE)(uintptr_t)(PTR))

 // Capacity in bytes of each per-archive buffer in id_buff_archive.
 #define BUFF_ARCHIVE_LEN (2 * 1024 * 1024)

 // Number of slots in every id_* array below.
 #define ID_MAX (2)

 // Per-archive state; every array is indexed by the archive id.
 int    id_buff_archive_used[ID_MAX]; // result of the read() that filled id_buff_archive[id]
 char   id_buff_archive[ID_MAX][BUFF_ARCHIVE_LEN]; // raw archive file contents
 char * id_chunk_addr[ID_MAX]; // start of the next chunk libarchiveRead() hands out
 int    id_chunk_left[ID_MAX]; // bytes libarchiveRead() has not handed out yet
 int    id_chunk_size[ID_MAX]; // upper bound on the bytes handed out per callback
 int    id_chunk_num [ID_MAX]; // number of libarchiveRead() calls so far
 int    id_chunk_todo[ID_MAX]; // non-zero while the archive still has entries to extract

 struct archive       * id_archive[ID_MAX]; // libarchive handle per id
 struct archive_entry * id_entry[ID_MAX] = {nullptr}; // entry currently being processed per id

 // libarchive read callback that feeds archive `id` to libarchive in chunks.
 //
 // a            archive handle making the request (unused here)
 // client_data  the archive id, packed into the pointer with CAST()
 // chunk        receives the address of the next unread bytes for that id
 //
 // Returns the number of bytes made available through *chunk. That is at most
 // id_chunk_size[id], and it becomes 0 once id_chunk_left[id] reaches 0.
 // The per-id cursor (id_chunk_addr / id_chunk_left / id_chunk_num) is advanced
 // as a side effect and one trace line is printed per call.
 la_ssize_t libarchiveRead(struct archive* a, void* client_data, const void** chunk)
 {
    (void)a;
    const int id = CAST(int, client_data);
    *chunk = id_chunk_addr[id];
    la_ssize_t bytes_available = id_chunk_left[id] < id_chunk_size[id] ? id_chunk_left[id] : id_chunk_size[id];
    if ((id_chunk_num[id] < 3) && (id_chunk_left[id] > 123)) { // special business logic to cause archive_read_open() to call this callback multiple times
        bytes_available = 7;
    }
    id_chunk_left[id] -= bytes_available;
    id_chunk_addr[id] += bytes_available;
    id_chunk_num [id] ++;
    // la_ssize_t is not `long` on every platform, so convert explicitly to match %ld.
    printf("%d=id   - libarchiveRead() {} = %'ld=bytes_available // callback\n", id, static_cast<long>(bytes_available));
    return bytes_available;
 }

 int main(int argc, char** argv) {
    setlocale(LC_NUMERIC, "");

    if(argc < 3)
    {
        std::cout << argv[0] << "{-r | -w} file[s]" << std::endl;
        return 1;
    }

    std::string mode = *++argv; // "-r" or "-w"
    std::vector<std::string> filenames;
    filenames.reserve(argc);

    while (*++argv != nullptr) {
        filenames.emplace_back(*argv);
    }

    // archive entry/file variables
    struct stat st;

    char buff_entry[2 * 1024 * 1024];
    int fd;

    if("-r" == mode /* read mode */) {
        printf("     - /* for each archive file: read off disk, and archive_read_open() */\n");

        int id_max = filenames.size();
        for (int id = 0; id < id_max; id ++) {
            printf("%d=id - attempting to open: %s\n", id, filenames[id].c_str());

            int fd = open(filenames[id].c_str(), O_RDONLY);
            id_buff_archive_used[id] = read(fd, &id_buff_archive[id][0], sizeof(id_buff_archive[id]));
            printf("%d=id - read %'d bytes into id_buff_archive[%d]\n", id, id_buff_archive_used[id], id);
            close(fd);

            printf("%d=id - archive_read_new() {}\n", id);
            id_archive[id] = archive_read_new();
            archive_read_support_format_all(id_archive[id]);
            archive_read_support_filter_all(id_archive[id]);

            #ifdef FROM_STREAM

            id_chunk_addr[id] = &id_buff_archive[id][0];
            id_chunk_left[id] =  id_buff_archive_used[id];
            id_chunk_size[id] = 256 * 1024;
            id_chunk_num [id] = 0;
            id_chunk_todo[id] = 1;

            printf("%d=id - archive_read_open() {\n", id);
            int res = archive_read_open(id_archive[id], CAST(void *, id), nullptr, (archive_read_callback*)libarchiveRead, nullptr);
            printf("%d=id   } = %s\n", id,
                res == ARCHIVE_OK  ? "ARCHIVE_OK"  :
                res == ARCHIVE_EOF ? "ARCHIVE_EOF" : "ERROR: UNKNOWN");

            #else

            std::cout << "calling archive_read_open_memory.." << std::endl;
            int res = archive_read_open_memory(id_archive[id], &id_buff_archive[id][0], id_buff_archive_used[id]);

            #endif
        }

        int flags = 0;
        flags  = ARCHIVE_EXTRACT_TIME;
        flags |= ARCHIVE_EXTRACT_PERM;
        flags |= ARCHIVE_EXTRACT_ACL;
        flags |= ARCHIVE_EXTRACT_FFLAGS;

        int filenames_unpacked = 0;
        while (filenames_unpacked < id_max) {
            printf("     - /* for each archive file: archive_read_next_header() and archive_read_extract() */\n");
            for (int id = 0; id < id_max; id ++) {
                if (id_chunk_todo[id]) {
                    int res = archive_read_next_header(id_archive[id], &(id_entry[id]));
                    printf("%d=id - archive_read_next_header() {} = %s\n", id,
                        res == ARCHIVE_OK  ? "ARCHIVE_OK"  :
                        res == ARCHIVE_EOF ? "ARCHIVE_EOF" : "ERROR: UNKNOWN");

                    if (ARCHIVE_EOF == res) {
                        id_chunk_todo[id] = 0;
                        filenames_unpacked ++;
                    }
                    else {
                        printf("%d=id - archive_entry_pathname(entry) {} = %s // file to extract\n", id, archive_entry_pathname(id_entry[id]));

                        printf("%d=id - archive_read_extract() {\n", id);
                        res = archive_read_extract(id_archive[id], id_entry[id], flags);
                        printf("%d=id   } = %s\n", id,
                            res == ARCHIVE_OK  ? "ARCHIVE_OK"  :
                            res == ARCHIVE_EOF ? "ARCHIVE_EOF" : "ERROR: UNKNOWN");
                    }
                }
            }
        }

        printf("     - /* for each archive file: archive_read_close() and archive_read_free() */\n");

        for (int id = 0; id < id_max; id ++) {
            printf("%d=id - archive_read_close() {}\n", id);
            archive_read_close(id_archive[id]);

            printf("%d=id - archive_read_free() {}\n", id);
            archive_read_free(id_archive[id]);
        }
    }
    else {
        int id = 0;

        id_archive[id] = archive_write_new(); // initializes a new archive
        archive_write_add_filter_gzip(id_archive[id]); // gzips incoming data
        archive_write_set_format_pax_restricted(id_archive[id]); // only use extensions when necessary
        archive_write_set_bytes_per_block(id_archive[id], 8192);
        archive_write_open_filename(id_archive[id], "test.tar.gz");

        for (auto const& value: filenames) {
            printf("- compressing: %s\n", value.c_str());
            stat(value.c_str(), &st);
            if(id_entry[id] == nullptr) {
                printf("- archive_entry_new() {}\n");
                id_entry[id] = archive_entry_new();
            }
            else {
                printf("- archive_entry_clear() {}\n");
                archive_entry_clear(id_entry[id]);
            }

            // the following attributes are mandatory
            archive_entry_set_pathname(id_entry[id], value.c_str());
            archive_entry_set_size(id_entry[id], st.st_size);
            archive_entry_set_filetype(id_entry[id], st.st_mode);

            archive_write_header(id_archive[id], id_entry[id]);

            fd = open(value.c_str(), O_RDONLY);
            int len = read(fd, buff_entry, sizeof(buff_entry));
            printf("- read() = %d\n", len);
            while ( len > 0 ) {
                archive_write_data(id_archive[id], buff_entry, len);
                len = read(fd, buff_entry, sizeof(buff_entry));
                printf("- read() = %d\n", len);
            }
            close(fd);
        }

        // done looping over files
        archive_entry_free(id_entry[id]);

        archive_write_close(id_archive[id]);
        archive_write_free(id_archive[id]);
    }

    return 0;

 }
	// libstd
	#include <iostream>
	#include <vector>
	#include <string>
	#include <unistd.h>
	#include <fcntl.h>

	// libarchive
	#include <archive.h>
	#include <archive_entry.h>

	// State shared with the libarchiveRead() callback through libarchive's
	// client_data pointer: one in-memory block holding the archive bytes.
	struct mydata
	{
	    // Start of the archive bytes; the struct does not own this memory.
	    char* data = nullptr;
	    // Number of bytes available at `data`.
	    la_ssize_t size = 0;
	};

	// libarchive read callback: hands the whole in-memory buffer described by
	// `client_data` (a mydata*) to libarchive exactly once.
	//
	// a            archive handle making the request (unused here)
	// client_data  the mydata* that was registered with archive_read_open()
	// block        receives the address of the bytes being handed over
	//
	// Returns the number of bytes made available through *block. Once the buffer
	// has been handed over, every later call returns 0, which is how a read
	// callback reports end-of-file. Without that, the same bytes would be offered
	// again on each call and the input would never end.
	la_ssize_t libarchiveRead(struct archive* a, void* client_data, const void** block)
	{
	    (void)a;
	    std::cout << "calling custom read().." << std::endl;
	    // client_data must be treated as a pointer: `->` is used on it below.
	    mydata *current_data = static_cast<mydata*>(client_data);
	    *block = current_data->data;

	    const la_ssize_t handed_over = current_data->size;
	    current_data->size = 0; // nothing left: the next call reports EOF
	    return handed_over;
	}

	int main(int argc, char** argv) {

	if(argc < 3)
	{
	std::cout << argv[0] << "{-r \| -w} file[s]" << std::endl;
	return 1;
	}

	std::vector<std::string> filenames;
	filenames.reserve(argc);

	while (*++argv != nullptr)
	{
	filenames.emplace_back(*argv);
	}

	bool modeRead = (filenames[0] == "-r");

	// archive related variables
	struct archive *archive;

	char buff_archive[1024 * 1024];

	// archive entry/file variables
	struct archive_entry *entry;
	struct stat st;

	char buff_entry[1024 * 1024];
	int len;
	int fd;

	if(modeRead)
	{
	std::cout << "Attempting to open " << filenames[1] << std::endl;

	fd = open(filenames[1].c_str(), O_RDONLY);
	len = read(fd, buff_archive, sizeof(buff_archive));

	archive = archive_read_new();
	archive_read_support_format_all(archive);
	archive_read_support_filter_all(archive);

	#ifdef FROM_STREAM

	mydata *client_data = new mydata();

	client_data->data = buff_archive;
	client_data->size = len;

	std::cout << "calling archive_read_open.." << std::endl;
	int res = archive_read_open(archive,
	client_data,
	nullptr,
	(archive_read_callback*)libarchiveRead,
	nullptr);

	#else
	std::cout << "calling archive_read_open_memory.." << std::endl;
	int res = archive_read_open_memory(archive, buff_archive, len);

	#endif

	int flags = 0;
	flags = ARCHIVE_EXTRACT_TIME;
	flags \|= ARCHIVE_EXTRACT_PERM;
	flags \|= ARCHIVE_EXTRACT_ACL;
	flags \|= ARCHIVE_EXTRACT_FFLAGS;

	res = archive_read_next_header(archive, &(entry));

	while(res == ARCHIVE_OK) {
	std::cout << "Extracting " << archive_entry_pathname(entry) << "..." << std::endl;
	// extract current entry
	archive_read_extract(archive, entry, flags);
	// read next if available
	res = archive_read_next_header(archive, &(entry));
	}

	archive_read_close(archive);
	archive_read_free(archive);
	close(fd);
	}
	else
	{
	archive = archive_write_new(); // initializes a new archive
	archive_write_add_filter_gzip(archive); // gzips incoming data
	archive_write_set_format_pax_restricted(archive); // only use extensions when necessary
	archive_write_set_bytes_per_block(archive, 8192);
	archive_write_open_filename(archive, "test.tar.gz");

	for (auto const& value: filenames){
	std::cout << "Compressing " << value << "...\n";
	stat(value.c_str(), &st);
	if(entry == nullptr){
	entry = archive_entry_new();
	}
	else
	{
	archive_entry_clear(entry);
	}

	// the following attributes are mandatory
	archive_entry_set_pathname(entry, value.c_str());
	archive_entry_set_size(entry, st.st_size);
	archive_entry_set_filetype(entry, st.st_mode);

	archive_write_header(archive, entry);

	fd = open(value.c_str(), O_RDONLY);
	len = read(fd, buff_entry, sizeof(buff_entry));
	while ( len > 0 ) {
	archive_write_data(archive, buff_entry, len);
	len = read(fd, buff_entry, sizeof(buff_entry));
	}
	close(fd);
	}

	// done looping over files
	archive_entry_free(entry);

	archive_write_close(archive);
	archive_write_free(archive);
	}

	return 0;

	}