1caf54c4fSMartin Matuska /*- 2caf54c4fSMartin Matuska * Copyright (c) 2003-2007 Tim Kientzle 3caf54c4fSMartin Matuska * All rights reserved. 4caf54c4fSMartin Matuska * 5caf54c4fSMartin Matuska * Redistribution and use in source and binary forms, with or without 6caf54c4fSMartin Matuska * modification, are permitted provided that the following conditions 7caf54c4fSMartin Matuska * are met: 8caf54c4fSMartin Matuska * 1. Redistributions of source code must retain the above copyright 9caf54c4fSMartin Matuska * notice, this list of conditions and the following disclaimer. 10caf54c4fSMartin Matuska * 2. Redistributions in binary form must reproduce the above copyright 11caf54c4fSMartin Matuska * notice, this list of conditions and the following disclaimer in the 12caf54c4fSMartin Matuska * documentation and/or other materials provided with the distribution. 13caf54c4fSMartin Matuska * 14caf54c4fSMartin Matuska * THIS SOFTWARE IS PROVIDED BY THE AUTHOR(S) ``AS IS'' AND ANY EXPRESS OR 15caf54c4fSMartin Matuska * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES 16caf54c4fSMartin Matuska * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. 17caf54c4fSMartin Matuska * IN NO EVENT SHALL THE AUTHOR(S) BE LIABLE FOR ANY DIRECT, INDIRECT, 18caf54c4fSMartin Matuska * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT 19caf54c4fSMartin Matuska * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, 20caf54c4fSMartin Matuska * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY 21caf54c4fSMartin Matuska * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT 22caf54c4fSMartin Matuska * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF 23caf54c4fSMartin Matuska * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 24caf54c4fSMartin Matuska */ 25caf54c4fSMartin Matuska 26f9762417SMartin Matuska #ifndef ARCHIVE_READ_PRIVATE_H_INCLUDED 27f9762417SMartin Matuska #define ARCHIVE_READ_PRIVATE_H_INCLUDED 28f9762417SMartin Matuska 29caf54c4fSMartin Matuska #ifndef __LIBARCHIVE_BUILD 30cdf63a70SMartin Matuska #ifndef __LIBARCHIVE_TEST 31caf54c4fSMartin Matuska #error This header is only to be used internally to libarchive. 32caf54c4fSMartin Matuska #endif 33cdf63a70SMartin Matuska #endif 34caf54c4fSMartin Matuska 35caf54c4fSMartin Matuska #include "archive.h" 36caf54c4fSMartin Matuska #include "archive_string.h" 37caf54c4fSMartin Matuska #include "archive_private.h" 38caf54c4fSMartin Matuska 39caf54c4fSMartin Matuska struct archive_read; 40caf54c4fSMartin Matuska struct archive_read_filter_bidder; 41caf54c4fSMartin Matuska struct archive_read_filter; 42caf54c4fSMartin Matuska 43*833a452eSMartin Matuska struct archive_read_filter_bidder_vtable { 44*833a452eSMartin Matuska /* Taste the upstream filter to see if we handle this. */ 45*833a452eSMartin Matuska int (*bid)(struct archive_read_filter_bidder *, 46*833a452eSMartin Matuska struct archive_read_filter *); 47*833a452eSMartin Matuska /* Initialize a newly-created filter. */ 48*833a452eSMartin Matuska int (*init)(struct archive_read_filter *); 49*833a452eSMartin Matuska /* Release the bidder's configuration data. */ 50*833a452eSMartin Matuska void (*free)(struct archive_read_filter_bidder *); 51*833a452eSMartin Matuska }; 52*833a452eSMartin Matuska 53caf54c4fSMartin Matuska /* 54caf54c4fSMartin Matuska * How bidding works for filters: 556c95142eSMartin Matuska * * The bid manager initializes the client-provided reader as the 566c95142eSMartin Matuska * first filter. 576c95142eSMartin Matuska * * It invokes the bidder for each registered filter with the 586c95142eSMartin Matuska * current head filter. 596c95142eSMartin Matuska * * The bidders can use archive_read_filter_ahead() to peek ahead 606c95142eSMartin Matuska * at the incoming data to compose their bids. 61caf54c4fSMartin Matuska * * The bid manager creates a new filter structure for the winning 62caf54c4fSMartin Matuska * bidder and gives the winning bidder a chance to initialize it. 636c95142eSMartin Matuska * * The new filter becomes the new top filter and we repeat the 646c95142eSMartin Matuska * process. 656c95142eSMartin Matuska * This ends only when no bidder provides a non-zero bid. Then 666c95142eSMartin Matuska * we perform a similar dance with the registered format handlers. 67caf54c4fSMartin Matuska */ 68caf54c4fSMartin Matuska struct archive_read_filter_bidder { 69caf54c4fSMartin Matuska /* Configuration data for the bidder. */ 70caf54c4fSMartin Matuska void *data; 71acc60b03SMartin Matuska /* Name of the filter */ 72acc60b03SMartin Matuska const char *name; 73*833a452eSMartin Matuska const struct archive_read_filter_bidder_vtable *vtable; 74*833a452eSMartin Matuska }; 75*833a452eSMartin Matuska 76*833a452eSMartin Matuska struct archive_read_filter_vtable { 77*833a452eSMartin Matuska /* Return next block. */ 78*833a452eSMartin Matuska ssize_t (*read)(struct archive_read_filter *, const void **); 79*833a452eSMartin Matuska /* Close (just this filter) and free(self). */ 80*833a452eSMartin Matuska int (*close)(struct archive_read_filter *self); 81*833a452eSMartin Matuska /* Read any header metadata if available. */ 82*833a452eSMartin Matuska int (*read_header)(struct archive_read_filter *self, struct archive_entry *entry); 83caf54c4fSMartin Matuska }; 84caf54c4fSMartin Matuska 85caf54c4fSMartin Matuska /* 86caf54c4fSMartin Matuska * This structure is allocated within the archive_read core 87caf54c4fSMartin Matuska * and initialized by archive_read and the init() method of the 88caf54c4fSMartin Matuska * corresponding bidder above. 89caf54c4fSMartin Matuska */ 90caf54c4fSMartin Matuska struct archive_read_filter { 916c95142eSMartin Matuska int64_t position; 92caf54c4fSMartin Matuska /* Essentially all filters will need these values, so 93caf54c4fSMartin Matuska * just declare them here. */ 94caf54c4fSMartin Matuska struct archive_read_filter_bidder *bidder; /* My bidder. */ 95caf54c4fSMartin Matuska struct archive_read_filter *upstream; /* Who I read from. */ 96caf54c4fSMartin Matuska struct archive_read *archive; /* Associated archive. */ 97*833a452eSMartin Matuska const struct archive_read_filter_vtable *vtable; 98caf54c4fSMartin Matuska /* My private data. */ 99caf54c4fSMartin Matuska void *data; 100caf54c4fSMartin Matuska 101caf54c4fSMartin Matuska const char *name; 102caf54c4fSMartin Matuska int code; 103*833a452eSMartin Matuska int can_skip; 104*833a452eSMartin Matuska int can_seek; 105caf54c4fSMartin Matuska 106caf54c4fSMartin Matuska /* Used by reblocking logic. */ 107caf54c4fSMartin Matuska char *buffer; 108caf54c4fSMartin Matuska size_t buffer_size; 109caf54c4fSMartin Matuska char *next; /* Current read location. */ 110caf54c4fSMartin Matuska size_t avail; /* Bytes in my buffer. */ 111caf54c4fSMartin Matuska const void *client_buff; /* Client buffer information. */ 112caf54c4fSMartin Matuska size_t client_total; 113caf54c4fSMartin Matuska const char *client_next; 114caf54c4fSMartin Matuska size_t client_avail; 115caf54c4fSMartin Matuska char end_of_file; 1166c95142eSMartin Matuska char closed; 117caf54c4fSMartin Matuska char fatal; 118caf54c4fSMartin Matuska }; 119caf54c4fSMartin Matuska 120caf54c4fSMartin Matuska /* 121caf54c4fSMartin Matuska * The client looks a lot like a filter, so we just wrap it here. 122caf54c4fSMartin Matuska * 123caf54c4fSMartin Matuska * TODO: Make archive_read_filter and archive_read_client identical so 124caf54c4fSMartin Matuska * that users of the library can easily register their own 125caf54c4fSMartin Matuska * transformation filters. This will probably break the API/ABI and 126caf54c4fSMartin Matuska * so should be deferred at least until libarchive 3.0. 127caf54c4fSMartin Matuska */ 128acc60b03SMartin Matuska struct archive_read_data_node { 129acc60b03SMartin Matuska int64_t begin_position; 130acc60b03SMartin Matuska int64_t total_size; 131acc60b03SMartin Matuska void *data; 132acc60b03SMartin Matuska }; 133caf54c4fSMartin Matuska struct archive_read_client { 1346c95142eSMartin Matuska archive_open_callback *opener; 135caf54c4fSMartin Matuska archive_read_callback *reader; 136caf54c4fSMartin Matuska archive_skip_callback *skipper; 1376c95142eSMartin Matuska archive_seek_callback *seeker; 138caf54c4fSMartin Matuska archive_close_callback *closer; 139acc60b03SMartin Matuska archive_switch_callback *switcher; 140acc60b03SMartin Matuska unsigned int nodes; 141acc60b03SMartin Matuska unsigned int cursor; 142acc60b03SMartin Matuska int64_t position; 143acc60b03SMartin Matuska struct archive_read_data_node *dataset; 144caf54c4fSMartin Matuska }; 145cdf63a70SMartin Matuska struct archive_read_passphrase { 146cdf63a70SMartin Matuska char *passphrase; 147cdf63a70SMartin Matuska struct archive_read_passphrase *next; 148cdf63a70SMartin Matuska }; 149cdf63a70SMartin Matuska 150cdf63a70SMartin Matuska struct archive_read_extract { 151cdf63a70SMartin Matuska struct archive *ad; /* archive_write_disk object */ 152cdf63a70SMartin Matuska 153cdf63a70SMartin Matuska /* Progress function invoked during extract. */ 154cdf63a70SMartin Matuska void (*extract_progress)(void *); 155cdf63a70SMartin Matuska void *extract_progress_user_data; 156cdf63a70SMartin Matuska }; 157caf54c4fSMartin Matuska 158caf54c4fSMartin Matuska struct archive_read { 159caf54c4fSMartin Matuska struct archive archive; 160caf54c4fSMartin Matuska 161caf54c4fSMartin Matuska struct archive_entry *entry; 162caf54c4fSMartin Matuska 163caf54c4fSMartin Matuska /* Dev/ino of the archive being read/written. */ 1646c95142eSMartin Matuska int skip_file_set; 165fd082e96SMartin Matuska int64_t skip_file_dev; 166fd082e96SMartin Matuska int64_t skip_file_ino; 167caf54c4fSMartin Matuska 168acc60b03SMartin Matuska /* Callbacks to open/read/write/close client archive streams. */ 169caf54c4fSMartin Matuska struct archive_read_client client; 170caf54c4fSMartin Matuska 171caf54c4fSMartin Matuska /* Registered filter bidders. */ 172cdf63a70SMartin Matuska struct archive_read_filter_bidder bidders[16]; 173caf54c4fSMartin Matuska 174caf54c4fSMartin Matuska /* Last filter in chain */ 175caf54c4fSMartin Matuska struct archive_read_filter *filter; 176caf54c4fSMartin Matuska 177acc60b03SMartin Matuska /* Whether to bypass filter bidding process */ 178acc60b03SMartin Matuska int bypass_filter_bidding; 179acc60b03SMartin Matuska 180caf54c4fSMartin Matuska /* File offset of beginning of most recently-read header. */ 1816c95142eSMartin Matuska int64_t header_position; 182caf54c4fSMartin Matuska 183acc60b03SMartin Matuska /* Nodes and offsets of compressed data block */ 184acc60b03SMartin Matuska unsigned int data_start_node; 185acc60b03SMartin Matuska unsigned int data_end_node; 186acc60b03SMartin Matuska 187caf54c4fSMartin Matuska /* 188caf54c4fSMartin Matuska * Format detection is mostly the same as compression 189caf54c4fSMartin Matuska * detection, with one significant difference: The bidders 190caf54c4fSMartin Matuska * use the read_ahead calls above to examine the stream rather 191caf54c4fSMartin Matuska * than having the supervisor hand them a block of data to 192caf54c4fSMartin Matuska * examine. 193caf54c4fSMartin Matuska */ 194caf54c4fSMartin Matuska 195caf54c4fSMartin Matuska struct archive_format_descriptor { 196caf54c4fSMartin Matuska void *data; 197caf54c4fSMartin Matuska const char *name; 1986c95142eSMartin Matuska int (*bid)(struct archive_read *, int best_bid); 199caf54c4fSMartin Matuska int (*options)(struct archive_read *, const char *key, 200caf54c4fSMartin Matuska const char *value); 201caf54c4fSMartin Matuska int (*read_header)(struct archive_read *, struct archive_entry *); 2026c95142eSMartin Matuska int (*read_data)(struct archive_read *, const void **, size_t *, int64_t *); 203caf54c4fSMartin Matuska int (*read_data_skip)(struct archive_read *); 204acc60b03SMartin Matuska int64_t (*seek_data)(struct archive_read *, int64_t, int); 205caf54c4fSMartin Matuska int (*cleanup)(struct archive_read *); 206cdf63a70SMartin Matuska int (*format_capabilties)(struct archive_read *); 207cdf63a70SMartin Matuska int (*has_encrypted_entries)(struct archive_read *); 2086c95142eSMartin Matuska } formats[16]; 209caf54c4fSMartin Matuska struct archive_format_descriptor *format; /* Active format. */ 210caf54c4fSMartin Matuska 211caf54c4fSMartin Matuska /* 212caf54c4fSMartin Matuska * Various information needed by archive_extract. 213caf54c4fSMartin Matuska */ 214cdf63a70SMartin Matuska struct archive_read_extract *extract; 215caf54c4fSMartin Matuska int (*cleanup_archive_extract)(struct archive_read *); 216cdf63a70SMartin Matuska 217cdf63a70SMartin Matuska /* 218cdf63a70SMartin Matuska * Decryption passphrase. 219cdf63a70SMartin Matuska */ 220cdf63a70SMartin Matuska struct { 221cdf63a70SMartin Matuska struct archive_read_passphrase *first; 222cdf63a70SMartin Matuska struct archive_read_passphrase **last; 223cfa49a9bSMartin Matuska int candidate; 224cdf63a70SMartin Matuska archive_passphrase_callback *callback; 225cdf63a70SMartin Matuska void *client_data; 226cdf63a70SMartin Matuska } passphrases; 227caf54c4fSMartin Matuska }; 228caf54c4fSMartin Matuska 229caf54c4fSMartin Matuska int __archive_read_register_format(struct archive_read *a, 230caf54c4fSMartin Matuska void *format_data, 231caf54c4fSMartin Matuska const char *name, 2326c95142eSMartin Matuska int (*bid)(struct archive_read *, int), 233caf54c4fSMartin Matuska int (*options)(struct archive_read *, const char *, const char *), 234caf54c4fSMartin Matuska int (*read_header)(struct archive_read *, struct archive_entry *), 2356c95142eSMartin Matuska int (*read_data)(struct archive_read *, const void **, size_t *, int64_t *), 236caf54c4fSMartin Matuska int (*read_data_skip)(struct archive_read *), 237acc60b03SMartin Matuska int64_t (*seek_data)(struct archive_read *, int64_t, int), 238cdf63a70SMartin Matuska int (*cleanup)(struct archive_read *), 239cdf63a70SMartin Matuska int (*format_capabilities)(struct archive_read *), 240cdf63a70SMartin Matuska int (*has_encrypted_entries)(struct archive_read *)); 241caf54c4fSMartin Matuska 242*833a452eSMartin Matuska int __archive_read_register_bidder(struct archive_read *a, 243*833a452eSMartin Matuska void *bidder_data, 244*833a452eSMartin Matuska const char *name, 245*833a452eSMartin Matuska const struct archive_read_filter_bidder_vtable *vtable); 246caf54c4fSMartin Matuska 247caf54c4fSMartin Matuska const void *__archive_read_ahead(struct archive_read *, size_t, ssize_t *); 248caf54c4fSMartin Matuska const void *__archive_read_filter_ahead(struct archive_read_filter *, 249caf54c4fSMartin Matuska size_t, ssize_t *); 2506c95142eSMartin Matuska int64_t __archive_read_seek(struct archive_read*, int64_t, int); 2516c95142eSMartin Matuska int64_t __archive_read_filter_seek(struct archive_read_filter *, int64_t, int); 2526c95142eSMartin Matuska int64_t __archive_read_consume(struct archive_read *, int64_t); 2536c95142eSMartin Matuska int64_t __archive_read_filter_consume(struct archive_read_filter *, int64_t); 25452c2bb75SMartin Matuska int __archive_read_header(struct archive_read *, struct archive_entry *); 255caf54c4fSMartin Matuska int __archive_read_program(struct archive_read_filter *, const char *); 256acc60b03SMartin Matuska void __archive_read_free_filters(struct archive_read *); 257cdf63a70SMartin Matuska struct archive_read_extract *__archive_read_get_extract(struct archive_read *); 258cdf63a70SMartin Matuska 259cdf63a70SMartin Matuska 260cdf63a70SMartin Matuska /* 261cdf63a70SMartin Matuska * Get a decryption passphrase. 262cdf63a70SMartin Matuska */ 263cdf63a70SMartin Matuska void __archive_read_reset_passphrase(struct archive_read *a); 264cdf63a70SMartin Matuska const char * __archive_read_next_passphrase(struct archive_read *a); 265caf54c4fSMartin Matuska #endif 266