xref: /freebsd-src/contrib/libarchive/libarchive/archive_read_private.h (revision b9128a37faafede823eb456aa65a11ac69997284)
/*-
 * Copyright (c) 2003-2007 Tim Kientzle
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR(S) ``AS IS'' AND ANY EXPRESS OR
 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
 * IN NO EVENT SHALL THE AUTHOR(S) BE LIABLE FOR ANY DIRECT, INDIRECT,
 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
 * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
 * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 */
25caf54c4fSMartin Matuska 
26f9762417SMartin Matuska #ifndef ARCHIVE_READ_PRIVATE_H_INCLUDED
27f9762417SMartin Matuska #define ARCHIVE_READ_PRIVATE_H_INCLUDED
28f9762417SMartin Matuska 
29caf54c4fSMartin Matuska #ifndef __LIBARCHIVE_BUILD
30cdf63a70SMartin Matuska #ifndef __LIBARCHIVE_TEST
31caf54c4fSMartin Matuska #error This header is only to be used internally to libarchive.
32caf54c4fSMartin Matuska #endif
33cdf63a70SMartin Matuska #endif
34caf54c4fSMartin Matuska 
35caf54c4fSMartin Matuska #include "archive.h"
36caf54c4fSMartin Matuska #include "archive_string.h"
37caf54c4fSMartin Matuska #include "archive_private.h"
38caf54c4fSMartin Matuska 
/*
 * Forward declarations.  The structures defined in this header refer
 * to one another by pointer before their full definitions appear.
 */
struct archive_read;
struct archive_read_filter_bidder;
struct archive_read_filter;
42caf54c4fSMartin Matuska 
/*
 * Table of operations supplied by a filter bidder.  A bidder points at
 * one of these tables through the const "vtable" member of
 * struct archive_read_filter_bidder.
 */
struct archive_read_filter_bidder_vtable {
	/* Taste the upstream filter to see if we handle this. */
	int (*bid)(struct archive_read_filter_bidder *,
	    struct archive_read_filter *);
	/* Initialize a newly-created filter. */
	int (*init)(struct archive_read_filter *);
	/* Release the bidder's configuration data. */
	void (*free)(struct archive_read_filter_bidder *);
};
52*833a452eSMartin Matuska 
/*
 * How bidding works for filters:
 *   * The bid manager initializes the client-provided reader as the
 *     first filter.
 *   * It invokes the bidder for each registered filter with the
 *     current head filter.
 *   * The bidders can use archive_read_filter_ahead() to peek ahead
 *     at the incoming data to compose their bids.
 *   * The bid manager creates a new filter structure for the winning
 *     bidder and gives the winning bidder a chance to initialize it.
 *   * The new filter becomes the new top filter and we repeat the
 *     process.
 * This ends only when no bidder provides a non-zero bid.  Then
 * we perform a similar dance with the registered format handlers.
 *
 * One of these structures describes a single registered bidder.
 */
struct archive_read_filter_bidder {
	/* Configuration data for the bidder. */
	void *data;
	/* Name of the filter */
	const char *name;
	/* Operations (bid/init/free) implemented by this bidder. */
	const struct archive_read_filter_bidder_vtable *vtable;
};
75*833a452eSMartin Matuska 
/*
 * Table of operations implemented by an individual filter instance.
 * A filter points at one of these tables through the const "vtable"
 * member of struct archive_read_filter.
 */
struct archive_read_filter_vtable {
	/* Return next block. */
	ssize_t (*read)(struct archive_read_filter *, const void **);
	/* Close (just this filter) and free(self). */
	int (*close)(struct archive_read_filter *self);
	/* Read any header metadata if available. */
	int (*read_header)(struct archive_read_filter *self, struct archive_entry *entry);
};
84caf54c4fSMartin Matuska 
/*
 * This structure is allocated within the archive_read core
 * and initialized by archive_read and the init() method of the
 * corresponding bidder above.
 *
 * Filters are linked through "upstream": each filter reads from the
 * filter its "upstream" member points to.
 */
struct archive_read_filter {
	int64_t position;
	/* Essentially all filters will need these values, so
	 * just declare them here. */
	struct archive_read_filter_bidder *bidder; /* My bidder. */
	struct archive_read_filter *upstream; /* Who I read from. */
	struct archive_read *archive; /* Associated archive. */
	/* Operations (read/close/read_header) for this filter. */
	const struct archive_read_filter_vtable *vtable;
	/* My private data. */
	void *data;

	const char	*name;
	int		 code;
	/* NOTE(review): presumably boolean capability flags -- confirm. */
	int		 can_skip;
	int		 can_seek;

	/* Used by reblocking logic. */
	char		*buffer;
	size_t		 buffer_size;
	char		*next;		/* Current read location. */
	size_t		 avail;		/* Bytes in my buffer. */
	const void	*client_buff;	/* Client buffer information. */
	size_t		 client_total;
	const char	*client_next;
	size_t		 client_avail;
	/* NOTE(review): the three chars below look like status flags -- confirm. */
	char		 end_of_file;
	char		 closed;
	char		 fatal;
};
119caf54c4fSMartin Matuska 
120caf54c4fSMartin Matuska /*
121caf54c4fSMartin Matuska  * The client looks a lot like a filter, so we just wrap it here.
122caf54c4fSMartin Matuska  *
123caf54c4fSMartin Matuska  * TODO: Make archive_read_filter and archive_read_client identical so
124caf54c4fSMartin Matuska  * that users of the library can easily register their own
125caf54c4fSMartin Matuska  * transformation filters.  This will probably break the API/ABI and
126caf54c4fSMartin Matuska  * so should be deferred at least until libarchive 3.0.
127caf54c4fSMartin Matuska  */
128acc60b03SMartin Matuska struct archive_read_data_node {
129acc60b03SMartin Matuska 	int64_t begin_position;
130acc60b03SMartin Matuska 	int64_t total_size;
131acc60b03SMartin Matuska 	void *data;
132acc60b03SMartin Matuska };
133caf54c4fSMartin Matuska struct archive_read_client {
1346c95142eSMartin Matuska 	archive_open_callback	*opener;
135caf54c4fSMartin Matuska 	archive_read_callback	*reader;
136caf54c4fSMartin Matuska 	archive_skip_callback	*skipper;
1376c95142eSMartin Matuska 	archive_seek_callback	*seeker;
138caf54c4fSMartin Matuska 	archive_close_callback	*closer;
139acc60b03SMartin Matuska 	archive_switch_callback *switcher;
140acc60b03SMartin Matuska 	unsigned int nodes;
141acc60b03SMartin Matuska 	unsigned int cursor;
142acc60b03SMartin Matuska 	int64_t position;
143acc60b03SMartin Matuska 	struct archive_read_data_node *dataset;
144caf54c4fSMartin Matuska };
/*
 * Node of a singly-linked list of passphrases; "next" points to the
 * following node.  The list head and tail pointers live in the
 * "passphrases" member of struct archive_read.
 */
struct archive_read_passphrase {
	char	*passphrase;
	struct archive_read_passphrase *next;
};
149cdf63a70SMartin Matuska 
/*
 * Extraction state for a reader.  struct archive_read holds a pointer
 * to one of these in its "extract" member.
 */
struct archive_read_extract {
	struct archive *ad; /* archive_write_disk object */

	/* Progress function invoked during extract. */
	void			(*extract_progress)(void *);
	/* NOTE(review): presumably the argument passed to
	 * extract_progress -- confirm against the caller. */
	void			 *extract_progress_user_data;
};
157caf54c4fSMartin Matuska 
158caf54c4fSMartin Matuska struct archive_read {
159caf54c4fSMartin Matuska 	struct archive	archive;
160caf54c4fSMartin Matuska 
161caf54c4fSMartin Matuska 	struct archive_entry	*entry;
162caf54c4fSMartin Matuska 
163caf54c4fSMartin Matuska 	/* Dev/ino of the archive being read/written. */
1646c95142eSMartin Matuska 	int		  skip_file_set;
165fd082e96SMartin Matuska 	int64_t		  skip_file_dev;
166fd082e96SMartin Matuska 	int64_t		  skip_file_ino;
167caf54c4fSMartin Matuska 
168acc60b03SMartin Matuska 	/* Callbacks to open/read/write/close client archive streams. */
169caf54c4fSMartin Matuska 	struct archive_read_client client;
170caf54c4fSMartin Matuska 
171caf54c4fSMartin Matuska 	/* Registered filter bidders. */
172cdf63a70SMartin Matuska 	struct archive_read_filter_bidder bidders[16];
173caf54c4fSMartin Matuska 
174caf54c4fSMartin Matuska 	/* Last filter in chain */
175caf54c4fSMartin Matuska 	struct archive_read_filter *filter;
176caf54c4fSMartin Matuska 
177acc60b03SMartin Matuska 	/* Whether to bypass filter bidding process */
178acc60b03SMartin Matuska 	int bypass_filter_bidding;
179acc60b03SMartin Matuska 
180caf54c4fSMartin Matuska 	/* File offset of beginning of most recently-read header. */
1816c95142eSMartin Matuska 	int64_t		  header_position;
182caf54c4fSMartin Matuska 
183acc60b03SMartin Matuska 	/* Nodes and offsets of compressed data block */
184acc60b03SMartin Matuska 	unsigned int data_start_node;
185acc60b03SMartin Matuska 	unsigned int data_end_node;
186acc60b03SMartin Matuska 
187caf54c4fSMartin Matuska 	/*
188caf54c4fSMartin Matuska 	 * Format detection is mostly the same as compression
189caf54c4fSMartin Matuska 	 * detection, with one significant difference: The bidders
190caf54c4fSMartin Matuska 	 * use the read_ahead calls above to examine the stream rather
191caf54c4fSMartin Matuska 	 * than having the supervisor hand them a block of data to
192caf54c4fSMartin Matuska 	 * examine.
193caf54c4fSMartin Matuska 	 */
194caf54c4fSMartin Matuska 
195caf54c4fSMartin Matuska 	struct archive_format_descriptor {
196caf54c4fSMartin Matuska 		void	 *data;
197caf54c4fSMartin Matuska 		const char *name;
1986c95142eSMartin Matuska 		int	(*bid)(struct archive_read *, int best_bid);
199caf54c4fSMartin Matuska 		int	(*options)(struct archive_read *, const char *key,
200caf54c4fSMartin Matuska 		    const char *value);
201caf54c4fSMartin Matuska 		int	(*read_header)(struct archive_read *, struct archive_entry *);
2026c95142eSMartin Matuska 		int	(*read_data)(struct archive_read *, const void **, size_t *, int64_t *);
203caf54c4fSMartin Matuska 		int	(*read_data_skip)(struct archive_read *);
204acc60b03SMartin Matuska 		int64_t	(*seek_data)(struct archive_read *, int64_t, int);
205caf54c4fSMartin Matuska 		int	(*cleanup)(struct archive_read *);
206cdf63a70SMartin Matuska 		int	(*format_capabilties)(struct archive_read *);
207cdf63a70SMartin Matuska 		int	(*has_encrypted_entries)(struct archive_read *);
2086c95142eSMartin Matuska 	}	formats[16];
209caf54c4fSMartin Matuska 	struct archive_format_descriptor	*format; /* Active format. */
210caf54c4fSMartin Matuska 
211caf54c4fSMartin Matuska 	/*
212caf54c4fSMartin Matuska 	 * Various information needed by archive_extract.
213caf54c4fSMartin Matuska 	 */
214cdf63a70SMartin Matuska 	struct archive_read_extract		*extract;
215caf54c4fSMartin Matuska 	int			(*cleanup_archive_extract)(struct archive_read *);
216cdf63a70SMartin Matuska 
217cdf63a70SMartin Matuska 	/*
218cdf63a70SMartin Matuska 	 * Decryption passphrase.
219cdf63a70SMartin Matuska 	 */
220cdf63a70SMartin Matuska 	struct {
221cdf63a70SMartin Matuska 		struct archive_read_passphrase *first;
222cdf63a70SMartin Matuska 		struct archive_read_passphrase **last;
223cfa49a9bSMartin Matuska 		int candidate;
224cdf63a70SMartin Matuska 		archive_passphrase_callback *callback;
225cdf63a70SMartin Matuska 		void *client_data;
226cdf63a70SMartin Matuska 	}		passphrases;
227caf54c4fSMartin Matuska };
228caf54c4fSMartin Matuska 
/*
 * Register a format handler with reader "a".
 *
 * The arguments after "a" correspond one-to-one, in order, to the
 * members of struct archive_format_descriptor: the handler's private
 * data, its name, and its callbacks (bid, options, read_header,
 * read_data, read_data_skip, seek_data, cleanup, format_capabilities,
 * has_encrypted_entries).
 *
 * NOTE(review): the return value is presumably an ARCHIVE_* status
 * code -- confirm against the definition.
 */
int	__archive_read_register_format(struct archive_read *a,
		void *format_data,
		const char *name,
		int (*bid)(struct archive_read *, int),
		int (*options)(struct archive_read *, const char *, const char *),
		int (*read_header)(struct archive_read *, struct archive_entry *),
		int (*read_data)(struct archive_read *, const void **, size_t *, int64_t *),
		int (*read_data_skip)(struct archive_read *),
		int64_t (*seek_data)(struct archive_read *, int64_t, int),
		int (*cleanup)(struct archive_read *),
		int (*format_capabilities)(struct archive_read *),
		int (*has_encrypted_entries)(struct archive_read *));
241caf54c4fSMartin Matuska 
/*
 * Register a filter bidder with reader "a".
 *
 * The arguments after "a" correspond to the members of
 * struct archive_read_filter_bidder: the bidder's configuration data,
 * the filter name, and the table of bidder operations.
 *
 * NOTE(review): the return value is presumably an ARCHIVE_* status
 * code -- confirm against the definition.
 */
int __archive_read_register_bidder(struct archive_read *a,
		void *bidder_data,
		const char *name,
		const struct archive_read_filter_bidder_vtable *vtable);
246caf54c4fSMartin Matuska 
/*
 * Internal reader helpers.  Several come in pairs: one variant takes
 * the archive_read object, the other takes a specific filter
 * (the *_filter_* functions).
 */

/* Read-ahead access to upcoming data. */
const void *__archive_read_ahead(struct archive_read *, size_t, ssize_t *);
const void *__archive_read_filter_ahead(struct archive_read_filter *,
    size_t, ssize_t *);
/* Seek and consume. */
int64_t	__archive_read_seek(struct archive_read*, int64_t, int);
int64_t	__archive_read_filter_seek(struct archive_read_filter *, int64_t, int);
int64_t	__archive_read_consume(struct archive_read *, int64_t);
int64_t	__archive_read_filter_consume(struct archive_read_filter *, int64_t);
/* Miscellaneous. */
int __archive_read_header(struct archive_read *, struct archive_entry *);
int __archive_read_program(struct archive_read_filter *, const char *);
void __archive_read_free_filters(struct archive_read *);
struct archive_read_extract *__archive_read_get_extract(struct archive_read *);
258cdf63a70SMartin Matuska 
259cdf63a70SMartin Matuska 
/*
 * Decryption passphrase access.
 *
 * NOTE(review): going by the names, __archive_read_next_passphrase()
 * yields the next passphrase to try and
 * __archive_read_reset_passphrase() restarts that iteration -- confirm
 * against the definitions.
 */
void __archive_read_reset_passphrase(struct archive_read *a);
const char * __archive_read_next_passphrase(struct archive_read *a);
265caf54c4fSMartin Matuska #endif
266