archive_entry.h revision 228759
1/*-
2 * Copyright (c) 2003-2008 Tim Kientzle
3 * All rights reserved.
4 *
5 * Redistribution and use in source and binary forms, with or without
6 * modification, are permitted provided that the following conditions
7 * are met:
8 * 1. Redistributions of source code must retain the above copyright
9 *    notice, this list of conditions and the following disclaimer.
10 * 2. Redistributions in binary form must reproduce the above copyright
11 *    notice, this list of conditions and the following disclaimer in the
12 *    documentation and/or other materials provided with the distribution.
13 *
14 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR(S) ``AS IS'' AND ANY EXPRESS OR
15 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
16 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
17 * IN NO EVENT SHALL THE AUTHOR(S) BE LIABLE FOR ANY DIRECT, INDIRECT,
18 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
19 * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
20 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
21 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
22 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
23 * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
24 *
25 * $FreeBSD: head/lib/libarchive/archive_entry.h 201096 2009-12-28 02:41:27Z kientzle $
26 */
27
28#ifndef ARCHIVE_ENTRY_H_INCLUDED
29#define	ARCHIVE_ENTRY_H_INCLUDED
30
31/*
32 * Note: archive_entry.h is for use outside of libarchive; the
33 * configuration headers (config.h, archive_platform.h, etc.) are
34 * purely internal.  Do NOT use HAVE_XXX configuration macros to
35 * control the behavior of this header!  If you must conditionalize,
36 * use predefined compiler and/or platform macros.
37 */
38
39#include <sys/types.h>
40#include <stddef.h>  /* for wchar_t */
41#include <time.h>
42
43#if defined(_WIN32) && !defined(__CYGWIN__)
44#include <windows.h>
45#endif
46
47/* Get appropriate definitions of standard POSIX-style types. */
48/* These should match the types used in 'struct stat' */
49#if defined(_WIN32) && !defined(__CYGWIN__)
50#define	__LA_INT64_T	__int64
51# if defined(__BORLANDC__)
52#  define	__LA_UID_T	uid_t
53#  define	__LA_GID_T	gid_t
54#  define	__LA_DEV_T	dev_t
55#  define	__LA_MODE_T	mode_t
56# else
57#  define	__LA_UID_T	short
58#  define	__LA_GID_T	short
59#  define	__LA_DEV_T	unsigned int
60#  define	__LA_MODE_T	unsigned short
61# endif
62#else
63#include <unistd.h>
64#define	__LA_INT64_T	int64_t
65#define	__LA_UID_T	uid_t
66#define	__LA_GID_T	gid_t
67#define	__LA_DEV_T	dev_t
68#define	__LA_MODE_T	mode_t
69#endif
70
71/*
72 * XXX Is this defined for all Windows compilers?  If so, in what
73 * header?  It would be nice to remove the __LA_INO_T indirection and
74 * just use plain ino_t everywhere.  Likewise for the other types just
75 * above.
76 */
77#define	__LA_INO_T	ino_t
78
79
80/*
81 * On Windows, define LIBARCHIVE_STATIC if you're building or using a
82 * .lib.  The default here assumes you're building a DLL.  Only
83 * libarchive source should ever define __LIBARCHIVE_BUILD.
84 */
85#if ((defined __WIN32__) || (defined _WIN32) || defined(__CYGWIN__)) && (!defined LIBARCHIVE_STATIC)
86# ifdef __LIBARCHIVE_BUILD
87#  ifdef __GNUC__
88#   define __LA_DECL	__attribute__((dllexport)) extern
89#  else
90#   define __LA_DECL	__declspec(dllexport)
91#  endif
92# else
93#  ifdef __GNUC__
94#   define __LA_DECL	__attribute__((dllimport)) extern
95#  else
96#   define __LA_DECL	__declspec(dllimport)
97#  endif
98# endif
99#else
100/* Static libraries on all platforms and shared libraries on non-Windows. */
101# define __LA_DECL
102#endif
103
104#ifdef __cplusplus
105extern "C" {
106#endif
107
108/*
109 * Description of an archive entry.
110 *
111 * You can think of this as "struct stat" with some text fields added in.
112 *
113 * TODO: Add "comment", "charset", and possibly other entries that are
114 * supported by "pax interchange" format.  However, GNU, ustar, cpio,
115 * and other variants don't support these features, so they're not an
116 * excruciatingly high priority right now.
117 *
118 * TODO: "pax interchange" format allows essentially arbitrary
119 * key/value attributes to be attached to any entry.  Supporting
120 * such extensions may make this library useful for special
121 * applications (e.g., a package manager could attach special
122 * package-management attributes to each entry).
123 */
124struct archive_entry;
125
126/*
127 * File-type constants.  These are returned from archive_entry_filetype()
128 * and passed to archive_entry_set_filetype().
129 *
130 * These values match S_XXX defines on every platform I've checked,
131 * including Windows, AIX, Linux, Solaris, and BSD.  They're
132 * (re)defined here because platforms generally don't define the ones
133 * they don't support.  For example, Windows doesn't define S_IFLNK or
134 * S_IFBLK.  Instead of having a mass of conditional logic and system
135 * checks to define any S_XXX values that aren't supported locally,
136 * I've just defined a new set of such constants so that
137 * libarchive-based applications can manipulate and identify archive
138 * entries properly even if the hosting platform can't store them on
139 * disk.
140 *
141 * These values are also used directly within some portable formats,
142 * such as cpio.  If you find a platform that varies from these, the
143 * correct solution is to leave these alone and translate from these
144 * portable values to platform-native values when entries are read from
145 * or written to disk.
146 */
147#define	AE_IFMT		0170000
148#define	AE_IFREG	0100000
149#define	AE_IFLNK	0120000
150#define	AE_IFSOCK	0140000
151#define	AE_IFCHR	0020000
152#define	AE_IFBLK	0060000
153#define	AE_IFDIR	0040000
154#define	AE_IFIFO	0010000
155
156/*
157 * Basic object manipulation
158 */
159
160__LA_DECL struct archive_entry	*archive_entry_clear(struct archive_entry *);
161/* The 'clone' function does a deep copy; all of the strings are copied too. */
162__LA_DECL struct archive_entry	*archive_entry_clone(struct archive_entry *);
163__LA_DECL void			 archive_entry_free(struct archive_entry *);
164__LA_DECL struct archive_entry	*archive_entry_new(void);
165
166/*
167 * Retrieve fields from an archive_entry.
168 *
169 * There are a number of implicit conversions among these fields.  For
170 * example, if a regular string field is set and you read the _w wide
171 * character field, the entry will implicitly convert narrow-to-wide
172 * using the current locale.  Similarly, dev values are automatically
173 * updated when you write devmajor or devminor and vice versa.
174 *
175 * In addition, fields can be "set" or "unset."  Unset string fields
176 * return NULL, non-string fields have _is_set() functions to test
177 * whether they've been set.  You can "unset" a string field by
178 * assigning NULL; non-string fields have _unset() functions to
179 * unset them.
180 *
181 * Note: There is one ambiguity in the above; string fields will
182 * also return NULL when implicit character set conversions fail.
183 * This is usually what you want.
184 */
185__LA_DECL time_t	 archive_entry_atime(struct archive_entry *);
186__LA_DECL long		 archive_entry_atime_nsec(struct archive_entry *);
187__LA_DECL int		 archive_entry_atime_is_set(struct archive_entry *);
188__LA_DECL time_t	 archive_entry_birthtime(struct archive_entry *);
189__LA_DECL long		 archive_entry_birthtime_nsec(struct archive_entry *);
190__LA_DECL int		 archive_entry_birthtime_is_set(struct archive_entry *);
191__LA_DECL time_t	 archive_entry_ctime(struct archive_entry *);
192__LA_DECL long		 archive_entry_ctime_nsec(struct archive_entry *);
193__LA_DECL int		 archive_entry_ctime_is_set(struct archive_entry *);
194__LA_DECL dev_t		 archive_entry_dev(struct archive_entry *);
195__LA_DECL dev_t		 archive_entry_devmajor(struct archive_entry *);
196__LA_DECL dev_t		 archive_entry_devminor(struct archive_entry *);
197__LA_DECL __LA_MODE_T	 archive_entry_filetype(struct archive_entry *);
198__LA_DECL void		 archive_entry_fflags(struct archive_entry *,
199			    unsigned long * /* set */,
200			    unsigned long * /* clear */);
201__LA_DECL const char	*archive_entry_fflags_text(struct archive_entry *);
202__LA_DECL __LA_GID_T	 archive_entry_gid(struct archive_entry *);
203__LA_DECL const char	*archive_entry_gname(struct archive_entry *);
204__LA_DECL const wchar_t	*archive_entry_gname_w(struct archive_entry *);
205__LA_DECL const char	*archive_entry_hardlink(struct archive_entry *);
206__LA_DECL const wchar_t	*archive_entry_hardlink_w(struct archive_entry *);
207__LA_DECL __LA_INO_T	 archive_entry_ino(struct archive_entry *);
208__LA_DECL __LA_INT64_T	 archive_entry_ino64(struct archive_entry *);
209__LA_DECL __LA_MODE_T	 archive_entry_mode(struct archive_entry *);
210__LA_DECL time_t	 archive_entry_mtime(struct archive_entry *);
211__LA_DECL long		 archive_entry_mtime_nsec(struct archive_entry *);
212__LA_DECL int		 archive_entry_mtime_is_set(struct archive_entry *);
213__LA_DECL unsigned int	 archive_entry_nlink(struct archive_entry *);
214__LA_DECL const char	*archive_entry_pathname(struct archive_entry *);
215__LA_DECL const wchar_t	*archive_entry_pathname_w(struct archive_entry *);
216__LA_DECL dev_t		 archive_entry_rdev(struct archive_entry *);
217__LA_DECL dev_t		 archive_entry_rdevmajor(struct archive_entry *);
218__LA_DECL dev_t		 archive_entry_rdevminor(struct archive_entry *);
219__LA_DECL const char	*archive_entry_sourcepath(struct archive_entry *);
220__LA_DECL __LA_INT64_T	 archive_entry_size(struct archive_entry *);
221__LA_DECL int		 archive_entry_size_is_set(struct archive_entry *);
222__LA_DECL const char	*archive_entry_strmode(struct archive_entry *);
223__LA_DECL const char	*archive_entry_symlink(struct archive_entry *);
224__LA_DECL const wchar_t	*archive_entry_symlink_w(struct archive_entry *);
225__LA_DECL __LA_UID_T	 archive_entry_uid(struct archive_entry *);
226__LA_DECL const char	*archive_entry_uname(struct archive_entry *);
227__LA_DECL const wchar_t	*archive_entry_uname_w(struct archive_entry *);
228
229/*
230 * Set fields in an archive_entry.
231 *
232 * Note that string 'set' functions do not copy the string, only the pointer.
233 * In contrast, 'copy' functions do copy the object pointed to.
234 *
235 * Note: As of libarchive 2.4, 'set' functions do copy the string and
236 * are therefore exact synonyms for the 'copy' versions.  The 'copy'
237 * names will be retired in libarchive 3.0.
238 */
239
240__LA_DECL void	archive_entry_set_atime(struct archive_entry *, time_t, long);
241__LA_DECL void  archive_entry_unset_atime(struct archive_entry *);
242#if defined(_WIN32) && !defined(__CYGWIN__)
243__LA_DECL void archive_entry_copy_bhfi(struct archive_entry *,
244									   BY_HANDLE_FILE_INFORMATION *);
245#endif
246__LA_DECL void	archive_entry_set_birthtime(struct archive_entry *, time_t, long);
247__LA_DECL void  archive_entry_unset_birthtime(struct archive_entry *);
248__LA_DECL void	archive_entry_set_ctime(struct archive_entry *, time_t, long);
249__LA_DECL void  archive_entry_unset_ctime(struct archive_entry *);
250__LA_DECL void	archive_entry_set_dev(struct archive_entry *, dev_t);
251__LA_DECL void	archive_entry_set_devmajor(struct archive_entry *, dev_t);
252__LA_DECL void	archive_entry_set_devminor(struct archive_entry *, dev_t);
253__LA_DECL void	archive_entry_set_filetype(struct archive_entry *, unsigned int);
254__LA_DECL void	archive_entry_set_fflags(struct archive_entry *,
255	    unsigned long /* set */, unsigned long /* clear */);
256/* Returns pointer to start of first invalid token, or NULL if none. */
257/* Note that all recognized tokens are processed, regardless. */
258__LA_DECL const char *archive_entry_copy_fflags_text(struct archive_entry *,
259	    const char *);
260__LA_DECL const wchar_t *archive_entry_copy_fflags_text_w(struct archive_entry *,
261	    const wchar_t *);
262__LA_DECL void	archive_entry_set_gid(struct archive_entry *, __LA_GID_T);
263__LA_DECL void	archive_entry_set_gname(struct archive_entry *, const char *);
264__LA_DECL void	archive_entry_copy_gname(struct archive_entry *, const char *);
265__LA_DECL void	archive_entry_copy_gname_w(struct archive_entry *, const wchar_t *);
266__LA_DECL int	archive_entry_update_gname_utf8(struct archive_entry *, const char *);
267__LA_DECL void	archive_entry_set_hardlink(struct archive_entry *, const char *);
268__LA_DECL void	archive_entry_copy_hardlink(struct archive_entry *, const char *);
269__LA_DECL void	archive_entry_copy_hardlink_w(struct archive_entry *, const wchar_t *);
270__LA_DECL int	archive_entry_update_hardlink_utf8(struct archive_entry *, const char *);
271#if ARCHIVE_VERSION_NUMBER >= 3000000
272/* Starting with libarchive 3.0, this will be synonym for ino64. */
273__LA_DECL void	archive_entry_set_ino(struct archive_entry *, __LA_INT64_T);
274#else
275__LA_DECL void	archive_entry_set_ino(struct archive_entry *, unsigned long);
276#endif
277__LA_DECL void	archive_entry_set_ino64(struct archive_entry *, __LA_INT64_T);
278__LA_DECL void	archive_entry_set_link(struct archive_entry *, const char *);
279__LA_DECL void	archive_entry_copy_link(struct archive_entry *, const char *);
280__LA_DECL void	archive_entry_copy_link_w(struct archive_entry *, const wchar_t *);
281__LA_DECL int	archive_entry_update_link_utf8(struct archive_entry *, const char *);
282__LA_DECL void	archive_entry_set_mode(struct archive_entry *, __LA_MODE_T);
283__LA_DECL void	archive_entry_set_mtime(struct archive_entry *, time_t, long);
284__LA_DECL void  archive_entry_unset_mtime(struct archive_entry *);
285__LA_DECL void	archive_entry_set_nlink(struct archive_entry *, unsigned int);
286__LA_DECL void	archive_entry_set_pathname(struct archive_entry *, const char *);
287__LA_DECL void	archive_entry_copy_pathname(struct archive_entry *, const char *);
288__LA_DECL void	archive_entry_copy_pathname_w(struct archive_entry *, const wchar_t *);
289__LA_DECL int	archive_entry_update_pathname_utf8(struct archive_entry *, const char *);
290__LA_DECL void	archive_entry_set_perm(struct archive_entry *, __LA_MODE_T);
291__LA_DECL void	archive_entry_set_rdev(struct archive_entry *, dev_t);
292__LA_DECL void	archive_entry_set_rdevmajor(struct archive_entry *, dev_t);
293__LA_DECL void	archive_entry_set_rdevminor(struct archive_entry *, dev_t);
294__LA_DECL void	archive_entry_set_size(struct archive_entry *, __LA_INT64_T);
295__LA_DECL void	archive_entry_unset_size(struct archive_entry *);
296__LA_DECL void	archive_entry_copy_sourcepath(struct archive_entry *, const char *);
297__LA_DECL void	archive_entry_set_symlink(struct archive_entry *, const char *);
298__LA_DECL void	archive_entry_copy_symlink(struct archive_entry *, const char *);
299__LA_DECL void	archive_entry_copy_symlink_w(struct archive_entry *, const wchar_t *);
300__LA_DECL int	archive_entry_update_symlink_utf8(struct archive_entry *, const char *);
301__LA_DECL void	archive_entry_set_uid(struct archive_entry *, __LA_UID_T);
302__LA_DECL void	archive_entry_set_uname(struct archive_entry *, const char *);
303__LA_DECL void	archive_entry_copy_uname(struct archive_entry *, const char *);
304__LA_DECL void	archive_entry_copy_uname_w(struct archive_entry *, const wchar_t *);
305__LA_DECL int	archive_entry_update_uname_utf8(struct archive_entry *, const char *);
306/*
307 * Routines to bulk copy fields to/from a platform-native "struct
308 * stat."  Libarchive used to just store a struct stat inside of each
309 * archive_entry object, but this created issues when trying to
310 * manipulate archives on systems different than the ones they were
311 * created on.
312 *
313 * TODO: On Linux, provide both stat32 and stat64 versions of these functions.
314 */
315__LA_DECL const struct stat	*archive_entry_stat(struct archive_entry *);
316__LA_DECL void	archive_entry_copy_stat(struct archive_entry *, const struct stat *);
317
318
319/*
320 * ACL routines.  This used to simply store and return text-format ACL
321 * strings, but that proved insufficient for a number of reasons:
322 *   = clients need control over uname/uid and gname/gid mappings
323 *   = there are many different ACL text formats
324 *   = would like to be able to read/convert archives containing ACLs
325 *     on platforms that lack ACL libraries
326 *
327 *  This last point, in particular, forces me to implement a reasonably
328 *  complete set of ACL support routines.
329 *
330 *  TODO: Extend this to support NFSv4/NTFS permissions.  That should
331 *  allow full ACL support on Mac OS, in particular, which uses
332 *  POSIX.1e-style interfaces to manipulate NFSv4/NTFS permissions.
333 */
334
335/*
336 * Permission bits mimic POSIX.1e.  Note that I've not followed POSIX.1e's
337 * "permset"/"perm" abstract type nonsense.  A permset is just a simple
338 * bitmap, following long-standing Unix tradition.
339 */
340#define	ARCHIVE_ENTRY_ACL_EXECUTE	1
341#define	ARCHIVE_ENTRY_ACL_WRITE		2
342#define	ARCHIVE_ENTRY_ACL_READ		4
343
344/* We need to be able to specify either or both of these. */
345#define	ARCHIVE_ENTRY_ACL_TYPE_ACCESS	256
346#define	ARCHIVE_ENTRY_ACL_TYPE_DEFAULT	512
347
348/* Tag values mimic POSIX.1e */
349#define	ARCHIVE_ENTRY_ACL_USER		10001	/* Specified user. */
350#define	ARCHIVE_ENTRY_ACL_USER_OBJ 	10002	/* User who owns the file. */
351#define	ARCHIVE_ENTRY_ACL_GROUP		10003	/* Specified group. */
352#define	ARCHIVE_ENTRY_ACL_GROUP_OBJ	10004	/* Group who owns the file. */
353#define	ARCHIVE_ENTRY_ACL_MASK		10005	/* Modify group access. */
354#define	ARCHIVE_ENTRY_ACL_OTHER		10006	/* Public. */
355
356/*
357 * Set the ACL by clearing it and adding entries one at a time.
358 * Unlike the POSIX.1e ACL routines, you must specify the type
359 * (access/default) for each entry.  Internally, the ACL data is just
360 * a soup of entries.  API calls here allow you to retrieve just the
361 * entries of interest.  This design (which goes against the spirit of
362 * POSIX.1e) is useful for handling archive formats that combine
363 * default and access information in a single ACL list.
364 */
365__LA_DECL void	 archive_entry_acl_clear(struct archive_entry *);
366__LA_DECL void	 archive_entry_acl_add_entry(struct archive_entry *,
367	    int /* type */, int /* permset */, int /* tag */,
368	    int /* qual */, const char * /* name */);
369__LA_DECL void	 archive_entry_acl_add_entry_w(struct archive_entry *,
370	    int /* type */, int /* permset */, int /* tag */,
371	    int /* qual */, const wchar_t * /* name */);
372
373/*
374 * To retrieve the ACL, first "reset", then repeatedly ask for the
375 * "next" entry.  The want_type parameter allows you to request only
376 * access entries or only default entries.
377 */
378__LA_DECL int	 archive_entry_acl_reset(struct archive_entry *, int /* want_type */);
379__LA_DECL int	 archive_entry_acl_next(struct archive_entry *, int /* want_type */,
380	    int * /* type */, int * /* permset */, int * /* tag */,
381	    int * /* qual */, const char ** /* name */);
382__LA_DECL int	 archive_entry_acl_next_w(struct archive_entry *, int /* want_type */,
383	    int * /* type */, int * /* permset */, int * /* tag */,
384	    int * /* qual */, const wchar_t ** /* name */);
385
386/*
387 * Construct a text-format ACL.  The flags argument is a bitmask that
388 * can include any of the following:
389 *
390 * ARCHIVE_ENTRY_ACL_TYPE_ACCESS - Include access entries.
391 * ARCHIVE_ENTRY_ACL_TYPE_DEFAULT - Include default entries.
392 * ARCHIVE_ENTRY_ACL_STYLE_EXTRA_ID - Include extra numeric ID field in
393 *    each ACL entry.  (As used by 'star'.)
394 * ARCHIVE_ENTRY_ACL_STYLE_MARK_DEFAULT - Include "default:" before each
395 *    default ACL entry.
396 */
397#define	ARCHIVE_ENTRY_ACL_STYLE_EXTRA_ID	1024
398#define	ARCHIVE_ENTRY_ACL_STYLE_MARK_DEFAULT	2048
399__LA_DECL const wchar_t	*archive_entry_acl_text_w(struct archive_entry *,
400		    int /* flags */);
401
402/* Return a count of entries matching 'want_type' */
403__LA_DECL int	 archive_entry_acl_count(struct archive_entry *, int /* want_type */);
404
405/*
406 * Private ACL parser.  This is private because it handles some
407 * very weird formats that clients should not be messing with.
408 * Clients should only deal with their platform-native formats.
409 * Because of the need to support many formats cleanly, new arguments
410 * are likely to get added on a regular basis.  Clients who try to use
411 * this interface are likely to be surprised when it changes.
412 *
413 * You were warned!
414 *
415 * TODO: Move this declaration out of the public header and into
416 * a private header.  Warnings above are silly.
417 */
418__LA_DECL int		 __archive_entry_acl_parse_w(struct archive_entry *,
419		    const wchar_t *, int /* type */);
420
421/*
422 * extended attributes
423 */
424
425__LA_DECL void	 archive_entry_xattr_clear(struct archive_entry *);
426__LA_DECL void	 archive_entry_xattr_add_entry(struct archive_entry *,
427	    const char * /* name */, const void * /* value */,
428	    size_t /* size */);
429
430/*
431 * To retrieve the xattr list, first "reset", then repeatedly ask for the
432 * "next" entry.
433 */
434
435__LA_DECL int	archive_entry_xattr_count(struct archive_entry *);
436__LA_DECL int	archive_entry_xattr_reset(struct archive_entry *);
437__LA_DECL int	archive_entry_xattr_next(struct archive_entry *,
438	    const char ** /* name */, const void ** /* value */, size_t *);
439
440/*
441 * Utility to match up hardlinks.
442 *
443 * The 'struct archive_entry_linkresolver' is a cache of archive entries
444 * for files with multiple links.  Here's how to use it:
445 *   1. Create a lookup object with archive_entry_linkresolver_new()
446 *   2. Tell it the archive format you're using.
447 *   3. Hand each archive_entry to archive_entry_linkify().
448 *      That function will return 0, 1, or 2 entries that should
449 *      be written.
450 *   4. Call archive_entry_linkify(resolver, NULL) until
451 *      no more entries are returned.
452 *   5. Call archive_entry_link_resolver_free(resolver) to free resources.
453 *
454 * The entries returned have their hardlink and size fields updated
455 * appropriately.  If an entry is passed in that does not refer to
456 * a file with multiple links, it is returned unchanged.  The intention
457 * is that you should be able to simply filter all entries through
458 * this machine.
459 *
460 * To make things more efficient, be sure that each entry has a valid
461 * nlinks value.  The hardlink cache uses this to track when all links
462 * have been found.  If the nlinks value is zero, it will keep every
463 * name in the cache indefinitely, which can use a lot of memory.
464 *
465 * Note that archive_entry_size() is reset to zero if the file
466 * body should not be written to the archive.  Pay attention!
467 */
468struct archive_entry_linkresolver;
469
470/*
471 * There are three different strategies for marking hardlinks.
472 * The descriptions below name them after the best-known
473 * formats that rely on each strategy:
474 *
475 * "Old cpio" is the simplest, it always returns any entry unmodified.
476 *    As far as I know, only cpio formats use this.  Old cpio archives
477 *    store every link with the full body; the onus is on the dearchiver
478 *    to detect and properly link the files as they are restored.
479 * "tar" is also pretty simple; it caches a copy the first time it sees
480 *    any link.  Subsequent appearances are modified to be hardlink
481 *    references to the first one without any body.  Used by all tar
482 *    formats, although the newest tar formats permit the "old cpio" strategy
483 *    as well.  This strategy is very simple for the dearchiver,
484 *    and reasonably straightforward for the archiver.
485 * "new cpio" is trickier.  It stores the body only with the last
486 *    occurrence.  The complication is that we might not
487 *    see every link to a particular file in a single session, so
488 *    there's no easy way to know when we've seen the last occurrence.
489 *    The solution here is to queue one link until we see the next.
490 *    At the end of the session, you can enumerate any remaining
491 *    entries by calling archive_entry_linkify(NULL) and store those
492 *    bodies.  If you have a file with three links l1, l2, and l3,
493 *    you'll get the following behavior if you see all three links:
494 *           linkify(l1) => NULL   (the resolver stores l1 internally)
495 *           linkify(l2) => l1     (resolver stores l2, you write l1)
496 *           linkify(l3) => l2, l3 (all links seen, you can write both).
497 *    If you only see l1 and l2, you'll get this behavior:
498 *           linkify(l1) => NULL
499 *           linkify(l2) => l1
500 *           linkify(NULL) => l2   (at end, you retrieve remaining links)
501 *    As the name suggests, this strategy is used by newer cpio variants.
502 *    It's noticably more complex for the archiver, slightly more complex
503 *    for the dearchiver than the tar strategy, but makes it straightforward
504 *    to restore a file using any link by simply continuing to scan until
505 *    you see a link that is stored with a body.  In contrast, the tar
506 *    strategy requires you to rescan the archive from the beginning to
507 *    correctly extract an arbitrary link.
508 */
509
510__LA_DECL struct archive_entry_linkresolver *archive_entry_linkresolver_new(void);
511__LA_DECL void archive_entry_linkresolver_set_strategy(
512	struct archive_entry_linkresolver *, int /* format_code */);
513__LA_DECL void archive_entry_linkresolver_free(struct archive_entry_linkresolver *);
514__LA_DECL void archive_entry_linkify(struct archive_entry_linkresolver *,
515    struct archive_entry **, struct archive_entry **);
516
517#ifdef __cplusplus
518}
519#endif
520
521/* This is meaningless outside of this header. */
522#undef __LA_DECL
523
524#endif /* !ARCHIVE_ENTRY_H_INCLUDED */
525