1/*-
2 * Copyright (c) 2003-2007 Tim Kientzle
3 * All rights reserved.
4 *
5 * Redistribution and use in source and binary forms, with or without
6 * modification, are permitted provided that the following conditions
7 * are met:
8 * 1. Redistributions of source code must retain the above copyright
9 *    notice, this list of conditions and the following disclaimer.
10 * 2. Redistributions in binary form must reproduce the above copyright
11 *    notice, this list of conditions and the following disclaimer in the
12 *    documentation and/or other materials provided with the distribution.
13 *
14 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR(S) ``AS IS'' AND ANY EXPRESS OR
15 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
16 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
17 * IN NO EVENT SHALL THE AUTHOR(S) BE LIABLE FOR ANY DIRECT, INDIRECT,
18 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
19 * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
20 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
21 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
22 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
23 * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
24 */
25
26#include "bsdtar_platform.h"
27__FBSDID("$FreeBSD$");
28
29#ifdef HAVE_SYS_TYPES_H
30#include <sys/types.h>
31#endif
32#ifdef HAVE_SYS_IOCTL_H
33#include <sys/ioctl.h>
34#endif
35#ifdef HAVE_SYS_STAT_H
36#include <sys/stat.h>
37#endif
38#ifdef HAVE_ATTR_XATTR_H
39#include <attr/xattr.h>
40#endif
41#ifdef HAVE_ERRNO_H
42#include <errno.h>
43#endif
44#ifdef HAVE_FCNTL_H
45#include <fcntl.h>
46#endif
47#ifdef HAVE_GRP_H
48#include <grp.h>
49#endif
50#ifdef HAVE_IO_H
51#include <io.h>
52#endif
53#ifdef HAVE_LIMITS_H
54#include <limits.h>
55#endif
56#ifdef HAVE_LINUX_FS_H
57#include <linux/fs.h>	/* for Linux file flags */
58#endif
59/*
60 * Some Linux distributions have both linux/ext2_fs.h and ext2fs/ext2_fs.h.
61 * As the include guards don't agree, the order of include is important.
62 */
63#ifdef HAVE_LINUX_EXT2_FS_H
64#include <linux/ext2_fs.h>	/* for Linux file flags */
65#endif
66#if defined(HAVE_EXT2FS_EXT2_FS_H) && !defined(__CYGWIN__)
67/* This header exists but is broken on Cygwin. */
68#include <ext2fs/ext2_fs.h>
69#endif
70#ifdef HAVE_PWD_H
71#include <pwd.h>
72#endif
73#ifdef HAVE_STDINT_H
74#include <stdint.h>
75#endif
76#include <stdio.h>
77#ifdef HAVE_STDLIB_H
78#include <stdlib.h>
79#endif
80#ifdef HAVE_STRING_H
81#include <string.h>
82#endif
83#ifdef HAVE_UNISTD_H
84#include <unistd.h>
85#endif
86
87#include "bsdtar.h"
88#include "err.h"
89#include "line_reader.h"
90#include "tree.h"
91
/* Size, in bytes, of the staging buffer file data is read into before writing. */
#define	FILEDATABUFLEN	(64 * 1024)

/* Number of slots in each fixed-size uname/gname cache. */
#define	name_cache_size	101

/*
 * Fall back to 0 when the platform headers do not provide O_BINARY, so
 * the flag can be OR'ed into open() calls unconditionally.
 */
#ifndef O_BINARY
#define	O_BINARY	0
#endif

/* Placeholder string for a missing name. */
static const char * const NO_NAME = "(noname)";
103
/*
 * One node of the singly linked list built in 'u' mode: the pathname and
 * modification time of an entry already present in the archive.
 */
struct archive_dir_entry {
	/* Following node in the list, or NULL at the end. */
	struct archive_dir_entry	*next;
	/* Recorded modification time, whole seconds. */
	time_t				 mtime_sec;
	/* Recorded modification time, nanosecond part. */
	int				 mtime_nsec;
	/* Entry pathname; released with free() when the list is torn down. */
	char				*name;
};
110
/* List of archive_dir_entry nodes, tracked by its first and last node. */
struct archive_dir {
	struct archive_dir_entry *head;	/* first node, NULL when empty */
	struct archive_dir_entry *tail;	/* last node, NULL when empty */
};
114
115struct name_cache {
116	int	probes;
117	int	hits;
118	size_t	size;
119	struct {
120		id_t id;
121		const char *name;
122	} cache[name_cache_size];
123};
124
/* Forward declarations for the file-local helpers of this file. */
static void	 add_dir_list(struct bsdtar *bsdtar, const char *path,
		     time_t mtime_sec, int mtime_nsec);
static int	 append_archive(struct bsdtar *bsdtar, struct archive *a,
		     struct archive *ina);
static int	 append_archive_filename(struct bsdtar *bsdtar,
		     struct archive *a, const char *fname);
static void	 archive_names_from_file(struct bsdtar *bsdtar,
		     struct archive *a);
static int	 copy_file_data(struct bsdtar *bsdtar, struct archive *a,
		     struct archive *ina, struct archive_entry *entry);
static int	 new_enough(struct bsdtar *bsdtar, const char *path,
		     const struct stat *st);
static void	 report_write(struct bsdtar *bsdtar, struct archive *a,
		     struct archive_entry *entry, int64_t progress);
static void	 test_for_append(struct bsdtar *bsdtar);
static void	 write_archive(struct archive *a, struct bsdtar *bsdtar);
static void	 write_entry_backend(struct bsdtar *bsdtar,
		     struct archive *a, struct archive_entry *entry);
static int	 write_file_data(struct bsdtar *bsdtar, struct archive *a,
		     struct archive_entry *entry, int fd);
static void	 write_hierarchy(struct bsdtar *bsdtar, struct archive *a,
		     const char *path);
147
#if defined(_WIN32) && !defined(__CYGWIN__)
/*
 * Minimal stand-in for lseek() on native Windows.
 *
 * Always positions relative to the start of the file; 'whence' is
 * accepted only for signature compatibility and is ignored.  Returns 1
 * on success and -1 on failure (not the resulting offset), which is
 * sufficient for callers that only test for a negative result.
 */
static int
seek_file(int fd, int64_t offset, int whence)
{
	LARGE_INTEGER target;
	HANDLE handle;

	(void)whence; /* UNUSED */
	handle = (HANDLE)_get_osfhandle(fd);
	target.QuadPart = offset;
	if (!SetFilePointerEx(handle, target, NULL, FILE_BEGIN))
		return (-1);
	return (1);
}
/* Route the POSIX names used below to their Windows counterparts. */
#define open _open
#define close _close
#define read _read
#define lseek seek_file
#endif
164
165void
166tar_mode_c(struct bsdtar *bsdtar)
167{
168	struct archive *a;
169	int r;
170
171	if (*bsdtar->argv == NULL && bsdtar->names_from_file == NULL)
172		lafe_errc(1, 0, "no files or directories specified");
173
174	a = archive_write_new();
175
176	/* Support any format that the library supports. */
177	if (bsdtar->create_format == NULL) {
178		r = archive_write_set_format_pax_restricted(a);
179		bsdtar->create_format = "pax restricted";
180	} else {
181		r = archive_write_set_format_by_name(a, bsdtar->create_format);
182	}
183	if (r != ARCHIVE_OK) {
184		fprintf(stderr, "Can't use format %s: %s\n",
185		    bsdtar->create_format,
186		    archive_error_string(a));
187		usage();
188	}
189
190	/*
191	 * If user explicitly set the block size, then assume they
192	 * want the last block padded as well.  Otherwise, use the
193	 * default block size and accept archive_write_open_file()'s
194	 * default padding decisions.
195	 */
196	if (bsdtar->bytes_per_block != 0) {
197		archive_write_set_bytes_per_block(a, bsdtar->bytes_per_block);
198		archive_write_set_bytes_in_last_block(a,
199		    bsdtar->bytes_per_block);
200	} else
201		archive_write_set_bytes_per_block(a, DEFAULT_BYTES_PER_BLOCK);
202
203	if (bsdtar->compress_program) {
204		archive_write_set_compression_program(a, bsdtar->compress_program);
205	} else {
206		switch (bsdtar->create_compression) {
207		case 0:
208			r = archive_write_set_compression_none(a);
209			break;
210		case 'j': case 'y':
211			r = archive_write_set_compression_bzip2(a);
212			break;
213		case 'J':
214			r = archive_write_set_compression_xz(a);
215			break;
216		case OPTION_LZMA:
217			r = archive_write_set_compression_lzma(a);
218			break;
219		case 'z':
220			r = archive_write_set_compression_gzip(a);
221			break;
222		case 'Z':
223			r = archive_write_set_compression_compress(a);
224			break;
225		default:
226			lafe_errc(1, 0,
227			    "Unrecognized compression option -%c",
228			    bsdtar->create_compression);
229		}
230		if (r != ARCHIVE_OK) {
231			lafe_errc(1, 0,
232			    "Unsupported compression option -%c",
233			    bsdtar->create_compression);
234		}
235	}
236
237	if (ARCHIVE_OK != archive_write_set_options(a, bsdtar->option_options))
238		lafe_errc(1, 0, "%s", archive_error_string(a));
239	if (ARCHIVE_OK != archive_write_open_file(a, bsdtar->filename))
240		lafe_errc(1, 0, "%s", archive_error_string(a));
241	write_archive(a, bsdtar);
242}
243
244/*
245 * Same as 'c', except we only support tar or empty formats in
246 * uncompressed files on disk.
247 */
248void
249tar_mode_r(struct bsdtar *bsdtar)
250{
251	int64_t	end_offset;
252	int	format;
253	struct archive *a;
254	struct archive_entry *entry;
255	int	r;
256
257	/* Sanity-test some arguments and the file. */
258	test_for_append(bsdtar);
259
260	format = ARCHIVE_FORMAT_TAR_PAX_RESTRICTED;
261
262#if defined(__BORLANDC__)
263	bsdtar->fd = open(bsdtar->filename, O_RDWR | O_CREAT | O_BINARY);
264#else
265	bsdtar->fd = open(bsdtar->filename, O_RDWR | O_CREAT | O_BINARY, 0666);
266#endif
267	if (bsdtar->fd < 0)
268		lafe_errc(1, errno,
269		    "Cannot open %s", bsdtar->filename);
270
271	a = archive_read_new();
272	archive_read_support_compression_all(a);
273	archive_read_support_format_tar(a);
274	archive_read_support_format_gnutar(a);
275	r = archive_read_open_fd(a, bsdtar->fd, 10240);
276	if (r != ARCHIVE_OK)
277		lafe_errc(1, archive_errno(a),
278		    "Can't read archive %s: %s", bsdtar->filename,
279		    archive_error_string(a));
280	while (0 == archive_read_next_header(a, &entry)) {
281		if (archive_compression(a) != ARCHIVE_COMPRESSION_NONE) {
282			archive_read_finish(a);
283			close(bsdtar->fd);
284			lafe_errc(1, 0,
285			    "Cannot append to compressed archive.");
286		}
287		/* Keep going until we hit end-of-archive */
288		format = archive_format(a);
289	}
290
291	end_offset = archive_read_header_position(a);
292	archive_read_finish(a);
293
294	/* Re-open archive for writing */
295	a = archive_write_new();
296	archive_write_set_compression_none(a);
297	/*
298	 * Set the format to be used for writing.  To allow people to
299	 * extend empty files, we need to allow them to specify the format,
300	 * which opens the possibility that they will specify a format that
301	 * doesn't match the existing format.  Hence, the following bit
302	 * of arcane ugliness.
303	 */
304
305	if (bsdtar->create_format != NULL) {
306		/* If the user requested a format, use that, but ... */
307		archive_write_set_format_by_name(a,
308		    bsdtar->create_format);
309		/* ... complain if it's not compatible. */
310		format &= ARCHIVE_FORMAT_BASE_MASK;
311		if (format != (int)(archive_format(a) & ARCHIVE_FORMAT_BASE_MASK)
312		    && format != ARCHIVE_FORMAT_EMPTY) {
313			lafe_errc(1, 0,
314			    "Format %s is incompatible with the archive %s.",
315			    bsdtar->create_format, bsdtar->filename);
316		}
317	} else {
318		/*
319		 * Just preserve the current format, with a little care
320		 * for formats that libarchive can't write.
321		 */
322		if (format == ARCHIVE_FORMAT_TAR_GNUTAR)
323			/* TODO: When gtar supports pax, use pax restricted. */
324			format = ARCHIVE_FORMAT_TAR_USTAR;
325		if (format == ARCHIVE_FORMAT_EMPTY)
326			format = ARCHIVE_FORMAT_TAR_PAX_RESTRICTED;
327		archive_write_set_format(a, format);
328	}
329	if (lseek(bsdtar->fd, end_offset, SEEK_SET) < 0)
330		lafe_errc(1, errno, "Could not seek to archive end");
331	if (ARCHIVE_OK != archive_write_set_options(a, bsdtar->option_options))
332		lafe_errc(1, 0, "%s", archive_error_string(a));
333	if (ARCHIVE_OK != archive_write_open_fd(a, bsdtar->fd))
334		lafe_errc(1, 0, "%s", archive_error_string(a));
335
336	write_archive(a, bsdtar); /* XXX check return val XXX */
337
338	close(bsdtar->fd);
339	bsdtar->fd = -1;
340}
341
342void
343tar_mode_u(struct bsdtar *bsdtar)
344{
345	int64_t			 end_offset;
346	struct archive		*a;
347	struct archive_entry	*entry;
348	int			 format;
349	struct archive_dir_entry	*p;
350	struct archive_dir	 archive_dir;
351
352	bsdtar->archive_dir = &archive_dir;
353	memset(&archive_dir, 0, sizeof(archive_dir));
354
355	format = ARCHIVE_FORMAT_TAR_PAX_RESTRICTED;
356
357	/* Sanity-test some arguments and the file. */
358	test_for_append(bsdtar);
359
360	bsdtar->fd = open(bsdtar->filename, O_RDWR | O_BINARY);
361	if (bsdtar->fd < 0)
362		lafe_errc(1, errno,
363		    "Cannot open %s", bsdtar->filename);
364
365	a = archive_read_new();
366	archive_read_support_compression_all(a);
367	archive_read_support_format_tar(a);
368	archive_read_support_format_gnutar(a);
369	if (archive_read_open_fd(a, bsdtar->fd,
370	    bsdtar->bytes_per_block != 0 ? bsdtar->bytes_per_block :
371		DEFAULT_BYTES_PER_BLOCK) != ARCHIVE_OK) {
372		lafe_errc(1, 0,
373		    "Can't open %s: %s", bsdtar->filename,
374		    archive_error_string(a));
375	}
376
377	/* Build a list of all entries and their recorded mod times. */
378	while (0 == archive_read_next_header(a, &entry)) {
379		if (archive_compression(a) != ARCHIVE_COMPRESSION_NONE) {
380			archive_read_finish(a);
381			close(bsdtar->fd);
382			lafe_errc(1, 0,
383			    "Cannot append to compressed archive.");
384		}
385		add_dir_list(bsdtar, archive_entry_pathname(entry),
386		    archive_entry_mtime(entry),
387		    archive_entry_mtime_nsec(entry));
388		/* Record the last format determination we see */
389		format = archive_format(a);
390		/* Keep going until we hit end-of-archive */
391	}
392
393	end_offset = archive_read_header_position(a);
394	archive_read_finish(a);
395
396	/* Re-open archive for writing. */
397	a = archive_write_new();
398	archive_write_set_compression_none(a);
399	/*
400	 * Set format to same one auto-detected above, except that
401	 * we don't write GNU tar format, so use ustar instead.
402	 */
403	if (format == ARCHIVE_FORMAT_TAR_GNUTAR)
404		format = ARCHIVE_FORMAT_TAR_USTAR;
405	archive_write_set_format(a, format);
406	if (bsdtar->bytes_per_block != 0) {
407		archive_write_set_bytes_per_block(a, bsdtar->bytes_per_block);
408		archive_write_set_bytes_in_last_block(a,
409		    bsdtar->bytes_per_block);
410	} else
411		archive_write_set_bytes_per_block(a, DEFAULT_BYTES_PER_BLOCK);
412	if (lseek(bsdtar->fd, end_offset, SEEK_SET) < 0)
413		lafe_errc(1, errno, "Could not seek to archive end");
414	if (ARCHIVE_OK != archive_write_set_options(a, bsdtar->option_options))
415		lafe_errc(1, 0, "%s", archive_error_string(a));
416	if (ARCHIVE_OK != archive_write_open_fd(a, bsdtar->fd))
417		lafe_errc(1, 0, "%s", archive_error_string(a));
418
419	write_archive(a, bsdtar);
420
421	close(bsdtar->fd);
422	bsdtar->fd = -1;
423
424	while (bsdtar->archive_dir->head != NULL) {
425		p = bsdtar->archive_dir->head->next;
426		free(bsdtar->archive_dir->head->name);
427		free(bsdtar->archive_dir->head);
428		bsdtar->archive_dir->head = p;
429	}
430	bsdtar->archive_dir->tail = NULL;
431}
432
433
434/*
435 * Write user-specified files/dirs to opened archive.
436 */
437static void
438write_archive(struct archive *a, struct bsdtar *bsdtar)
439{
440	const char *arg;
441	struct archive_entry *entry, *sparse_entry;
442
443	/* Allocate a buffer for file data. */
444	if ((bsdtar->buff = malloc(FILEDATABUFLEN)) == NULL)
445		lafe_errc(1, 0, "cannot allocate memory");
446
447	if ((bsdtar->resolver = archive_entry_linkresolver_new()) == NULL)
448		lafe_errc(1, 0, "cannot create link resolver");
449	archive_entry_linkresolver_set_strategy(bsdtar->resolver,
450	    archive_format(a));
451	if ((bsdtar->diskreader = archive_read_disk_new()) == NULL)
452		lafe_errc(1, 0, "Cannot create read_disk object");
453	archive_read_disk_set_standard_lookup(bsdtar->diskreader);
454
455	if (bsdtar->names_from_file != NULL)
456		archive_names_from_file(bsdtar, a);
457
458	while (*bsdtar->argv) {
459		arg = *bsdtar->argv;
460		if (arg[0] == '-' && arg[1] == 'C') {
461			arg += 2;
462			if (*arg == '\0') {
463				bsdtar->argv++;
464				arg = *bsdtar->argv;
465				if (arg == NULL) {
466					lafe_warnc(0, "%s",
467					    "Missing argument for -C");
468					bsdtar->return_value = 1;
469					goto cleanup;
470				}
471			}
472			set_chdir(bsdtar, arg);
473		} else {
474			if (*arg != '/' && (arg[0] != '@' || arg[1] != '/'))
475				do_chdir(bsdtar); /* Handle a deferred -C */
476			if (*arg == '@') {
477				if (append_archive_filename(bsdtar, a,
478				    arg + 1) != 0)
479					break;
480			} else
481				write_hierarchy(bsdtar, a, arg);
482		}
483		bsdtar->argv++;
484	}
485
486	entry = NULL;
487	archive_entry_linkify(bsdtar->resolver, &entry, &sparse_entry);
488	while (entry != NULL) {
489		write_entry_backend(bsdtar, a, entry);
490		archive_entry_free(entry);
491		entry = NULL;
492		archive_entry_linkify(bsdtar->resolver, &entry, &sparse_entry);
493	}
494
495	if (archive_write_close(a)) {
496		lafe_warnc(0, "%s", archive_error_string(a));
497		bsdtar->return_value = 1;
498	}
499
500cleanup:
501	/* Free file data buffer. */
502	free(bsdtar->buff);
503	archive_entry_linkresolver_free(bsdtar->resolver);
504	bsdtar->resolver = NULL;
505	archive_read_finish(bsdtar->diskreader);
506	bsdtar->diskreader = NULL;
507
508	if (bsdtar->option_totals) {
509		fprintf(stderr, "Total bytes written: %s\n",
510		    tar_i64toa(archive_position_compressed(a)));
511	}
512
513	archive_write_finish(a);
514}
515
516/*
517 * Archive names specified in file.
518 *
519 * Unless --null was specified, a line containing exactly "-C" will
520 * cause the next line to be a directory to pass to chdir().  If
521 * --null is specified, then a line "-C" is just another filename.
522 */
523static void
524archive_names_from_file(struct bsdtar *bsdtar, struct archive *a)
525{
526	struct lafe_line_reader *lr;
527	const char *line;
528
529	bsdtar->next_line_is_dir = 0;
530
531	lr = lafe_line_reader(bsdtar->names_from_file, bsdtar->option_null);
532	while ((line = lafe_line_reader_next(lr)) != NULL) {
533		if (bsdtar->next_line_is_dir) {
534			set_chdir(bsdtar, line);
535			bsdtar->next_line_is_dir = 0;
536		} else if (!bsdtar->option_null && strcmp(line, "-C") == 0)
537			bsdtar->next_line_is_dir = 1;
538		else {
539			if (*line != '/')
540				do_chdir(bsdtar); /* Handle a deferred -C */
541			write_hierarchy(bsdtar, a, line);
542		}
543	}
544	lafe_line_reader_free(lr);
545	if (bsdtar->next_line_is_dir)
546		lafe_errc(1, errno,
547		    "Unexpected end of filename list; "
548		    "directory expected after -C");
549}
550
551/*
552 * Copy from specified archive to current archive.  Returns non-zero
553 * for write errors (which force us to terminate the entire archiving
554 * operation).  If there are errors reading the input archive, we set
555 * bsdtar->return_value but return zero, so the overall archiving
556 * operation will complete and return non-zero.
557 */
558static int
559append_archive_filename(struct bsdtar *bsdtar, struct archive *a,
560    const char *filename)
561{
562	struct archive *ina;
563	int rc;
564
565	if (strcmp(filename, "-") == 0)
566		filename = NULL; /* Library uses NULL for stdio. */
567
568	ina = archive_read_new();
569	archive_read_support_format_all(ina);
570	archive_read_support_compression_all(ina);
571	if (archive_read_open_file(ina, filename, 10240)) {
572		lafe_warnc(0, "%s", archive_error_string(ina));
573		bsdtar->return_value = 1;
574		return (0);
575	}
576
577	rc = append_archive(bsdtar, a, ina);
578
579	if (rc != ARCHIVE_OK) {
580		lafe_warnc(0, "Error reading archive %s: %s",
581		    filename, archive_error_string(ina));
582		bsdtar->return_value = 1;
583	}
584	archive_read_finish(ina);
585
586	return (rc);
587}
588
589static int
590append_archive(struct bsdtar *bsdtar, struct archive *a, struct archive *ina)
591{
592	struct archive_entry *in_entry;
593	int e;
594
595	while (ARCHIVE_OK == (e = archive_read_next_header(ina, &in_entry))) {
596		if (!new_enough(bsdtar, archive_entry_pathname(in_entry),
597			archive_entry_stat(in_entry)))
598			continue;
599		if (lafe_excluded(bsdtar->matching, archive_entry_pathname(in_entry)))
600			continue;
601		if (bsdtar->option_interactive &&
602		    !yes("copy '%s'", archive_entry_pathname(in_entry)))
603			continue;
604		if (bsdtar->verbose)
605			safe_fprintf(stderr, "a %s",
606			    archive_entry_pathname(in_entry));
607		if (need_report())
608			report_write(bsdtar, a, in_entry, 0);
609
610		e = archive_write_header(a, in_entry);
611		if (e != ARCHIVE_OK) {
612			if (!bsdtar->verbose)
613				lafe_warnc(0, "%s: %s",
614				    archive_entry_pathname(in_entry),
615				    archive_error_string(a));
616			else
617				fprintf(stderr, ": %s", archive_error_string(a));
618		}
619		if (e == ARCHIVE_FATAL)
620			exit(1);
621
622		if (e >= ARCHIVE_WARN) {
623			if (archive_entry_size(in_entry) == 0)
624				archive_read_data_skip(ina);
625			else if (copy_file_data(bsdtar, a, ina, in_entry))
626				exit(1);
627		}
628
629		if (bsdtar->verbose)
630			fprintf(stderr, "\n");
631	}
632
633	return (e == ARCHIVE_EOF ? ARCHIVE_OK : e);
634}
635
636/* Helper function to copy data between archives. */
637static int
638copy_file_data(struct bsdtar *bsdtar, struct archive *a,
639    struct archive *ina, struct archive_entry *entry)
640{
641	ssize_t	bytes_read;
642	ssize_t	bytes_written;
643	int64_t	progress = 0;
644
645	bytes_read = archive_read_data(ina, bsdtar->buff, FILEDATABUFLEN);
646	while (bytes_read > 0) {
647		if (need_report())
648			report_write(bsdtar, a, entry, progress);
649
650		bytes_written = archive_write_data(a, bsdtar->buff,
651		    bytes_read);
652		if (bytes_written < bytes_read) {
653			lafe_warnc(0, "%s", archive_error_string(a));
654			return (-1);
655		}
656		progress += bytes_written;
657		bytes_read = archive_read_data(ina, bsdtar->buff,
658		    FILEDATABUFLEN);
659	}
660
661	return (0);
662}
663
664/*
665 * Add the file or dir hierarchy named by 'path' to the archive
666 */
667static void
668write_hierarchy(struct bsdtar *bsdtar, struct archive *a, const char *path)
669{
670	struct archive_entry *entry = NULL, *spare_entry = NULL;
671	struct tree *tree;
672	char symlink_mode = bsdtar->symlink_mode;
673	dev_t first_dev = 0;
674	int dev_recorded = 0;
675	int tree_ret;
676
677	tree = tree_open(path);
678
679	if (!tree) {
680		lafe_warnc(errno, "%s: Cannot open", path);
681		bsdtar->return_value = 1;
682		return;
683	}
684
685	while ((tree_ret = tree_next(tree)) != 0) {
686		int r;
687		const char *name = tree_current_path(tree);
688		const struct stat *st = NULL; /* info to use for this entry */
689		const struct stat *lst = NULL; /* lstat() information */
690		int descend;
691
692		if (tree_ret == TREE_ERROR_FATAL)
693			lafe_errc(1, tree_errno(tree),
694			    "%s: Unable to continue traversing directory tree",
695			    name);
696		if (tree_ret == TREE_ERROR_DIR) {
697			lafe_warnc(errno,
698			    "%s: Couldn't visit directory", name);
699			bsdtar->return_value = 1;
700		}
701		if (tree_ret != TREE_REGULAR)
702			continue;
703
704		/*
705		 * If this file/dir is excluded by a filename
706		 * pattern, skip it.
707		 */
708		if (lafe_excluded(bsdtar->matching, name))
709			continue;
710
711		/*
712		 * Get lstat() info from the tree library.
713		 */
714		lst = tree_current_lstat(tree);
715		if (lst == NULL) {
716			/* Couldn't lstat(); must not exist. */
717			lafe_warnc(errno, "%s: Cannot stat", name);
718			/* Return error if files disappear during traverse. */
719			bsdtar->return_value = 1;
720			continue;
721		}
722
723		/*
724		 * Distinguish 'L'/'P'/'H' symlink following.
725		 */
726		switch(symlink_mode) {
727		case 'H':
728			/* 'H': After the first item, rest like 'P'. */
729			symlink_mode = 'P';
730			/* 'H': First item (from command line) like 'L'. */
731			/* FALLTHROUGH */
732		case 'L':
733			/* 'L': Do descend through a symlink to dir. */
734			descend = tree_current_is_dir(tree);
735			/* 'L': Follow symlinks to files. */
736			archive_read_disk_set_symlink_logical(bsdtar->diskreader);
737			/* 'L': Archive symlinks as targets, if we can. */
738			st = tree_current_stat(tree);
739			if (st != NULL)
740				break;
741			/* If stat fails, we have a broken symlink;
742			 * in that case, don't follow the link. */
743			/* FALLTHROUGH */
744		default:
745			/* 'P': Don't descend through a symlink to dir. */
746			descend = tree_current_is_physical_dir(tree);
747			/* 'P': Don't follow symlinks to files. */
748			archive_read_disk_set_symlink_physical(bsdtar->diskreader);
749			/* 'P': Archive symlinks as symlinks. */
750			st = lst;
751			break;
752		}
753
754		if (bsdtar->option_no_subdirs)
755			descend = 0;
756
757		/*
758		 * Are we about to cross to a new filesystem?
759		 */
760		if (!dev_recorded) {
761			/* This is the initial file system. */
762			first_dev = lst->st_dev;
763			dev_recorded = 1;
764		} else if (lst->st_dev == first_dev) {
765			/* The starting file system is always acceptable. */
766		} else if (descend == 0) {
767			/* We're not descending, so no need to check. */
768		} else if (bsdtar->option_dont_traverse_mounts) {
769			descend = 0;
770		} else {
771			/* We're prepared to cross a mount point. */
772
773			/* XXX TODO: check whether this filesystem is
774			 * synthetic and/or local.  Add a new
775			 * --local-only option to skip non-local
776			 * filesystems.  Skip synthetic filesystems
777			 * regardless.
778			 *
779			 * The results should be cached, since
780			 * tree.c doesn't usually visit a directory
781			 * and the directory contents together.  A simple
782			 * move-to-front list should perform quite well.
783			 *
784			 * This is going to be heavily OS dependent:
785			 * FreeBSD's statfs() in conjunction with getvfsbyname()
786			 * provides all of this; NetBSD's statvfs() does
787			 * most of it; other systems will vary.
788			 */
789		}
790
791		/*
792		 * In -u mode, check that the file is newer than what's
793		 * already in the archive; in all modes, obey --newerXXX flags.
794		 */
795		if (!new_enough(bsdtar, name, st)) {
796			if (!descend)
797				continue;
798			if (bsdtar->option_interactive &&
799			    !yes("add '%s'", name))
800				continue;
801			tree_descend(tree);
802			continue;
803		}
804
805		archive_entry_free(entry);
806		entry = archive_entry_new();
807
808		archive_entry_set_pathname(entry, name);
809		archive_entry_copy_sourcepath(entry,
810		    tree_current_access_path(tree));
811
812		/* Populate the archive_entry with metadata from the disk. */
813		/* XXX TODO: Arrange to open a regular file before
814		 * calling this so we can pass in an fd and shorten
815		 * the race to query metadata.  The linkify dance
816		 * makes this more complex than it might sound. */
817#if defined(_WIN32) && !defined(__CYGWIN__)
818		/* TODO: tree.c uses stat(), which is badly broken
819		 * on Windows.  To fix this, we should
820		 * deprecate tree_current_stat() and provide a new
821		 * call tree_populate_entry(t, entry).  This call
822		 * would use stat() internally on POSIX and
823		 * GetInfoByFileHandle() internally on Windows.
824		 * This would be another step towards a tree-walker
825		 * that can be integrated deep into libarchive.
826		 * For now, just set st to NULL on Windows;
827		 * archive_read_disk_entry_from_file() should
828		 * be smart enough to use platform-appropriate
829		 * ways to probe file information.
830		 */
831		st = NULL;
832#endif
833		r = archive_read_disk_entry_from_file(bsdtar->diskreader,
834		    entry, -1, st);
835		if (bsdtar->uid >= 0) {
836			archive_entry_set_uid(entry, bsdtar->uid);
837			if (!bsdtar->uname)
838				archive_entry_set_uname(entry,
839				    archive_read_disk_uname(bsdtar->diskreader,
840					bsdtar->uid));
841		}
842		if (bsdtar->gid >= 0) {
843			archive_entry_set_gid(entry, bsdtar->gid);
844			if (!bsdtar->gname)
845				archive_entry_set_gname(entry,
846				    archive_read_disk_gname(bsdtar->diskreader,
847					bsdtar->gid));
848		}
849		if (bsdtar->uname)
850			archive_entry_set_uname(entry, bsdtar->uname);
851		if (bsdtar->gname)
852			archive_entry_set_gname(entry, bsdtar->gname);
853		if (r != ARCHIVE_OK)
854			lafe_warnc(archive_errno(bsdtar->diskreader),
855			    "%s", archive_error_string(bsdtar->diskreader));
856		if (r < ARCHIVE_WARN)
857			continue;
858
859		/* XXX TODO: Just use flag data from entry; avoid the
860		 * duplicate check here. */
861
862		/*
863		 * If this file/dir is flagged "nodump" and we're
864		 * honoring such flags, skip this file/dir.
865		 */
866#if defined(HAVE_STRUCT_STAT_ST_FLAGS) && defined(UF_NODUMP)
867		/* BSD systems store flags in struct stat */
868		if (bsdtar->option_honor_nodump &&
869		    (lst->st_flags & UF_NODUMP))
870			continue;
871#endif
872
873#if defined(EXT2_IOC_GETFLAGS) && defined(EXT2_NODUMP_FL)
874		/* Linux uses ioctl to read flags. */
875		if (bsdtar->option_honor_nodump) {
876			int fd = open(name, O_RDONLY | O_NONBLOCK | O_BINARY);
877			if (fd >= 0) {
878				unsigned long fflags;
879				int r = ioctl(fd, EXT2_IOC_GETFLAGS, &fflags);
880				close(fd);
881				if (r >= 0 && (fflags & EXT2_NODUMP_FL))
882					continue;
883			}
884		}
885#endif
886
887		/*
888		 * If the user vetoes this file/directory, skip it.
889		 * We want this to be fairly late; if some other
890		 * check would veto this file, we shouldn't bother
891		 * the user with it.
892		 */
893		if (bsdtar->option_interactive &&
894		    !yes("add '%s'", name))
895			continue;
896
897		if (descend)
898			tree_descend(tree);
899
900		/*
901		 * Rewrite the pathname to be archived.  If rewrite
902		 * fails, skip the entry.
903		 */
904		if (edit_pathname(bsdtar, entry))
905			continue;
906
907		/* Display entry as we process it.
908		 * This format is required by SUSv2. */
909		if (bsdtar->verbose)
910			safe_fprintf(stderr, "a %s",
911			    archive_entry_pathname(entry));
912
913		/* Non-regular files get archived with zero size. */
914		if (archive_entry_filetype(entry) != AE_IFREG)
915			archive_entry_set_size(entry, 0);
916
917		archive_entry_linkify(bsdtar->resolver, &entry, &spare_entry);
918
919		while (entry != NULL) {
920			write_entry_backend(bsdtar, a, entry);
921			archive_entry_free(entry);
922			entry = spare_entry;
923			spare_entry = NULL;
924		}
925
926		if (bsdtar->verbose)
927			fprintf(stderr, "\n");
928	}
929	archive_entry_free(entry);
930	tree_close(tree);
931}
932
933/*
934 * Backend for write_entry.
935 */
936static void
937write_entry_backend(struct bsdtar *bsdtar, struct archive *a,
938    struct archive_entry *entry)
939{
940	int fd = -1;
941	int e;
942
943	if (archive_entry_size(entry) > 0) {
944		const char *pathname = archive_entry_sourcepath(entry);
945		fd = open(pathname, O_RDONLY | O_BINARY);
946		if (fd == -1) {
947			bsdtar->return_value = 1;
948			if (!bsdtar->verbose)
949				lafe_warnc(errno,
950				    "%s: could not open file", pathname);
951			else
952				fprintf(stderr, ": %s", strerror(errno));
953			return;
954		}
955	}
956
957	e = archive_write_header(a, entry);
958	if (e != ARCHIVE_OK) {
959		if (!bsdtar->verbose)
960			lafe_warnc(0, "%s: %s",
961			    archive_entry_pathname(entry),
962			    archive_error_string(a));
963		else
964			fprintf(stderr, ": %s", archive_error_string(a));
965	}
966
967	if (e == ARCHIVE_FATAL)
968		exit(1);
969
970	/*
971	 * If we opened a file earlier, write it out now.  Note that
972	 * the format handler might have reset the size field to zero
973	 * to inform us that the archive body won't get stored.  In
974	 * that case, just skip the write.
975	 */
976	if (e >= ARCHIVE_WARN && fd >= 0 && archive_entry_size(entry) > 0) {
977		if (write_file_data(bsdtar, a, entry, fd))
978			exit(1);
979	}
980
981	/*
982	 * If we opened a file, close it now even if there was an error
983	 * which made us decide not to write the archive body.
984	 */
985	if (fd >= 0)
986		close(fd);
987}
988
989static void
990report_write(struct bsdtar *bsdtar, struct archive *a,
991    struct archive_entry *entry, int64_t progress)
992{
993	uint64_t comp, uncomp;
994	int compression;
995
996	if (bsdtar->verbose)
997		fprintf(stderr, "\n");
998	comp = archive_position_compressed(a);
999	uncomp = archive_position_uncompressed(a);
1000	fprintf(stderr, "In: %d files, %s bytes;",
1001	    archive_file_count(a), tar_i64toa(uncomp));
1002	if (comp > uncomp)
1003		compression = 0;
1004	else
1005		compression = (int)((uncomp - comp) * 100 / uncomp);
1006	fprintf(stderr,
1007	    " Out: %s bytes, compression %d%%\n",
1008	    tar_i64toa(comp), compression);
1009	/* Can't have two calls to tar_i64toa() pending, so split the output. */
1010	safe_fprintf(stderr, "Current: %s (%s",
1011	    archive_entry_pathname(entry),
1012	    tar_i64toa(progress));
1013	fprintf(stderr, "/%s bytes)\n",
1014	    tar_i64toa(archive_entry_size(entry)));
1015}
1016
1017
1018/* Helper function to copy file to archive. */
1019static int
1020write_file_data(struct bsdtar *bsdtar, struct archive *a,
1021    struct archive_entry *entry, int fd)
1022{
1023	ssize_t	bytes_read;
1024	ssize_t	bytes_written;
1025	int64_t	progress = 0;
1026
1027	bytes_read = read(fd, bsdtar->buff, FILEDATABUFLEN);
1028	while (bytes_read > 0) {
1029		if (need_report())
1030			report_write(bsdtar, a, entry, progress);
1031
1032		bytes_written = archive_write_data(a, bsdtar->buff,
1033		    bytes_read);
1034		if (bytes_written < 0) {
1035			/* Write failed; this is bad */
1036			lafe_warnc(0, "%s", archive_error_string(a));
1037			return (-1);
1038		}
1039		if (bytes_written < bytes_read) {
1040			/* Write was truncated; warn but continue. */
1041			lafe_warnc(0,
1042			    "%s: Truncated write; file may have grown while being archived.",
1043			    archive_entry_pathname(entry));
1044			return (0);
1045		}
1046		progress += bytes_written;
1047		bytes_read = read(fd, bsdtar->buff, FILEDATABUFLEN);
1048	}
1049	if (bytes_read < 0) {
1050		lafe_warnc(errno,
1051			     "%s: Read error",
1052			     archive_entry_pathname(entry));
1053		bsdtar->return_value = 1;
1054	}
1055	return 0;
1056}
1057
1058/*
1059 * Test if the specified file is new enough to include in the archive.
1060 */
1061static int
1062new_enough(struct bsdtar *bsdtar, const char *path, const struct stat *st)
1063{
1064	struct archive_dir_entry *p;
1065
1066	/*
1067	 * If this file/dir is excluded by a time comparison, skip it.
1068	 */
1069	if (bsdtar->newer_ctime_sec > 0) {
1070		if (st->st_ctime < bsdtar->newer_ctime_sec)
1071			return (0); /* Too old, skip it. */
1072		if (st->st_ctime == bsdtar->newer_ctime_sec
1073		    && ARCHIVE_STAT_CTIME_NANOS(st)
1074		    <= bsdtar->newer_ctime_nsec)
1075			return (0); /* Too old, skip it. */
1076	}
1077	if (bsdtar->newer_mtime_sec > 0) {
1078		if (st->st_mtime < bsdtar->newer_mtime_sec)
1079			return (0); /* Too old, skip it. */
1080		if (st->st_mtime == bsdtar->newer_mtime_sec
1081		    && ARCHIVE_STAT_MTIME_NANOS(st)
1082		    <= bsdtar->newer_mtime_nsec)
1083			return (0); /* Too old, skip it. */
1084	}
1085
1086	/*
1087	 * In -u mode, we only write an entry if it's newer than
1088	 * what was already in the archive.
1089	 */
1090	if (bsdtar->archive_dir != NULL &&
1091	    bsdtar->archive_dir->head != NULL) {
1092		for (p = bsdtar->archive_dir->head; p != NULL; p = p->next) {
1093			if (pathcmp(path, p->name)==0)
1094				return (p->mtime_sec < st->st_mtime ||
1095				    (p->mtime_sec == st->st_mtime &&
1096					p->mtime_nsec
1097					< ARCHIVE_STAT_MTIME_NANOS(st)));
1098		}
1099	}
1100
1101	/* If the file wasn't rejected, include it. */
1102	return (1);
1103}
1104
1105/*
1106 * Add an entry to the dir list for 'u' mode.
1107 *
1108 * XXX TODO: Make this fast.
1109 */
1110static void
1111add_dir_list(struct bsdtar *bsdtar, const char *path,
1112    time_t mtime_sec, int mtime_nsec)
1113{
1114	struct archive_dir_entry	*p;
1115
1116	/*
1117	 * Search entire list to see if this file has appeared before.
1118	 * If it has, override the timestamp data.
1119	 */
1120	p = bsdtar->archive_dir->head;
1121	while (p != NULL) {
1122		if (strcmp(path, p->name)==0) {
1123			p->mtime_sec = mtime_sec;
1124			p->mtime_nsec = mtime_nsec;
1125			return;
1126		}
1127		p = p->next;
1128	}
1129
1130	p = malloc(sizeof(*p));
1131	if (p == NULL)
1132		lafe_errc(1, ENOMEM, "Can't read archive directory");
1133
1134	p->name = strdup(path);
1135	if (p->name == NULL)
1136		lafe_errc(1, ENOMEM, "Can't read archive directory");
1137	p->mtime_sec = mtime_sec;
1138	p->mtime_nsec = mtime_nsec;
1139	p->next = NULL;
1140	if (bsdtar->archive_dir->tail == NULL) {
1141		bsdtar->archive_dir->head = bsdtar->archive_dir->tail = p;
1142	} else {
1143		bsdtar->archive_dir->tail->next = p;
1144		bsdtar->archive_dir->tail = p;
1145	}
1146}
1147
1148static void
1149test_for_append(struct bsdtar *bsdtar)
1150{
1151	struct stat s;
1152
1153	if (*bsdtar->argv == NULL && bsdtar->names_from_file == NULL)
1154		lafe_errc(1, 0, "no files or directories specified");
1155	if (bsdtar->filename == NULL)
1156		lafe_errc(1, 0, "Cannot append to stdout.");
1157
1158	if (bsdtar->create_compression != 0)
1159		lafe_errc(1, 0,
1160		    "Cannot append to %s with compression", bsdtar->filename);
1161
1162	if (stat(bsdtar->filename, &s) != 0)
1163		return;
1164
1165	if (!S_ISREG(s.st_mode) && !S_ISBLK(s.st_mode))
1166		lafe_errc(1, 0,
1167		    "Cannot append to %s: not a regular file.",
1168		    bsdtar->filename);
1169
1170/* Is this an appropriate check here on Windows? */
1171/*
1172	if (GetFileType(handle) != FILE_TYPE_DISK)
1173		lafe_errc(1, 0, "Cannot append");
1174*/
1175
1176}
1177