Merge from vendor branch LIBARCHIVE:
[dragonfly.git] / contrib / libarchive-2 / tar / read.c
1 /*-
2  * Copyright (c) 2003-2007 Tim Kientzle
3  * All rights reserved.
4  *
5  * Redistribution and use in source and binary forms, with or without
6  * modification, are permitted provided that the following conditions
7  * are met:
8  * 1. Redistributions of source code must retain the above copyright
9  *    notice, this list of conditions and the following disclaimer.
10  * 2. Redistributions in binary form must reproduce the above copyright
11  *    notice, this list of conditions and the following disclaimer in the
12  *    documentation and/or other materials provided with the distribution.
13  *
14  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR(S) ``AS IS'' AND ANY EXPRESS OR
15  * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
16  * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
17  * IN NO EVENT SHALL THE AUTHOR(S) BE LIABLE FOR ANY DIRECT, INDIRECT,
18  * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
19  * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
20  * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
21  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
22  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
23  * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
24  */
25
26 #include "bsdtar_platform.h"
27 __FBSDID("$FreeBSD: src/usr.bin/tar/read.c,v 1.38 2008/05/26 17:10:10 kientzle Exp $");
28
29 #ifdef HAVE_SYS_TYPES_H
30 #include <sys/types.h>
31 #endif
32 #ifdef MAJOR_IN_MKDEV
33 #include <sys/mkdev.h>
34 #elif defined(MAJOR_IN_SYSMACROS)
35 #include <sys/sysmacros.h>
36 #endif
37 #ifdef HAVE_SYS_PARAM_H
38 #include <sys/param.h>
39 #endif
40 #ifdef HAVE_SYS_STAT_H
41 #include <sys/stat.h>
42 #endif
43
44 #ifdef HAVE_ERRNO_H
45 #include <errno.h>
46 #endif
47 #ifdef HAVE_GRP_H
48 #include <grp.h>
49 #endif
50 #ifdef HAVE_LIMITS_H
51 #include <limits.h>
52 #endif
53 #ifdef HAVE_PWD_H
54 #include <pwd.h>
55 #endif
56 #include <stdio.h>
57 #ifdef HAVE_STDLIB_H
58 #include <stdlib.h>
59 #endif
60 #ifdef HAVE_STRING_H
61 #include <string.h>
62 #endif
63 #ifdef HAVE_TIME_H
64 #include <time.h>
65 #endif
66 #ifdef HAVE_UNISTD_H
67 #include <unistd.h>
68 #endif
69
70 #include "bsdtar.h"
71
/* Forward declarations for the file-local helpers defined below. */
static void     read_archive(struct bsdtar *bsdtar, char mode);
static void     list_item_verbose(struct bsdtar *bsdtar, FILE *out,
                    struct archive_entry *entry);
75
/*
 * Entry point for 't' (list) mode: run the shared archive-reading loop
 * in list mode, then let unmatched_inclusions_warn() report with the
 * message "Not found in archive".
 */
void
tar_mode_t(struct bsdtar *bsdtar)
{
        const char      mode = 't';

        read_archive(bsdtar, mode);
        unmatched_inclusions_warn(bsdtar, "Not found in archive");
}
82
/*
 * Entry point for 'x' (extract) mode.
 *
 * The archive pass is bracketed by siginfo_init()/siginfo_done() so that
 * SIGINFO and SIGUSR1 are caught while extracting and the previous
 * handlers are restored once the pass (and the unmatched-inclusion
 * report) is finished.
 */
void
tar_mode_x(struct bsdtar *bsdtar)
{
        const char      mode = 'x';

        siginfo_init(bsdtar);   /* Start catching SIGINFO and SIGUSR1. */

        read_archive(bsdtar, mode);
        unmatched_inclusions_warn(bsdtar, "Not found in archive");

        siginfo_done(bsdtar);   /* Put the old handlers back. */
}
95
/*
 * Progress callback registered by read_archive() for extract mode.
 * The cookie is the struct bsdtar that was passed at registration time;
 * it is forwarded unchanged to siginfo_printinfo().
 */
static void
progress_func(void * cookie)
{
        siginfo_printinfo((struct bsdtar *)cookie, 0);
}
103
104 /*
105  * Handle 'x' and 't' modes.
106  */
107 static void
108 read_archive(struct bsdtar *bsdtar, char mode)
109 {
110         FILE                     *out;
111         struct archive           *a;
112         struct archive_entry     *entry;
113         const struct stat        *st;
114         int                       r;
115
116         while (*bsdtar->argv) {
117                 include(bsdtar, *bsdtar->argv);
118                 bsdtar->argv++;
119         }
120
121         if (bsdtar->names_from_file != NULL)
122                 include_from_file(bsdtar, bsdtar->names_from_file);
123
124         a = archive_read_new();
125         if (bsdtar->compress_program != NULL)
126                 archive_read_support_compression_program(a, bsdtar->compress_program);
127         else
128                 archive_read_support_compression_all(a);
129         archive_read_support_format_all(a);
130         if (archive_read_open_file(a, bsdtar->filename,
131             bsdtar->bytes_per_block != 0 ? bsdtar->bytes_per_block :
132             DEFAULT_BYTES_PER_BLOCK))
133                 bsdtar_errc(bsdtar, 1, 0, "Error opening archive: %s",
134                     archive_error_string(a));
135
136         do_chdir(bsdtar);
137
138         if (mode == 'x') {
139                 /* Set an extract callback so that we can handle SIGINFO. */
140                 archive_read_extract_set_progress_callback(a, progress_func,
141                     bsdtar);
142         }
143
144         if (mode == 'x' && bsdtar->option_chroot) {
145 #if HAVE_CHROOT
146                 if (chroot(".") != 0)
147                         bsdtar_errc(bsdtar, 1, errno, "Can't chroot to \".\"");
148 #else
149                 bsdtar_errc(bsdtar, 1, 0,
150                     "chroot isn't supported on this platform");
151 #endif
152         }
153
154         for (;;) {
155                 /* Support --fast-read option */
156                 if (bsdtar->option_fast_read &&
157                     unmatched_inclusions(bsdtar) == 0)
158                         break;
159
160                 r = archive_read_next_header(a, &entry);
161                 if (r == ARCHIVE_EOF)
162                         break;
163                 if (r < ARCHIVE_OK)
164                         bsdtar_warnc(bsdtar, 0, "%s", archive_error_string(a));
165                 if (r <= ARCHIVE_WARN)
166                         bsdtar->return_value = 1;
167                 if (r == ARCHIVE_RETRY) {
168                         /* Retryable error: try again */
169                         bsdtar_warnc(bsdtar, 0, "Retrying...");
170                         continue;
171                 }
172                 if (r == ARCHIVE_FATAL)
173                         break;
174
175                 if (bsdtar->option_numeric_owner) {
176                         archive_entry_set_uname(entry, NULL);
177                         archive_entry_set_gname(entry, NULL);
178                 }
179
180                 /*
181                  * Exclude entries that are too old.
182                  */
183                 st = archive_entry_stat(entry);
184                 if (bsdtar->newer_ctime_sec > 0) {
185                         if (st->st_ctime < bsdtar->newer_ctime_sec)
186                                 continue; /* Too old, skip it. */
187                         if (st->st_ctime == bsdtar->newer_ctime_sec
188                             && ARCHIVE_STAT_CTIME_NANOS(st)
189                             <= bsdtar->newer_ctime_nsec)
190                                 continue; /* Too old, skip it. */
191                 }
192                 if (bsdtar->newer_mtime_sec > 0) {
193                         if (st->st_mtime < bsdtar->newer_mtime_sec)
194                                 continue; /* Too old, skip it. */
195                         if (st->st_mtime == bsdtar->newer_mtime_sec
196                             && ARCHIVE_STAT_MTIME_NANOS(st)
197                             <= bsdtar->newer_mtime_nsec)
198                                 continue; /* Too old, skip it. */
199                 }
200
201                 /*
202                  * Note that pattern exclusions are checked before
203                  * pathname rewrites are handled.  This gives more
204                  * control over exclusions, since rewrites always lose
205                  * information.  (For example, consider a rewrite
206                  * s/foo[0-9]/foo/.  If we check exclusions after the
207                  * rewrite, there would be no way to exclude foo1/bar
208                  * while allowing foo2/bar.)
209                  */
210                 if (excluded(bsdtar, archive_entry_pathname(entry)))
211                         continue; /* Excluded by a pattern test. */
212
213                 /*
214                  * Modify the pathname as requested by the user.  We
215                  * do this for -t as well to give users a way to
216                  * preview the effects of their rewrites.  We also do
217                  * this before extraction security checks (including
218                  * leading '/' removal).  Note that some rewrite
219                  * failures prevent extraction.
220                  */
221                 if (edit_pathname(bsdtar, entry))
222                         continue; /* Excluded by a rewrite failure. */
223
224                 if (mode == 't') {
225                         /* Perversely, gtar uses -O to mean "send to stderr"
226                          * when used with -t. */
227                         out = bsdtar->option_stdout ? stderr : stdout;
228
229                         if (bsdtar->verbose < 2)
230                                 safe_fprintf(out, "%s",
231                                     archive_entry_pathname(entry));
232                         else
233                                 list_item_verbose(bsdtar, out, entry);
234                         fflush(out);
235                         r = archive_read_data_skip(a);
236                         if (r == ARCHIVE_WARN) {
237                                 fprintf(out, "\n");
238                                 bsdtar_warnc(bsdtar, 0, "%s",
239                                     archive_error_string(a));
240                         }
241                         if (r == ARCHIVE_RETRY) {
242                                 fprintf(out, "\n");
243                                 bsdtar_warnc(bsdtar, 0, "%s",
244                                     archive_error_string(a));
245                         }
246                         if (r == ARCHIVE_FATAL) {
247                                 fprintf(out, "\n");
248                                 bsdtar_warnc(bsdtar, 0, "%s",
249                                     archive_error_string(a));
250                                 bsdtar->return_value = 1;
251                                 break;
252                         }
253                         fprintf(out, "\n");
254                 } else {
255                         if (bsdtar->option_interactive &&
256                             !yes("extract '%s'", archive_entry_pathname(entry)))
257                                 continue;
258
259                         /*
260                          * Format here is from SUSv2, including the
261                          * deferred '\n'.
262                          */
263                         if (bsdtar->verbose) {
264                                 safe_fprintf(stderr, "x %s",
265                                     archive_entry_pathname(entry));
266                                 fflush(stderr);
267                         }
268
269                         /* Tell the SIGINFO-handler code what we're doing. */
270                         siginfo_setinfo(bsdtar, "extracting",
271                             archive_entry_pathname(entry), 0);
272                         siginfo_printinfo(bsdtar, 0);
273
274                         if (bsdtar->option_stdout)
275                                 r = archive_read_data_into_fd(a, 1);
276                         else
277                                 r = archive_read_extract(a, entry,
278                                     bsdtar->extract_flags);
279                         if (r != ARCHIVE_OK) {
280                                 if (!bsdtar->verbose)
281                                         safe_fprintf(stderr, "%s",
282                                             archive_entry_pathname(entry));
283                                 safe_fprintf(stderr, ": %s",
284                                     archive_error_string(a));
285                                 if (!bsdtar->verbose)
286                                         fprintf(stderr, "\n");
287                                 bsdtar->return_value = 1;
288                         }
289                         if (bsdtar->verbose)
290                                 fprintf(stderr, "\n");
291                         if (r == ARCHIVE_FATAL)
292                                 break;
293                 }
294         }
295
296         if (bsdtar->verbose > 2)
297                 fprintf(stdout, "Archive Format: %s,  Compression: %s\n",
298                     archive_format_name(a), archive_compression_name(a));
299
300         archive_read_finish(a);
301 }
302
303
304 /*
305  * Display information about the current file.
306  *
307  * The format here roughly duplicates the output of 'ls -l'.
308  * This is based on SUSv2, where 'tar tv' is documented as
309  * listing additional information in an "unspecified format,"
310  * and 'pax -l' is documented as using the same format as 'ls -l'.
311  */
312 static void
313 list_item_verbose(struct bsdtar *bsdtar, FILE *out, struct archive_entry *entry)
314 {
315         const struct stat       *st;
316         char                     tmp[100];
317         size_t                   w;
318         const char              *p;
319         const char              *fmt;
320         time_t                   tim;
321         static time_t            now;
322
323         st = archive_entry_stat(entry);
324
325         /*
326          * We avoid collecting the entire list in memory at once by
327          * listing things as we see them.  However, that also means we can't
328          * just pre-compute the field widths.  Instead, we start with guesses
329          * and just widen them as necessary.  These numbers are completely
330          * arbitrary.
331          */
332         if (!bsdtar->u_width) {
333                 bsdtar->u_width = 6;
334                 bsdtar->gs_width = 13;
335         }
336         if (!now)
337                 time(&now);
338         fprintf(out, "%s %d ",
339             archive_entry_strmode(entry),
340             (int)(st->st_nlink));
341
342         /* Use uname if it's present, else uid. */
343         p = archive_entry_uname(entry);
344         if ((p == NULL) || (*p == '\0')) {
345                 sprintf(tmp, "%lu ", (unsigned long)st->st_uid);
346                 p = tmp;
347         }
348         w = strlen(p);
349         if (w > bsdtar->u_width)
350                 bsdtar->u_width = w;
351         fprintf(out, "%-*s ", (int)bsdtar->u_width, p);
352
353         /* Use gname if it's present, else gid. */
354         p = archive_entry_gname(entry);
355         if (p != NULL && p[0] != '\0') {
356                 fprintf(out, "%s", p);
357                 w = strlen(p);
358         } else {
359                 sprintf(tmp, "%lu", (unsigned long)st->st_gid);
360                 w = strlen(tmp);
361                 fprintf(out, "%s", tmp);
362         }
363
364         /*
365          * Print device number or file size, right-aligned so as to make
366          * total width of group and devnum/filesize fields be gs_width.
367          * If gs_width is too small, grow it.
368          */
369         if (S_ISCHR(st->st_mode) || S_ISBLK(st->st_mode)) {
370                 sprintf(tmp, "%lu,%lu",
371                     (unsigned long)major(st->st_rdev),
372                     (unsigned long)minor(st->st_rdev)); /* ls(1) also casts here. */
373         } else {
374                 /*
375                  * Note the use of platform-dependent macros to format
376                  * the filesize here.  We need the format string and the
377                  * corresponding type for the cast.
378                  */
379                 sprintf(tmp, BSDTAR_FILESIZE_PRINTF,
380                     (BSDTAR_FILESIZE_TYPE)st->st_size);
381         }
382         if (w + strlen(tmp) >= bsdtar->gs_width)
383                 bsdtar->gs_width = w+strlen(tmp)+1;
384         fprintf(out, "%*s", (int)(bsdtar->gs_width - w), tmp);
385
386         /* Format the time using 'ls -l' conventions. */
387         tim = (time_t)st->st_mtime;
388         if (abs(tim - now) > (365/2)*86400)
389                 fmt = bsdtar->day_first ? "%e %b  %Y" : "%b %e  %Y";
390         else
391                 fmt = bsdtar->day_first ? "%e %b %H:%M" : "%b %e %H:%M";
392         strftime(tmp, sizeof(tmp), fmt, localtime(&tim));
393         fprintf(out, " %s ", tmp);
394         safe_fprintf(out, "%s", archive_entry_pathname(entry));
395
396         /* Extra information for links. */
397         if (archive_entry_hardlink(entry)) /* Hard link */
398                 safe_fprintf(out, " link to %s",
399                     archive_entry_hardlink(entry));
400         else if (S_ISLNK(st->st_mode)) /* Symbolic link */
401                 safe_fprintf(out, " -> %s", archive_entry_symlink(entry));
402 }