xref: /original-bsd/bin/pax/ar_subs.c (revision b4971bb3)
1 /*-
2  * Copyright (c) 1992 Keith Muller.
3  * Copyright (c) 1992, 1993
4  *	The Regents of the University of California.  All rights reserved.
5  *
6  * This code is derived from software contributed to Berkeley by
7  * Keith Muller of the University of California, San Diego.
8  *
9  * %sccs.include.redist.c%
10  */
11 
12 #ifndef lint
13 static char sccsid[] = "@(#)ar_subs.c	8.1 (Berkeley) 05/31/93";
14 #endif /* not lint */
15 
16 #include <sys/types.h>
17 #include <sys/time.h>
18 #include <sys/stat.h>
19 #include <sys/param.h>
20 #include <signal.h>
21 #include <string.h>
22 #include <stdio.h>
23 #include <ctype.h>
24 #include <fcntl.h>
25 #include <errno.h>
26 #include <unistd.h>
27 #include <stdlib.h>
28 #include "pax.h"
29 #include "extern.h"
30 
31 static void wr_archive __P((register ARCHD *, int is_app));
32 static int get_arc __P((void));
33 static int next_head __P((register ARCHD *));
34 extern sigset_t s_mask;
35 
36 /*
37  * Routines which control the overall operation modes of pax as specified by
38  * the user: list, append, read ...
39  */
40 
41 static char hdbuf[BLKMULT];             /* space for archive header on read */
42 u_long flcnt;				/* number of files processed */
43 
44 /*
45  * list()
46  *	list the contents of an archive which match user supplied pattern(s)
47  *	(no pattern matches all).
48  */
49 
50 #if __STDC__
51 void
52 list(void)
53 #else
54 void
55 list()
56 #endif
57 {
58 	register ARCHD *arcn;
59 	register int res;
60 	ARCHD archd;
61 	time_t now;
62 
63 	arcn = &archd;
64 	/*
65 	 * figure out archive type; pass any format specific options to the
66 	 * archive option processing routine; call the format init routine. We
67 	 * also save current time for ls_list() so we do not make a system
68 	 * call for each file we need to print. If verbose (vflag) start up
69 	 * the name and group caches.
70 	 */
71 	if ((get_arc() < 0) || ((*frmt->options)() < 0) ||
72 	    ((*frmt->st_rd)() < 0))
73 		return;
74 
75 	if (vflag && ((uidtb_start() < 0) || (gidtb_start() < 0)))
76 		return;
77 
78 	now = time((time_t *)NULL);
79 
80 	/*
81 	 * step through the archive until the format says it is done
82 	 */
83 	while (next_head(arcn) == 0) {
84 		/*
85 		 * check for pattern, and user specified options match.
86 		 * When all patterns are matched we are done.
87 		 */
88 		if ((res = pat_match(arcn)) < 0)
89 			break;
90 
91 		if ((res == 0) && (sel_chk(arcn) == 0)) {
92 			/*
93 			 * pattern resulted in a selected file
94 			 */
95 			if (pat_sel(arcn) < 0)
96 				break;
97 
98 			/*
99 			 * modify the name as requested by the user if name
100 			 * survives modification, do a listing of the file
101 			 */
102 			if ((res = mod_name(arcn)) < 0)
103 				break;
104 			if (res == 0)
105 				ls_list(arcn, now);
106 		}
107 
108 		/*
109 		 * skip to next archive format header using values calculated
110 		 * by the format header read routine
111 		 */
112 		if (rd_skip(arcn->skip + arcn->pad) == 1)
113 			break;
114 	}
115 
116 	/*
117 	 * all done, let format have a chance to cleanup, and make sure that
118 	 * the patterns supplied by the user were all matched
119 	 */
120 	(void)(*frmt->end_rd)();
121 	(void)sigprocmask(SIG_BLOCK, &s_mask, (sigset_t *)NULL);
122 	ar_close();
123 	pat_chk();
124 }
125 
126 /*
127  * extract()
128  *	extract the member(s) of an archive as specified by user supplied
129  *	pattern(s) (no patterns extracts all members)
130  */
131 
132 #if __STDC__
133 void
134 extract(void)
135 #else
136 void
137 extract()
138 #endif
139 {
140 	register ARCHD *arcn;
141 	register int res;
142 	off_t cnt;
143 	ARCHD archd;
144 	struct stat sb;
145 	int fd;
146 
147 	arcn = &archd;
148 	/*
149 	 * figure out archive type; pass any format specific options to the
150 	 * archive option processing routine; call the format init routine;
151 	 * start up the directory modification time and access mode database
152 	 */
153 	if ((get_arc() < 0) || ((*frmt->options)() < 0) ||
154 	    ((*frmt->st_rd)() < 0) || (dir_start() < 0))
155 		return;
156 
157 	/*
158 	 * When we are doing interactive rename, we store the mapping of names
159 	 * so we can fix up hard links files later in the archive.
160 	 */
161 	if (iflag && (name_start() < 0))
162 		return;
163 
164 	/*
165 	 * step through each entry on the archive until the format read routine
166 	 * says it is done
167 	 */
168 	while (next_head(arcn) == 0) {
169 
170 		/*
171 		 * check for pattern, and user specified options match. When
172 		 * all the patterns are matched we are done
173 		 */
174 		if ((res = pat_match(arcn)) < 0)
175 			break;
176 
177 		if ((res > 0) || (sel_chk(arcn) != 0)) {
178 			/*
179 			 * file is not selected. skip past any file data and
180 			 * padding and go back for the next archive member
181 			 */
182 			(void)rd_skip(arcn->skip + arcn->pad);
183 			continue;
184 		}
185 
186 		/*
187 		 * with -u or -D only extract when the archive member is newer
188 		 * than the file with the same name in the file system (nos
189 		 * test of being the same type is required).
190 		 * NOTE: this test is done BEFORE name modifications as
191 		 * specified by pax. this operation can be confusing to the
192 		 * user who might expect the test to be done on an existing
193 		 * file AFTER the name mod. In honesty the pax spec is probably
194 		 * flawed in this respect.
195 		 */
196 		if ((uflag || Dflag) && ((lstat(arcn->name, &sb) == 0))) {
197 			if (uflag && Dflag) {
198 				if ((arcn->sb.st_mtime <= sb.st_mtime) &&
199 				    (arcn->sb.st_ctime <= sb.st_ctime)) {
200 					(void)rd_skip(arcn->skip + arcn->pad);
201 					continue;
202 				}
203 			} else if (Dflag) {
204 				if (arcn->sb.st_ctime <= sb.st_ctime) {
205 					(void)rd_skip(arcn->skip + arcn->pad);
206 					continue;
207 				}
208 			} else if (arcn->sb.st_mtime <= sb.st_mtime) {
209 				(void)rd_skip(arcn->skip + arcn->pad);
210 				continue;
211 			}
212 		}
213 
214 		/*
215 		 * this archive member is now been selected. modify the name.
216 		 */
217 		if ((pat_sel(arcn) < 0) || ((res = mod_name(arcn)) < 0))
218 			break;
219 		if (res > 0) {
220 			/*
221 			 * a bad name mod, skip and purge name from link table
222 			 */
223 			purg_lnk(arcn);
224 			(void)rd_skip(arcn->skip + arcn->pad);
225 			continue;
226 		}
227 
228 		/*
229 		 * Non standard -Y and -Z flag. When the exisiting file is
230 		 * same age or newer skip
231 		 */
232 		if ((Yflag || Zflag) && ((lstat(arcn->name, &sb) == 0))) {
233 			if (Yflag && Zflag) {
234 				if ((arcn->sb.st_mtime <= sb.st_mtime) &&
235 				    (arcn->sb.st_ctime <= sb.st_ctime)) {
236 					(void)rd_skip(arcn->skip + arcn->pad);
237 					continue;
238 				}
239 			} else if (Yflag) {
240 				if (arcn->sb.st_ctime <= sb.st_ctime) {
241 					(void)rd_skip(arcn->skip + arcn->pad);
242 					continue;
243 				}
244 			} else if (arcn->sb.st_mtime <= sb.st_mtime) {
245 				(void)rd_skip(arcn->skip + arcn->pad);
246 				continue;
247 			}
248 		}
249 
250 		if (vflag) {
251 			(void)fputs(arcn->name, stderr);
252 			vfpart = 1;
253 		}
254 
255 		/*
256 		 * all ok, extract this member based on type
257 		 */
258 		if ((arcn->type != PAX_REG) && (arcn->type != PAX_CTG)) {
259 			/*
260 			 * process archive members that are not regular files.
261 			 * throw out padding and any data that might follow the
262 			 * header (as determined by the format).
263 			 */
264 			if ((arcn->type == PAX_HLK) || (arcn->type == PAX_HRG))
265 				res = lnk_creat(arcn);
266 			else
267 				res = node_creat(arcn);
268 
269 			(void)rd_skip(arcn->skip + arcn->pad);
270 			if (res < 0)
271 				purg_lnk(arcn);
272 
273 			if (vflag && vfpart) {
274 				(void)putc('\n', stderr);
275 				vfpart = 0;
276 			}
277 			continue;
278 		}
279 		/*
280 		 * we have a file with data here. If we can not create it, skip
281 		 * over the data and purge the name from hard link table
282 		 */
283 		if ((fd = file_creat(arcn)) < 0) {
284 			(void)rd_skip(arcn->skip + arcn->pad);
285 			purg_lnk(arcn);
286 			continue;
287 		}
288 		/*
289 		 * extract the file from the archive and skip over padding and
290 		 * any unprocessed data
291 		 */
292 		res = (*frmt->rd_data)(arcn, fd, &cnt);
293 		file_close(arcn, fd);
294 		if (vflag && vfpart) {
295 			(void)putc('\n', stderr);
296 			vfpart = 0;
297 		}
298 		if (!res)
299 			(void)rd_skip(cnt + arcn->pad);
300 	}
301 
302 	/*
303 	 * all done, restore directory modes and times as required; make sure
304 	 * all patterns supplied by the user were matched; block off signals
305 	 * to avoid chance for multiple entry into the cleanup code.
306 	 */
307 	(void)(*frmt->end_rd)();
308 	(void)sigprocmask(SIG_BLOCK, &s_mask, (sigset_t *)NULL);
309 	ar_close();
310 	proc_dir();
311 	pat_chk();
312 }
313 
314 /*
315  * wr_archive()
316  *	Write an archive. used in both creating a new archive and appends on
317  *	previously written archive.
318  */
319 
320 #if __STDC__
321 static void
322 wr_archive(register ARCHD *arcn, int is_app)
323 #else
324 static void
325 wr_archive(arcn, is_app)
326 	register ARCHD *arcn;
327 	int is_app;
328 #endif
329 {
330 	register int res;
331 	register int hlk;
332 	register int wr_one;
333 	off_t cnt;
334 	int (*wrf)();
335 	int fd = -1;
336 
337 	/*
338 	 * if this format supports hard link storage, start up the database
339 	 * that detects them.
340 	 */
341 	if (((hlk = frmt->hlk) == 1) && (lnk_start() < 0))
342 		return;
343 
344 	/*
345 	 * start up the file traversal code and format specific write
346 	 */
347 	if ((ftree_start() < 0) || ((*frmt->st_wr)() < 0))
348 		return;
349 	wrf = frmt->wr;
350 
351 	/*
352 	 * When we are doing interactive rename, we store the mapping of names
353 	 * so we can fix up hard links files later in the archive.
354 	 */
355 	if (iflag && (name_start() < 0))
356 		return;
357 
358 	/*
359 	 * if this not append, and there are no files, we do no write a trailer
360 	 */
361 	wr_one = is_app;
362 
363 	/*
364 	 * while there are files to archive, process them one at at time
365 	 */
366 	while (next_file(arcn) == 0) {
367 		/*
368 		 * check if this file meets user specified options match.
369 		 */
370 		if (sel_chk(arcn) != 0)
371 			continue;
372 		fd = -1;
373 		if (uflag) {
374 			/*
375 			 * only archive if this file is newer than a file with
376 			 * the same name that is already stored on the archive
377 			 */
378 			if ((res = chk_ftime(arcn)) < 0)
379 				break;
380 			if (res > 0)
381 				continue;
382 		}
383 
384 		/*
385 		 * this file is considered selected now. see if this is a hard
386 		 * link to a file already stored
387 		 */
388 		ftree_sel(arcn);
389 		if (hlk && (chk_lnk(arcn) < 0))
390 			break;
391 
392 		if ((arcn->type == PAX_REG) || (arcn->type == PAX_HRG) ||
393 		    (arcn->type == PAX_CTG)) {
394 			/*
395 			 * we will have to read this file. by opening it now we
396 			 * can avoid writing a header to the archive for a file
397 			 * we were later unable to read (we also purge it from
398 			 * the link table).
399 			 */
400 			if ((fd = open(arcn->org_name, O_RDONLY, 0)) < 0) {
401 				syswarn(1,errno, "Unable to open %s to read",
402 					arcn->org_name);
403 				purg_lnk(arcn);
404 				continue;
405 			}
406 		}
407 
408 		/*
409 		 * Now modify the name as requested by the user
410 		 */
411 		if ((res = mod_name(arcn)) < 0) {
412 			/*
413 			 * name modification says to skip this file, close the
414 			 * file and purge link table entry
415 			 */
416 			rdfile_close(arcn, &fd);
417 			purg_lnk(arcn);
418 			break;
419 		}
420 
421 		if ((res > 0) || (docrc && (set_crc(arcn, fd) < 0))) {
422 			/*
423 			 * unable to obtain the crc we need, close the file,
424 			 * purge link table entry
425 			 */
426 			rdfile_close(arcn, &fd);
427 			purg_lnk(arcn);
428 			continue;
429 		}
430 
431 		if (vflag) {
432 			(void)fputs(arcn->name, stderr);
433 			vfpart = 1;
434 		}
435 		++flcnt;
436 
437 		/*
438 		 * looks safe to store the file, have the format specific
439 		 * routine write routine store the file header on the archive
440 		 */
441 		if ((res = (*wrf)(arcn)) < 0) {
442 			rdfile_close(arcn, &fd);
443 			break;
444 		}
445 		wr_one = 1;
446 		if (res > 0) {
447 			/*
448 			 * format write says no file data needs to be stored
449 			 * so we are done messing with this file
450 			 */
451 			if (vflag && vfpart) {
452 				(void)putc('\n', stderr);
453 				vfpart = 0;
454 			}
455 			rdfile_close(arcn, &fd);
456 			continue;
457 		}
458 
459 		/*
460 		 * Add file data to the archive, quit on write error. if we
461 		 * cannot write the entire file contents to the archive we
462 		 * must pad the archive to replace the missing file data
463 		 * (otherwise during an extract the file header for the file
464 		 * which FOLLOWS this one will not be where we expect it to
465 		 * be).
466 		 */
467 		res = (*frmt->wr_data)(arcn, fd, &cnt);
468 		rdfile_close(arcn, &fd);
469 		if (vflag && vfpart) {
470 			(void)putc('\n', stderr);
471 			vfpart = 0;
472 		}
473 		if (res < 0)
474 			break;
475 
476 		/*
477 		 * pad as required, cnt is number of bytes not written
478 		 */
479 		if (((cnt > 0) && (wr_skip(cnt) < 0)) ||
480 		    ((arcn->pad > 0) && (wr_skip(arcn->pad) < 0)))
481 			break;
482 	}
483 
484 	/*
485 	 * tell format to write trailer; pad to block boundry; reset directory
486 	 * mode/access times, and check if all patterns supplied by the user
487 	 * were matched. block off signals to avoid chance for multiple entry
488 	 * into the cleanup code
489 	 */
490 	if (wr_one) {
491 		(*frmt->end_wr)();
492 		wr_fin();
493 	}
494 	(void)sigprocmask(SIG_BLOCK, &s_mask, (sigset_t *)NULL);
495 	ar_close();
496 	if (tflag)
497 		proc_dir();
498 	ftree_chk();
499 }
500 
501 /*
502  * append()
503  *	Add file to previously written archive. Archive format specified by the
504  *	user must agree with archive. The archive is read first to collect
505  *	modification times (if -u) and locate the archive trailer. The archive
506  *	is positioned in front of the record with the trailer and wr_archive()
507  *	is called to add the new members.
508  *	PAX IMPLEMENTATION DETAIL NOTE:
509  *	-u is implemented by adding the new members to the end of the archive.
510  *	Care is taken so that these do not end up as links to the older
511  *	version of the same file already stored in the archive. It is expected
512  *	when extraction occurs these newer versions will over-write the older
513  *	ones stored "earlier" in the archive (this may be a bad assumption as
514  *	it depends on the implementation of the program doing the extraction).
515  *	It is really difficult to splice in members without either re-writing
516  *	the entire archive (from the point were the old version was), or having
517  *	assistance of the format specification in terms of a special update
518  *	header that invalidates a previous archive record. The posix spec left
519  *	the method used to implement -u unspecified. This pax is able to
520  *	over write existing files that it creates.
521  */
522 
523 #if __STDC__
524 void
525 append(void)
526 #else
527 void
528 append()
529 #endif
530 {
531 	register ARCHD *arcn;
532 	register int res;
533 	ARCHD archd;
534 	FSUB *orgfrmt;
535 	int udev;
536 	off_t tlen;
537 
538 	arcn = &archd;
539 	orgfrmt = frmt;
540 
541 	/*
542 	 * Do not allow an append operation if the actual archive is of a
543 	 * different format than the user specified foramt.
544 	 */
545 	if (get_arc() < 0)
546 		return;
547 	if ((orgfrmt != NULL) && (orgfrmt != frmt)) {
548 		warn(1, "Cannot mix current archive format %s with %s",
549 		    frmt->name, orgfrmt->name);
550 		return;
551 	}
552 
553 	/*
554 	 * pass the format any options and start up format
555 	 */
556 	if (((*frmt->options)() < 0) || ((*frmt->st_rd)() < 0))
557 		return;
558 
559 	/*
560 	 * if we only are adding members that are newer, we need to save the
561 	 * mod times for all files we see.
562 	 */
563 	if (uflag && (ftime_start() < 0))
564 		return;
565 
566 	/*
567 	 * some archive formats encode hard links by recording the device and
568 	 * file serial number (inode) but copy the file anyway (multiple times)
569 	 * to the archive. When we append, we run the risk that newly added
570 	 * files may have the same device and inode numbers as those recorded
571 	 * on the archive but during a previous run. If this happens, when the
572 	 * archive is extracted we get INCORRECT hard links. We avoid this by
573 	 * remapping the device numbers so that newly added files will never
574 	 * use the same device number as one found on the archive. remapping
575 	 * allows new members to safely have links among themselves. remapping
576 	 * also avoids problems with file inode (serial number) truncations
577 	 * when the inode number is larger than storage space in the archive
578 	 * header. See the remap routines for more details.
579 	 */
580 	if ((udev = frmt->udev) && (dev_start() < 0))
581 		return;
582 
583 	/*
584 	 * reading the archive may take a long time. If verbose tell the user
585 	 */
586 	if (vflag) {
587 		(void)fputs("pax: Reading archive to position at the end...",
588 		     stderr);
589 		vfpart = 1;
590 	}
591 
592 	/*
593 	 * step through the archive until the format says it is done
594 	 */
595 	while (next_head(arcn) == 0) {
596 		/*
597 		 * check if this file meets user specified options.
598 		 */
599 		if (sel_chk(arcn) != 0) {
600 			if (rd_skip(arcn->skip + arcn->pad) == 1)
601 				break;
602 			continue;
603 		}
604 
605 		if (uflag) {
606 			/*
607 			 * see if this is the newest version of this file has
608 			 * already been seen, if so skip.
609 			 */
610 			if ((res = chk_ftime(arcn)) < 0)
611 				break;
612 			if (res > 0) {
613 				if (rd_skip(arcn->skip + arcn->pad) == 1)
614 					break;
615 				continue;
616 			}
617 		}
618 
619 		/*
620 		 * Store this device number. Device numbers seen during the
621 		 * read phase of append will cause newly appended files with a
622 		 * device number seen in the old part of the archive to be
623 		 * remapped to an unused device number.
624 		 */
625 		if ((udev && (add_dev(arcn) < 0)) ||
626 		    (rd_skip(arcn->skip + arcn->pad) == 1))
627 			break;
628 	}
629 
630 	/*
631 	 * done, finish up read and get the number of bytes to back up so we
632 	 * can add new members. The format might have used the hard link table,
633 	 * purge it.
634 	 */
635 	tlen = (*frmt->end_rd)();
636 	lnk_end();
637 
638 	/*
639 	 * try to postion for write, if this fails quit. if any error occurs,
640 	 * we will refuse to write
641 	 */
642 	if (appnd_start(tlen) < 0)
643 		return;
644 
645 	/*
646 	 * tell the user we are done reading.
647 	 */
648 	if (vflag && vfpart) {
649 		(void)fputs("done.\n", stderr);
650 		vfpart = 0;
651 	}
652 
653 	/*
654 	 * go to the writing phase to add the new members
655 	 */
656 	wr_archive(arcn, 1);
657 }
658 
659 /*
660  * archive()
661  *	write a new archive
662  */
663 
664 #if __STDC__
665 void
666 archive(void)
667 #else
668 void
669 archive()
670 #endif
671 {
672 	ARCHD archd;
673 
674 	/*
675 	 * if we only are adding members that are newer, we need to save the
676 	 * mod times for all files; set up for writing; pass the format any
677 	 * options write the archive
678 	 */
679 	if ((uflag && (ftime_start() < 0)) || (wr_start() < 0))
680 		return;
681 	if ((*frmt->options)() < 0)
682 		return;
683 
684 	wr_archive(&archd, 0);
685 }
686 
687 /*
688  * copy()
689  *	copy files from one part of the file system to another. this does not
690  *	use any archive storage. The EFFECT OF THE COPY IS THE SAME as if an
691  *	archive was written and then extracted in the destination directory
692  *	(except the files are forced to be under the destination directory).
693  */
694 
695 #if __STDC__
696 void
697 copy(void)
698 #else
699 void
700 copy()
701 #endif
702 {
703 	register ARCHD *arcn;
704 	register int res;
705 	register int fddest;
706 	register char *dest_pt;
707 	register int dlen;
708 	register int drem;
709 	int fdsrc = -1;
710 	struct stat sb;
711 	ARCHD archd;
712 	char dirbuf[PAXPATHLEN+1];
713 
714 	arcn = &archd;
715 	/*
716 	 * set up the destination dir path and make sure it is a directory. We
717 	 * make sure we have a trailing / on the destination
718 	 */
719 	dlen = l_strncpy(dirbuf, dirptr, PAXPATHLEN);
720 	dest_pt = dirbuf + dlen;
721 	if (*(dest_pt-1) != '/') {
722 		*dest_pt++ = '/';
723 		++dlen;
724 	}
725 	*dest_pt = '\0';
726 	drem = PAXPATHLEN - dlen;
727 
728 	if (stat(dirptr, &sb) < 0) {
729 		syswarn(1, errno, "Cannot access destination directory %s",
730 			dirptr);
731 		return;
732 	}
733 	if (!S_ISDIR(sb.st_mode)) {
734 		warn(1, "Destination is not a directory %s", dirptr);
735 		return;
736 	}
737 
738 	/*
739 	 * start up the hard link table; file traversal routines and the
740 	 * modification time and access mode database
741 	 */
742 	if ((lnk_start() < 0) || (ftree_start() < 0) || (dir_start() < 0))
743 		return;
744 
745 	/*
746 	 * When we are doing interactive rename, we store the mapping of names
747 	 * so we can fix up hard links files later in the archive.
748 	 */
749 	if (iflag && (name_start() < 0))
750 		return;
751 
752 	/*
753 	 * set up to cp file trees
754 	 */
755 	cp_start();
756 
757 	/*
758 	 * while there are files to archive, process them
759 	 */
760 	while (next_file(arcn) == 0) {
761 		fdsrc = -1;
762 
763 		/*
764 		 * check if this file meets user specified options
765 		 */
766 		if (sel_chk(arcn) != 0)
767 			continue;
768 
769 		/*
770 		 * if there is already a file in the destination directory with
771 		 * the same name and it is newer, skip the one stored on the
772 		 * archive.
773 		 * NOTE: this test is done BEFORE name modifications as
774 		 * specified by pax. this can be confusing to the user who
775 		 * might expect the test to be done on an existing file AFTER
776 		 * the name mod. In honesty the pax spec is probably flawed in
777 		 * this respect
778 		 */
779 		if (uflag || Dflag) {
780 			/*
781 			 * create the destination name
782 			 */
783 			if (*(arcn->name) == '/')
784 				res = 1;
785 			else
786 				res = 0;
787 			if ((arcn->nlen - res) > drem) {
788 				warn(1, "Destination pathname too long %s",
789 					arcn->name);
790 				continue;
791 			}
792 			(void)strncpy(dest_pt, arcn->name + res, drem);
793 			dirbuf[PAXPATHLEN] = '\0';
794 
795 			/*
796 			 * if existing file is same age or newer skip
797 			 */
798 			res = lstat(dirbuf, &sb);
799 			*dest_pt = '\0';
800 
801 		    	if (res == 0) {
802 				if (uflag && Dflag) {
803 					if ((arcn->sb.st_mtime<=sb.st_mtime) &&
804 			    		    (arcn->sb.st_ctime<=sb.st_ctime))
805 						continue;
806 				} else if (Dflag) {
807 					if (arcn->sb.st_ctime <= sb.st_ctime)
808 						continue;
809 				} else if (arcn->sb.st_mtime <= sb.st_mtime)
810 					continue;
811 			}
812 		}
813 
814 		/*
815 		 * this file is considered selected. See if this is a hard link
816 		 * to a previous file; modify the name as requested by the
817 		 * user; set the final destination.
818 		 */
819 		ftree_sel(arcn);
820 		if ((chk_lnk(arcn) < 0) || ((res = mod_name(arcn)) < 0))
821 			break;
822 		if ((res > 0) || (set_dest(arcn, dirbuf, dlen) < 0)) {
823 			/*
824 			 * skip file, purge from link table
825 			 */
826 			purg_lnk(arcn);
827 			continue;
828 		}
829 
830 		/*
831 		 * Non standard -Y and -Z flag. When the exisiting file is
832 		 * same age or newer skip
833 		 */
834 		if ((Yflag || Zflag) && ((lstat(arcn->name, &sb) == 0))) {
835 			if (Yflag && Zflag) {
836 				if ((arcn->sb.st_mtime <= sb.st_mtime) &&
837 				    (arcn->sb.st_ctime <= sb.st_ctime))
838 					continue;
839 			} else if (Yflag) {
840 				if (arcn->sb.st_ctime <= sb.st_ctime)
841 					continue;
842 			} else if (arcn->sb.st_mtime <= sb.st_mtime)
843 				continue;
844 		}
845 
846 		if (vflag) {
847 			(void)fputs(arcn->name, stderr);
848 			vfpart = 1;
849 		}
850 		++flcnt;
851 
852 		/*
853 		 * try to create a hard link to the src file if requested
854 		 * but make sure we are not trying to overwrite ourselves.
855 		 */
856 		if (lflag)
857 			res = cross_lnk(arcn);
858 		else
859 			res = chk_same(arcn);
860 		if (res <= 0) {
861 			if (vflag && vfpart) {
862 				(void)putc('\n', stderr);
863 				vfpart = 0;
864 			}
865 			continue;
866 		}
867 
868 		/*
869 		 * have to create a new file
870 		 */
871 		if ((arcn->type != PAX_REG) && (arcn->type != PAX_CTG)) {
872 			/*
873 			 * create a link or special file
874 			 */
875 			if ((arcn->type == PAX_HLK) || (arcn->type == PAX_HRG))
876 				res = lnk_creat(arcn);
877 			else
878 				res = node_creat(arcn);
879 			if (res < 0)
880 				purg_lnk(arcn);
881 			if (vflag && vfpart) {
882 				(void)putc('\n', stderr);
883 				vfpart = 0;
884 			}
885 			continue;
886 		}
887 
888 		/*
889 		 * have to copy a regular file to the destination directory.
890 		 * first open source file and then create the destination file
891 		 */
892 		if ((fdsrc = open(arcn->org_name, O_RDONLY, 0)) < 0) {
893 			syswarn(1, errno, "Unable to open %s to read",
894 			    arcn->org_name);
895 			purg_lnk(arcn);
896 			continue;
897 		}
898 		if ((fddest = file_creat(arcn)) < 0) {
899 			rdfile_close(arcn, &fdsrc);
900 			purg_lnk(arcn);
901 			continue;
902 		}
903 
904 		/*
905 		 * copy source file data to the destination file
906 		 */
907 		cp_file(arcn, fdsrc, fddest);
908 		file_close(arcn, fddest);
909 		rdfile_close(arcn, &fdsrc);
910 
911 		if (vflag && vfpart) {
912 			(void)putc('\n', stderr);
913 			vfpart = 0;
914 		}
915 	}
916 
917 	/*
918 	 * restore directory modes and times as required; make sure all
919 	 * patterns were selected block off signals to avoid chance for
920 	 * multiple entry into the cleanup code.
921 	 */
922 	(void)sigprocmask(SIG_BLOCK, &s_mask, (sigset_t *)NULL);
923 	ar_close();
924 	proc_dir();
925 	ftree_chk();
926 }
927 
928 /*
929  * next_head()
930  *	try to find a valid header in the archive. Uses format specific
931  *	routines to extract the header and id the trailer. Trailers may be
932  *	located within a valid header or in an invalid header (the location
933  *	is format specific. The inhead field from the option table tells us
934  *	where to look for the trailer).
935  *	We keep reading (and resyncing) until we get enough contiguous data
936  *	to check for a header. If we cannot find one, we shift by a byte
937  *	add a new byte from the archive to the end of the buffer and try again.
938  *	If we get a read error, we throw out what we have (as we must have
939  *	contiguous data) and start over again.
940  *	ASSUMED: headers fit within a BLKMULT header.
941  * Return:
942  *	0 if we got a header, -1 if we are unable to ever find another one
943  *	(we reached the end of input, or we reached the limit on retries. see
944  *	the specs for rd_wrbuf() for more details)
945  */
946 
947 #if __STDC__
948 static int
949 next_head(register ARCHD *arcn)
950 #else
951 static int
952 next_head(arcn)
953 	register ARCHD *arcn;
954 #endif
955 {
956 	register int ret;
957 	register char *hdend;
958 	register int res;
959 	register int shftsz;
960 	register int hsz;
961 	register int in_resync = 0; 	/* set when we are in resync mode */
962 	int cnt = 0;			/* counter for trailer function */
963 
964 	/*
965 	 * set up initial conditions, we want a whole frmt->hsz block as we
966 	 * have no data yet.
967 	 */
968 	res = hsz = frmt->hsz;
969 	hdend = hdbuf;
970 	shftsz = hsz - 1;
971 	for(;;) {
972 		/*
973 		 * keep looping until we get a contiguous FULL buffer
974 		 * (frmt->hsz is the proper size)
975 		 */
976 		for (;;) {
977 			if ((ret = rd_wrbuf(hdend, res)) == res)
978 				break;
979 
980 			/*
981 			 * some kind of archive read problem, try to resync the
982 			 * storage device, better give the user the bad news.
983 			 */
984 			if ((ret == 0) || (rd_sync() < 0)) {
985 				warn(1,"Premature end of file on archive read");
986 				return(-1);
987 			}
988 			if (!in_resync) {
989 				if (act == APPND) {
990 					warn(1,
991 				          "Archive I/O error, cannot continue");
992 					return(-1);
993 				}
994 				warn(1,"Archive I/O error. Trying to recover.");
995 				++in_resync;
996 			}
997 
998 			/*
999 			 * oh well, throw it all out and start over
1000 			 */
1001 			res = hsz;
1002 			hdend = hdbuf;
1003 		}
1004 
1005 		/*
1006 		 * ok we have a contiguous buffer of the right size. Call the
1007 		 * format read routine. If this was not a valid header and this
1008 		 * format stores trailers outside of the header, call the
1009 		 * format specific trailer routine to check for a trailer. We
1010 		 * have to watch out that we do not mis-identify file data or
1011 		 * block padding as a header or trailer. Format specific
1012 		 * trailer functions must NOT check for the trailer while we
1013 		 * are running in resync mode. Some trailer functions may tell
1014 		 * us that this block cannot contain a valid header either, so
1015 		 * we then throw out the entire block and start over.
1016 		 */
1017 		if ((*frmt->rd)(arcn, hdbuf) == 0)
1018 			break;
1019 
1020 		if (!frmt->inhead) {
1021 			/*
1022 			 * this format has trailers outside of valid headers
1023 			 */
1024 			if ((ret = (*frmt->trail)(hdbuf,in_resync,&cnt)) == 0){
1025 				/*
1026 				 * valid trailer found, drain input as required
1027 				 */
1028 				ar_drain();
1029 				return(-1);
1030 			}
1031 
1032 			if (ret == 1) {
1033 				/*
1034 				 * we are in resync and we were told to throw
1035 				 * the whole block out because none of the
1036 				 * bytes in this block can be used to form a
1037 				 * valid header
1038 				 */
1039 				res = hsz;
1040 				hdend = hdbuf;
1041 				continue;
1042 			}
1043 		}
1044 
1045 		/*
1046 		 * Brute force section.
1047 		 * not a valid header. We may be able to find a header yet. So
1048 		 * we shift over by one byte, and set up to read one byte at a
1049 		 * time from the archive and place it at the end of the buffer.
1050 		 * We will keep moving byte at a time until we find a header or
1051 		 * get a read error and have to start over.
1052 		 */
1053 		if (!in_resync) {
1054 			if (act == APPND) {
1055 				warn(1,"Unable to append, archive header flaw");
1056 				return(-1);
1057 			}
1058 			warn(1,"Invalid header, starting valid header search.");
1059 			++in_resync;
1060 		}
1061 		bcopy(hdbuf+1, hdbuf, shftsz);
1062 		res = 1;
1063 		hdend = hdbuf + shftsz;
1064 	}
1065 
1066 	/*
1067 	 * ok got a valid header, check for trailer if format encodes it in the
1068 	 * the header. NOTE: the parameters are different than trailer routines
1069 	 * which encode trailers outside of the header!
1070 	 */
1071 	if (frmt->inhead && ((*frmt->trail)(arcn) == 0)) {
1072 		/*
1073 		 * valid trailer found, drain input as required
1074 		 */
1075 		ar_drain();
1076 		return(-1);
1077 	}
1078 
1079 	++flcnt;
1080 	return(0);
1081 }
1082 
1083 /*
1084  * get_arc()
1085  *	Figure out what format an archive is. Handles archive with flaws by
1086  *	brute force searches for a legal header in any supported format. The
1087  *	format id routines have to be careful to NOT mis-identify a format.
1088  *	ASSUMED: headers fit within a BLKMULT header.
1089  * Return:
1090  *	0 if archive found -1 otherwise
1091  */
1092 
1093 #if __STDC__
1094 static int
1095 get_arc(void)
1096 #else
1097 static int
1098 get_arc()
1099 #endif
1100 {
1101 	register int i;
1102 	register int hdsz = 0;
1103 	register int res;
1104 	register int minhd = BLKMULT;
1105 	char *hdend;
1106 	int notice = 0;
1107 
1108 	/*
1109 	 * find the smallest header size in all archive formats and then set up
1110 	 * to read the archive.
1111 	 */
1112 	for (i = 0; ford[i] >= 0; ++i) {
1113 		if (fsub[ford[i]].hsz < minhd)
1114 			minhd = fsub[ford[i]].hsz;
1115 	}
1116 	if (rd_start() < 0)
1117 		return(-1);
1118 	res = BLKMULT;
1119 	hdsz = 0;
1120 	hdend = hdbuf;
1121 	for(;;) {
1122 		for (;;) {
1123 			/*
1124 			 * fill the buffer with at least the smallest header
1125 			 */
1126 			i = rd_wrbuf(hdend, res);
1127 			if (i > 0)
1128 				hdsz += i;
1129 			if (hdsz >= minhd)
1130 				break;
1131 
1132 			/*
1133 			 * if we cannot recover from a read error quit
1134 			 */
1135 			if ((i == 0) || (rd_sync() < 0))
1136 				goto out;
1137 
1138 			/*
1139 			 * when we get an error none of the data we already
1140 			 * have can be used to create a legal header (we just
1141 			 * got an error in the middle), so we throw it all out
1142 			 * and refill the buffer with fresh data.
1143 			 */
1144 			res = BLKMULT;
1145 			hdsz = 0;
1146 			hdend = hdbuf;
1147 			if (!notice) {
1148 				if (act == APPND)
1149 					return(-1);
1150 				warn(1,"Cannot identify format. Searching...");
1151 				++notice;
1152 			}
1153 		}
1154 
1155 		/*
1156 		 * we have at least the size of the smallest header in any
1157 		 * archive format. Look to see if we have a match. The array
1158 		 * ford[] is used to specify the header id order to reduce the
1159 		 * chance of incorrectly id'ing a valid header (some formats
1160 		 * may be subsets of each other and the order would then be
1161 		 * important).
1162 		 */
1163 		for (i = 0; ford[i] >= 0; ++i) {
1164 			if ((*fsub[ford[i]].id)(hdbuf, hdsz) < 0)
1165 				continue;
1166 			frmt = &(fsub[ford[i]]);
1167 			/*
1168 			 * yuck, to avoid slow special case code in the extract
1169 			 * routines, just push this header back as if it was
1170 			 * not seen. We have left extra space at start of the
1171 			 * buffer for this purpose. This is a bit ugly, but
1172 			 * adding all the special case code is far worse.
1173 			 */
1174 			pback(hdbuf, hdsz);
1175 			return(0);
1176 		}
1177 
1178 		/*
1179 		 * We have a flawed archive, no match. we start searching, but
1180 		 * we never allow additions to flawed archives
1181 		 */
1182 		if (!notice) {
1183 			if (act == APPND)
1184 				return(-1);
1185 			warn(1, "Cannot identify format. Searching...");
1186 			++notice;
1187 		}
1188 
1189 		/*
1190 		 * brute force search for a header that we can id.
1191 		 * we shift through byte at a time. this is slow, but we cannot
1192 		 * determine the nature of the flaw in the archive in a
1193 		 * portable manner
1194 		 */
1195 		if (--hdsz > 0) {
1196 			bcopy(hdbuf+1, hdbuf, hdsz);
1197 			res = BLKMULT - hdsz;
1198 			hdend = hdbuf + hdsz;
1199 		} else {
1200 			res = BLKMULT;
1201 			hdend = hdbuf;
1202 			hdsz = 0;
1203 		}
1204 	}
1205 
1206     out:
1207 	/*
1208 	 * we cannot find a header, bow, apologize and quit
1209 	 */
1210 	warn(1, "Sorry, unable to determine archive format.");
1211 	return(-1);
1212 }
1213