2 #============================================================= -*-perl-*-
4 # BackupPC_tarIncCreate: create a tar archive of an existing incremental dump
9 # Usage: BackupPC_tarIncCreate [options]
14 # -h host Host from which the tar archive is created.
15 # -n dumpNum Dump number from which the tar archive is created.
16 # A negative number means relative to the end (eg -1
17 # means the most recent dump, -2 2nd most recent etc).
18 # -s shareName Share name from which the tar archive is created.
21 # -t print summary totals
22 # -r pathRemove path prefix that will be replaced with pathAdd
23 # -p pathAdd new path prefix
24 # -b BLOCKS BLOCKS x 512 bytes per record (default 20; same as tar)
25 # -w writeBufSz write buffer size (default 1MB)
27 # The -h, -n and -s options specify which dump is used to generate
28 # the tar archive. The -r and -p options can be used to relocate
29 # the paths in the tar archive so extracted files can be placed
30 # in a location different from their original location.
33 # Craig Barratt <cbarratt@users.sourceforge.net>
34 # Ivan Klaric <iklaric@gmail.com>
35 # Dobrica Pavlinusic <dpavlin@rot13.org>
38 # Copyright (C) 2001-2003 Craig Barratt
40 # This program is free software; you can redistribute it and/or modify
41 # it under the terms of the GNU General Public License as published by
42 # the Free Software Foundation; either version 2 of the License, or
43 # (at your option) any later version.
45 # This program is distributed in the hope that it will be useful,
46 # but WITHOUT ANY WARRANTY; without even the implied warranty of
47 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
48 # GNU General Public License for more details.
50 # You should have received a copy of the GNU General Public License
51 # along with this program; if not, write to the Free Software
52 # Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
54 #========================================================================
56 # Version 2.1.0, released 20 Jun 2004.
58 # See http://backuppc.sourceforge.net.
60 #========================================================================
64 use lib "__INSTALLDIR__/lib";
69 use BackupPC::Attrib qw(:all);
70 use BackupPC::FileZIO;
72 use BackupPC::SearchLib;
73 use Time::HiRes qw/time/;
74 use POSIX qw/strftime/;
78 use Data::Dumper; ### FIXME
80 die("BackupPC::Lib->new failed\n") if ( !(my $bpc = BackupPC::Lib->new) );
81 my $TopDir = $bpc->TopDir();
82 my $BinDir = $bpc->BinDir();
83 my %Conf = $bpc->Conf();
84 %BackupPC::SearchLib::Conf = %Conf;
86 my $in_backup_increment;
89 if ( !getopts("th:n:p:r:s:b:w:vdf", \%opts) ) {
93 -h host host from which the tar archive is created
94 -n dumpNum dump number from which the tar archive is created
95 A negative number means relative to the end (eg -1
96 means the most recent dump, -2 2nd most recent etc).
97 -s shareName share name from which the tar archive is created
100 -t print summary totals
101 -r pathRemove path prefix that will be replaced with pathAdd
102 -p pathAdd new path prefix
103 -b BLOCKS BLOCKS x 512 bytes per record (default 20; same as tar)
104 -w writeBufSz write buffer size (default 1048576 = 1MB)
105 -f overwrite existing parts
112 if ( $opts{h} !~ /^([\w\.\s-]+)$/ ) {
113 die "$0: bad host name '$opts{h}'\n";
117 if ( $opts{n} !~ /^(-?\d+)$/ ) {
118 die "$0: bad dump number '$opts{n}'\n";
123 foreach my $c (qw/gzip md5sum tee/) {
124 $bin->{$c} = which($c) || die "$0 needs $c, install it\n";
127 my @Backups = $bpc->BackupInfoRead($Host);
133 my $current_tar_size = 0;
134 my $total_increment_size = 0;
137 $Num = $Backups[@Backups + $Num]{num} if ( -@Backups <= $Num && $Num < 0 );
138 for ( $i = 0 ; $i < @Backups ; $i++ ) {
139 last if ( $Backups[$i]{num} == $Num );
141 if ( $i >= @Backups ) {
142 die "$0: bad backup number $Num for host $Host\n";
# Optional path relocation: -r names the prefix to strip from archived paths
# and -p the prefix that replaces it.  Each variable stays undef when its
# option is absent or empty.  The capture is taken with a ternary instead of
# "my $x = $1 if (...)": a my() declaration combined with a statement
# modifier has undefined behaviour in Perl (see perlsyn).
my $PathRemove = ( defined($opts{r}) && $opts{r} =~ /(.+)/ ) ? $1 : undef;
my $PathAdd    = ( defined($opts{p}) && $opts{p} =~ /(.+)/ ) ? $1 : undef;
147 if ( $opts{s} !~ /^([\w\s\.\/\$-]+)$/ && $opts{s} ne "*" ) {
148 die "$0: bad share name '$opts{s}'\n";
150 our $ShareName = $opts{s};
151 our $view = BackupPC::View->new($bpc, $Host, \@Backups);
155 my $dsn = $Conf{SearchDSN};
156 my $db_user = $Conf{SearchUser} || '';
158 my $dbh = DBI->connect($dsn, $db_user, "", { RaiseError => 1, AutoCommit => 0} );
160 my $sth_inc_size = $dbh->prepare(qq{
166 my $sth_backup_parts = $dbh->prepare(qq{
167 insert into backup_parts (
174 ) values (?,?,?,?,?,?)
178 # This constant and the line of code below that uses it are borrowed
179 # from Archive::Tar. Thanks to Calle Dybedahl and Stephen Zander.
182 # Archive::Tar is Copyright 1997 Calle Dybedahl. All rights reserved.
183 # Copyright 1998 Stephen Zander. All rights reserved.
186 = 'a100 a8 a8 a8 a12 a12 A8 a1 a100 a6 a2 a32 a32 a8 a8 a155 x12';
187 my $tar_header_length = 512;
189 my $BufSize = $opts{w} || 1048576; # 1MB or 2^20
191 my $WriteBufSz = ($opts{b} || 20) * $tar_header_length;
193 my(%UidCache, %GidCache);
194 my(%HardLinkExtraFiles, @HardLinks);
197 # Write out all the requested files/directories
200 my $max_file_size = $Conf{'MaxArchiveFileSize'} || die "problem with MaxArchiveFileSize parametar";
202 my $tar_dir = $Conf{InstallDir}.'/'.$Conf{GzipTempDir};
203 die "problem with $tar_dir, check GzipTempDir in configuration\n" unless (-d $tar_dir && -w $tar_dir);
205 my $tar_file = BackupPC::SearchLib::getGzipName($Host, $ShareName, $Num) || die "can't getGzipName($Host, $ShareName, $Num)";
207 my $tar_path_final = $tar_dir . '/' . $tar_file;
208 my $tar_path = $tar_path_final . '.tmp';
210 $tar_path =~ s#//#/#g;
212 my $sth = $dbh->prepare(qq{
216 JOIN shares on shares.id = shareid
217 JOIN hosts on hosts.id = shares.hostid
218 WHERE hosts.name = ? and shares.name = ? and backups.num = ?
220 $sth->execute($Host, $ShareName, $Num);
221 my ($backup_id) = $sth->fetchrow_array;
225 # delete existing backup_parts
226 my $sth_delete_backup_parts = $dbh->prepare(qq{
227 delete from backup_parts
230 $sth_delete_backup_parts->execute($backup_id);
233 print STDERR "backup_id: $backup_id working dir: $tar_dir, max uncompressed size $max_file_size bytes, tar $tar_file\n" if ($opts{d});
# Refuse to clobber an already finished archive unless -f (overwrite
# existing parts) was given on the command line.
if (-e $tar_path_final) {
	if ($opts{f}) {
		# Parenthesised call checked with "or": written as
		# "rmtree $path || die ..." the "||" binds to the (always true)
		# path string, so a failed removal would never be reported.
		rmtree($tar_path_final) or die "can't remove $tar_path_final: $!";
	} else {
		die "$tar_path_final allready exists\n";
	}
}
246 my $items_in_part = 0;
252 return if ($current_tar_size == 0);
254 print STDERR "\n\t+ $part:";
257 # Finish with two null 512 byte headers,
258 # and then round out a full block.
260 my $data = "\0" x ($tar_header_length * 2);
261 TarWrite($fh, \$data);
262 TarWrite($fh, undef);
264 close($fh) || die "can't close archive part $part: $!";
266 my $file = $tar_path . '/' . $part;
268 my $md5 = read_file( $file . '.md5' ) || die "can't read md5sum file ${file}.md5";
271 my $size = (stat( $file . '.tar.gz' ))[7] || die "can't stat ${file}.tar.gz";
273 print "$file, $size bytes, $items_in_part items";
275 $sth_backup_parts->execute(
284 $total_increment_size += $size;
# Trace the rename when debugging (-d) is on, then perform it.
# rename() is called with parentheses and checked with "or": in the form
# "rename $from, $to || die ..." the "||" attaches to $to, which is always
# true, so a failed rename would be silently ignored.
print STDERR "# rename $from -> $to\n" if ($opts{d});
rename($from, $to) or die "can't move $from -> $to: $!\n";
295 print STDERR " single" if ($opts{v});
296 move("${tar_path}/1.tar.gz", "${tar_path_final}.tar.gz");
297 move("${tar_path}/1.md5", "${tar_path_final}.md5");
298 rmtree $tar_path or die "can't remove temporary dir $tar_path: $!";
300 print STDERR " [last]" if ($opts{v});
301 move("${tar_path}", "${tar_path_final}");
303 # if this archive was single part, remove it
304 foreach my $suffix (qw/.tar.gz .md5/) {
305 my $path = $tar_path_final . $suffix;
306 unlink $path if (-e $path);
310 $sth_inc_size->execute(
311 $total_increment_size,
315 print "\n\ttotal $total_increment_size bytes";
324 # if this is first part, create directory
328 print STDERR "# deleting existing $tar_path\n" if ($opts{d});
331 mkdir($tar_path) || die "can't create directory $tar_path: $!";
334 print STDERR "ABORTED: cleanup temp dir ";
340 $SIG{'INT'} = \&abort_cleanup;
341 $SIG{'QUIT'} = \&abort_cleanup;
342 $SIG{'__DIE__'} = \&abort_cleanup;
346 my $file = $tar_path . '/' . $part;
349 # create complex pipe which will pass output through gzip
350 # for compression, create file on disk using tee
351 # and pipe same output to md5sum to create checksum
354 my $cmd = '| ' . $bin->{'gzip'} . ' ' . $Conf{GzipLevel} . ' ' .
355 '| ' . $bin->{'tee'} . ' ' . $file . '.tar.gz' . ' ' .
356 '| ' . $bin->{'md5sum'} . ' - > ' . $file . '.md5';
358 print STDERR "## $cmd\n" if ($opts{d});
360 open($fh, $cmd) or die "can't open $cmd: $!";
363 $current_tar_size = 0;
369 if (seedCache($Host, $ShareName, $Num)) {
370 archiveWrite($fh, '/');
371 archiveWriteHardLinks($fh);
372 new_tar_part( close => 1 );
374 print STDERR "NOTE: no files found for $Host:$ShareName, increment $Num\n" if ($opts{v});
375 # remove temporary files if there are no files
378 my $sth = $dbh->prepare(qq{
379 update backups set inc_size = 0, inc_deleted = true
382 $sth->execute($backup_id);
387 # print out totals if requested
390 print STDERR "Done: $FileCnt files, $ByteCnt bytes, $DirCnt dirs,",
391 " $SpecialCnt specials, $ErrorCnt errors\n";
393 if ( $ErrorCnt && !$FileCnt && !$DirCnt ) {
395 # Got errors, with no files or directories; exit with non-zero
398 die "got errors or no files\n";
401 $sth_inc_size->finish;
402 $sth_backup_parts->finish;
404 $dbh->commit || die "can't commit changes to database";
409 ###########################################################################
411 ###########################################################################
415 my($fh, $dir, $tarPathOverride) = @_;
417 if ( $dir =~ m{(^|/)\.\.(/|$)} ) {
418 print(STDERR "$0: bad directory '$dir'\n");
422 $dir = "/" if ( $dir eq "." );
423 #print(STDERR "calling find with $Num, $ShareName, $dir\n");
425 if ( $view->find($Num, $ShareName, $dir, 0, \&TarWriteFile,
426 $fh, $tarPathOverride) < 0 ) {
427 print(STDERR "$0: bad share or directory '$ShareName/$dir'\n");
434 # Write out any hardlinks (if any)
# Emits one header per entry queued in @HardLinks and then clears the
# hardlink bookkeeping hash.
# NOTE(review): the line that assigns $fh is not visible in this excerpt;
# callers pass the archive handle as the only argument -- confirm how it is
# unpacked from @_.
436 sub archiveWriteHardLinks
439 foreach my $hdr ( @HardLinks ) {
# Apply the -r/-p relocation to the link target.  The stored linkname is
# compared against "." followed by $PathRemove, hence the +1 on the length.
441 if ( defined($PathRemove)
442 && substr($hdr->{linkname}, 0, length($PathRemove)+1)
443 eq ".$PathRemove" ) {
444 substr($hdr->{linkname}, 0, length($PathRemove)+1) = ".$PathAdd";
446 TarWriteFileInfo($fh, $hdr);
# Forget which link targets were written so far.
449 %HardLinkExtraFiles = ();
#
# Translate a numeric uid into a user name.  Answers (including "no such
# user", stored as undef) are remembered in %UidCache so getpwuid() is
# consulted at most once per uid.
#
sub UidLookup
{
    my($uid) = @_;

    unless ( exists($UidCache{$uid}) ) {
        my @pwent = getpwuid($uid);
        $UidCache{$uid} = $pwent[0];
    }
    return $UidCache{$uid};
}
#
# Translate a numeric gid into a group name.  Answers (including "no such
# group", stored as undef) are remembered in %GidCache so getgrgid() is
# consulted at most once per gid.
#
sub GidLookup
{
    my($gid) = @_;

    unless ( exists($GidCache{$gid}) ) {
        my @grent = getgrgid($gid);
        $GidCache{$gid} = $grent[0];
    }
    return $GidCache{$gid};
}
# Buffered writer for the archive stream.
# NOTE(review): the sub header is not visible in this excerpt; presumably
# this is TarWrite, judging by the TarWrite($fh, \$data) call sites -- confirm.
#   $fh      - output handle the archive bytes are written to
#   $dataRef - reference to the bytes to append, or undef to request a flush
# Dies if a write to $fh fails.
470 my($fh, $dataRef) = @_;
473 if ( !defined($dataRef) ) {
475 # do flush by padding to a full $WriteBufSz
477 my $data = "\0" x ($WriteBufSz - length($WriteBuf));
# Running count of bytes handed to the writer; it is compared against
# $max_file_size elsewhere in the file to decide when to split the archive.
481 # poor man's tell :-)
482 $current_tar_size += length($$dataRef);
484 if ( length($WriteBuf) + length($$dataRef) < $WriteBufSz ) {
486 # just buffer and return
488 $WriteBuf .= $$dataRef;
# $done = how many bytes of $$dataRef are needed to top the pending buffer
# up to exactly $WriteBufSz; buffer plus that slice go out in one syswrite.
491 my $done = $WriteBufSz - length($WriteBuf);
492 if ( syswrite($fh, $WriteBuf . substr($$dataRef, 0, $done))
494 die "Unable to write to output file ($!)\n";
# Emit further $WriteBufSz-sized slices straight from $$dataRef for as long
# as a complete slice remains.
496 while ( $done + $WriteBufSz <= length($$dataRef) ) {
497 if ( syswrite($fh, substr($$dataRef, $done, $WriteBufSz))
499 die "Unable to write to output file ($!)\n";
501 $done += $WriteBufSz;
# Whatever did not fill a whole slice becomes the new pending buffer.
503 $WriteBuf = substr($$dataRef, $done);
#
# Pad the archive with NUL bytes so that a payload of $size bytes ends on a
# $tar_header_length boundary.  Nothing is written when $size is already a
# multiple of the block length.
#
sub TarWritePad
{
    my($fh, $size) = @_;

    my $remainder = $size % $tar_header_length;
    if ( $remainder ) {
        my $padding = "\0" x ($tar_header_length - $remainder);
        TarWrite($fh, \$padding);
    }
}
# Build one tar header record from $hdr with pack($tar_pack_header, ...)
# and hand it to TarWrite.
# NOTE(review): the sub header and several pack arguments are not visible in
# this excerpt; presumably this is TarWriteHeader, per the
# TarWriteHeader($fh, $hdr) call sites -- confirm.
#
# Fill in symbolic owner/group names from the numeric ids when the caller
# did not supply them.
520 $hdr->{uname} = UidLookup($hdr->{uid}) if ( !defined($hdr->{uname}) );
521 $hdr->{gname} = GidLookup($hdr->{gid}) if ( !defined($hdr->{gname}) );
# Device numbers are rendered as 7-digit octal text when present.
522 my $devmajor = defined($hdr->{devmajor}) ? sprintf("%07o", $hdr->{devmajor})
524 my $devminor = defined($hdr->{devminor}) ? sprintf("%07o", $hdr->{devminor})
# The size field is encoded one of three ways depending on magnitude:
# >= 2^33 bytes, >= 2^32 bytes, and everything smaller.
527 if ( $hdr->{size} >= 2 * 65536 * 65536 ) {
529 # GNU extension for files >= 8GB: send size in big-endian binary
# NOTE(review): 0x80 is outside the signed range of pack's "c" format;
# "C" (unsigned char) may be what is intended -- confirm.
531 $sizeStr = pack("c4 N N", 0x80, 0, 0, 0,
532 $hdr->{size} / (65536 * 65536),
533 $hdr->{size} % (65536 * 65536));
534 } elsif ( $hdr->{size} >= 1 * 65536 * 65536 ) {
536 # sprintf octal only handles up to 2^32 - 1
# So the value is split at bit 24: 3 octal digits for the high part and
# 8 octal digits for the low 24 bits, concatenated into 11 digits.
538 $sizeStr = sprintf("%03o", $hdr->{size} / (1 << 24))
539 . sprintf("%08o", $hdr->{size} % (1 << 24));
541 $sizeStr = sprintf("%011o", $hdr->{size});
# name and linkname are cut to at most 99 characters here.
543 my $data = pack($tar_pack_header,
544 substr($hdr->{name}, 0, 99),
545 sprintf("%07o", $hdr->{mode}),
546 sprintf("%07o", $hdr->{uid}),
547 sprintf("%07o", $hdr->{gid}),
549 sprintf("%011o", $hdr->{mtime}),
550 "", #checksum field - space padded by pack("A8")
552 substr($hdr->{linkname}, 0, 99),
553 $hdr->{magic} || 'ustar ',
554 $hdr->{version} || ' ',
# Checksum: 16-bit sum of every byte of the packed header (computed while
# the checksum field still holds its space padding), stored as six octal
# digits plus a NUL at offset 148.
561 substr($data, 148, 7) = sprintf("%06o\0", unpack("%16C*",$data));
562 TarWrite($fh, \$data);
# Write the header for one archive entry.  When the link target or the
# entry name is longer than 99 characters, an extra "././@LongLink" record
# carrying the full string is written first, followed by the normal header.
# NOTE(review): the sub header and the lines that initialise %h (other than
# name and size) are not visible in this excerpt; presumably this is
# TarWriteFileInfo, per the TarWriteFileInfo($fh, $hdr) call sites -- confirm.
570 # Handle long link names (symbolic links)
572 if ( length($hdr->{linkname}) > 99 ) {
# Payload is the complete link target plus a terminating NUL, padded out
# to a block boundary by TarWritePad.
574 my $data = $hdr->{linkname} . "\0";
575 $h{name} = "././\@LongLink";
577 $h{size} = length($data);
578 TarWriteHeader($fh, \%h);
579 TarWrite($fh, \$data);
580 TarWritePad($fh, length($data));
583 # Handle long file names
585 if ( length($hdr->{name}) > 99 ) {
# Same scheme as above, this time carrying the complete entry name.
587 my $data = $hdr->{name} . "\0";
588 $h{name} = "././\@LongLink";
590 $h{size} = length($data);
591 TarWriteHeader($fh, \%h);
592 TarWrite($fh, \$data);
593 TarWritePad($fh, length($data));
# Finally the regular header for the entry itself.
595 TarWriteHeader($fh, $hdr);
599 # seed cache of files in this increment
602 my ($host, $share, $dumpNo) = @_;
604 print STDERR curr_time(), "$host:$share #$dumpNo" if ($opts{v});
608 JOIN shares on shares.id = shareid
609 JOIN hosts on hosts.id = shares.hostid
610 WHERE hosts.name = ? and shares.name = ? and backupnum = ?
613 my $sth = $dbh->prepare($sql);
614 $sth->execute($host, $share, $dumpNo);
615 my $count = $sth->rows;
616 print STDERR " $count items, parts:" if ($opts{v});
617 while (my $row = $sth->fetchrow_arrayref) {
618 #print STDERR "+ ", $row->[0],"\n";
619 $in_backup_increment->{ $row->[0] } = $row->[1];
#
# Estimate the tar overhead, in bytes, for storing one file named $name.
# The result is what callers add to the payload size when checking an
# entry against $max_file_size.
#
sub tar_overhead($) {
	my $name = shift || '';

	# fixed cost of four blocks: header, padding of file and
	# two null blocks at end
	my $overhead = 4 * $tar_header_length;

	# a name longer than 99 chars does not fit in the header, so add
	# the whole blocks needed for the long-name record
	my $name_len = length($name);
	if ( $name_len > 99 ) {
		my $blocks = int( ( $name_len + $tar_header_length ) / $tar_header_length );
		$overhead += $blocks * $tar_header_length;
	}

	return $overhead;
}
650 my($hdr, $fh, $tarPathOverride) = @_;
652 my $tarPath = $hdr->{relPath};
653 $tarPath = $tarPathOverride if ( defined($tarPathOverride) );
655 $tarPath =~ s{//+}{/}g;
657 #print STDERR "? $tarPath\n" if ($opts{d});
658 my $size = $in_backup_increment->{$tarPath};
659 return unless (defined($size));
661 # is this file too large to fit into MaxArchiveFileSize?
663 if ( ($current_tar_size + tar_overhead($tarPath) + $size) > $max_file_size ) {
664 print STDERR "# tar file $current_tar_size + $tar_header_length + $size > $max_file_size, splitting\n" if ($opts{d});
668 #print STDERR "A $tarPath [$size] tell: $current_tar_size\n" if ($opts{d});
671 if ( defined($PathRemove)
672 && substr($tarPath, 0, length($PathRemove)) eq $PathRemove ) {
673 substr($tarPath, 0, length($PathRemove)) = $PathAdd;
675 $tarPath = "./" . $tarPath if ( $tarPath !~ /^\.\// );
676 $tarPath =~ s{//+}{/}g;
677 $hdr->{name} = $tarPath;
679 if ( $hdr->{type} == BPC_FTYPE_DIR ) {
681 # Directory: just write the header
683 $hdr->{name} .= "/" if ( $hdr->{name} !~ m{/$} );
684 TarWriteFileInfo($fh, $hdr);
686 } elsif ( $hdr->{type} == BPC_FTYPE_FILE ) {
688 # Regular file: write the header and file
690 my $f = BackupPC::FileZIO->open($hdr->{fullPath}, 0, $hdr->{compress});
691 if ( !defined($f) ) {
692 print(STDERR "Unable to open file $hdr->{fullPath}\n");
696 # do we need to split file?
697 if ($hdr->{size} < $max_file_size) {
698 TarWriteFileInfo($fh, $hdr);
700 while ( $f->read(\$data, $BufSize) > 0 ) {
701 TarWrite($fh, \$data);
702 $size += length($data);
705 TarWritePad($fh, $size);
709 my $full_size = $hdr->{size};
710 my $orig_name = $hdr->{name};
711 my $max_part_size = $max_file_size - tar_overhead($hdr->{name});
713 my $parts = int(($full_size + $max_part_size - 1) / $max_part_size);
714 print STDERR "# splitting $orig_name [$full_size bytes] into $parts parts\n" if ($opts{d});
715 foreach my $subpart ( 1 .. $parts ) {
# Every part except the last carries exactly $max_part_size bytes; the last
# one carries whatever is left.  The remainder is computed by subtraction
# rather than with "%": when $full_size is an exact multiple of
# $max_part_size the modulo is 0, which would produce an empty final part
# and drop the last $max_part_size bytes of the file.
if ($subpart < $parts) {
	$hdr->{size} = $max_part_size;
} else {
	$hdr->{size} = $full_size - $max_part_size * ($parts - 1);
}
722 $hdr->{name} = $orig_name . '/' . $subpart;
723 print STDERR "## creating part $subpart ",$hdr->{name}, " [", $hdr->{size}," bytes]\n";
725 TarWriteFileInfo($fh, $hdr);
728 for ( 1 .. int($hdr->{size} / $BufSize) ) {
729 my $r_size = $f->read(\$data, $BufSize);
730 die "expected $BufSize bytes read, got $r_size bytes!" if ($r_size != $BufSize);
731 TarWrite($fh, \$data);
732 $size += length($data);
735 my $size_left = $hdr->{size} % $BufSize;
736 my $r_size = $f->read(\$data, $size_left);
737 die "expected $size_left bytes last read, got $r_size bytes!" if ($r_size != $size_left);
739 TarWrite($fh, \$data);
740 $size += length($data);
741 TarWritePad($fh, $size);
747 $ByteCnt += $full_size;
750 } elsif ( $hdr->{type} == BPC_FTYPE_HARDLINK ) {
752 # Hardlink file: either write a hardlink or the complete file
753 # depending upon whether the linked-to file will be written
756 # Start by reading the contents of the link.
758 my $f = BackupPC::FileZIO->open($hdr->{fullPath}, 0, $hdr->{compress});
759 if ( !defined($f) ) {
760 print(STDERR "Unable to open file $hdr->{fullPath}\n");
765 while ( $f->read(\$data, $BufSize) > 0 ) {
766 $hdr->{linkname} .= $data;
770 my $name = $hdr->{linkname};
772 if ( $HardLinkExtraFiles{$name} ) {
774 # Target file will be or was written, so just remember
775 # the hardlink so we can dump it later.
777 push(@HardLinks, $hdr);
781 # Have to dump the original file. Just call the top-level
782 # routine, so that we save the hassle of dealing with
783 # mangling, merging and attributes.
785 $HardLinkExtraFiles{$hdr->{linkname}} = 1;
786 archiveWrite($fh, $hdr->{linkname}, $hdr->{name});
788 } elsif ( $hdr->{type} == BPC_FTYPE_SYMLINK ) {
790 # Symbolic link: read the symbolic link contents into the header
791 # and write the header.
793 my $f = BackupPC::FileZIO->open($hdr->{fullPath}, 0, $hdr->{compress});
794 if ( !defined($f) ) {
795 print(STDERR "Unable to open symlink file $hdr->{fullPath}\n");
800 while ( $f->read(\$data, $BufSize) > 0 ) {
801 $hdr->{linkname} .= $data;
805 TarWriteFileInfo($fh, $hdr);
807 } elsif ( $hdr->{type} == BPC_FTYPE_CHARDEV
808 || $hdr->{type} == BPC_FTYPE_BLOCKDEV
809 || $hdr->{type} == BPC_FTYPE_FIFO ) {
811 # Special files: for char and block special we read the
812 # major and minor numbers from a plain file.
814 if ( $hdr->{type} != BPC_FTYPE_FIFO ) {
815 my $f = BackupPC::FileZIO->open($hdr->{fullPath}, 0,
818 if ( !defined($f) || $f->read(\$data, $BufSize) < 0 ) {
819 print(STDERR "Unable to open/read char/block special file"
820 . " $hdr->{fullPath}\n");
821 $f->close if ( defined($f) );
826 if ( $data =~ /(\d+),(\d+)/ ) {
827 $hdr->{devmajor} = $1;
828 $hdr->{devminor} = $2;
832 TarWriteFileInfo($fh, $hdr);
835 print(STDERR "Got unknown type $hdr->{type} for $hdr->{name}\n");
840 my $t_fmt = '%Y-%m-%d %H:%M:%S';
842 return strftime($t_fmt,localtime());