--- foxridge-archiver/archiver.pl 2005/03/23 12:12:08 1.4 +++ foxridge-archiver/archiver.pl 2005/10/05 13:35:12 1.7 @@ -16,25 +16,44 @@ $|=1; # # program version -my $version = "0.6 (ROC 23.3.2005)"; +my $version = "0.7.2 (ROC 5.10.2005)"; # short help -my $shorthelp = "MPIWG archiver $version\nuse:\n archiver [options] docpath\noptions:\n -premigrate don't delete archived files\n"; +my $help = "MPIWG archiver $version +use: archiver [options] docpath +options: + -debug show debugging info + -premigrate don't delete archived files + -force archive even if already archived + -replace rewrite index file +"; # read command line parameters my $args = MPIWGStor::parseargs; +if (! scalar(%$args)) { + print $help, "\n"; + exit 1; +} # debug level -my $debug = (exists $$args{'debug'}) ? $$args{'debug'} : 0; +$debug = (exists $$args{'debug'}) ? $$args{'debug'} : 0; + +# force archiving +my $force_archive = (exists $$args{'force'}) ? $$args{'force'} : 0; + +# rewrite index file +my $rewrite_index = (exists $$args{'replace'}) ? $$args{'replace'} : 0; # rewrite XML file (necessary for archive date!) my $fix_xml = 1; my $xml_changed = 0; + # XML namespace (not really implemented!) my $namespace = ""; # archive name (archive-path element, usually == $docdir) my $archname; + # archive storage date (now) my $archdate = stime(time); @@ -44,54 +63,52 @@ my $delete_junk_files = 1; # delete data files after archiving my $delete_data_files = 1; +# don't delete archived files with "-premigrate" +if (exists $$args{'premigrate'}) { + $delete_data_files = not $$args{'premigrate'}; +} +if ($delete_data_files) { + logger('INFO', "going to remove successfully archived files from disk"); +} + ####################################################### # external programs # my $archprog = "/opt/tivoli/tsm/client/ba/bin/dsmc"; if (! 
-x $archprog) { - logger('ABORT', "TSM client program '$archprog' missing!!\n"); + logger('ABORT', "TSM client program '$archprog' missing!"); exit 1; } my $checkprog = "/usr/local/mpiwg/archive/metacheck"; if (! -x $checkprog) { - logger('ABORT', "meta data checking program '$checkprog' missing!!\n"); + logger('ABORT', "meta data checking program '$checkprog' missing!"); exit 1; } # log file for archiver my $log_file = "/var/log/mpiwg-archiver.log"; if (! open LOG, ">>$log_file") { - logger('ABORT', "unable to write log file '$log_file'!!\n"); + logger('ABORT', "unable to write log file '$log_file'!"); exit 1; } ####################################################### # check parameters that were passed to the program # -if ($#ARGV < 0) { - print $shorthelp; - exit 1; -} + my $docdir = $$args{'path'}; # strip double slashes $docdir =~ s/\/\//\//; # strip trailing slashes $docdir =~ s/\/+$//; if (! -d $docdir) { - logger('ABORT', "document directory \'$docdir\' doesn't exist!\n"); + logger('ABORT', "document directory \'$docdir\' doesn't exist!"); exit 1; } -# don't delete archived files with "-premigrate" -if (exists $$args{'premigrate'}) { - $delete_data_files = not $$args{'premigrate'}; -} -if ($delete_data_files) { - logger('INFO', "going to remove successfully archived files from disk"); -} my $metafile = "$docdir/index.meta"; if (! -f $metafile) { - logger('ABORT', "metadata index file \'$metafile\' doesn't exist!\n"); + logger('ABORT', "metadata index file \'$metafile\' doesn't exist!"); exit 1; } @@ -122,7 +139,7 @@ sub read_resource_meta { # get archive-path $archname = MPIWGStor::sstrip($rootnode->findvalue('child::archive-path')); if (! 
$archname) { - logger('ABORT', "archive-name element missing!!\n"); + logger('ABORT', "archive-name element missing!"); exit 1; } @@ -133,7 +150,7 @@ sub read_resource_meta { foreach my $fn (@filenodes) { my $name = MPIWGStor::sstrip($fn->findvalue('child::name')); my $path = MPIWGStor::sstrip($fn->findvalue('child::path')); - logger('DEBUG', "FILE ($path)$name\n"); + logger('DEBUG', "FILE ($path)$name"); my $f = ($path) ? "$path/$name" : "$name"; $files{$f} = $name; } @@ -143,7 +160,7 @@ sub read_resource_meta { # my $stordatenode = ($rootnode->find('child::archive-storage-date'))->get_node(1); if ($stordatenode) { - logger('WARNING', "archive storage date exists! Resource already archived?\n"); + logger('WARNING', "archive storage date exists! Resource already archived?"); $warncnt++; # delete old date $stordatenode->removeChildNodes; @@ -186,7 +203,7 @@ sub run_archive { } } } else { - logger('ABORT', "unable to start archive command '$archcmd'!!\n"); + logger('ABORT', "unable to start archive command '$archcmd'!!"); exit 1; } @@ -209,10 +226,10 @@ sub check_files { my $fp = "$docdir/$ft"; #print " fp: $fp\n"; if ($$archived{$fp}) { - logger('DEBUG', "$ft archived OK\n"); + logger('DEBUG', "$ft archived OK"); $$archived{$fp} = "OK"; } else { - logger('ERROR', "file '$ft' missing from archive!\n"); + logger('ERROR', "file '$ft' missing from archive!"); $errcnt++; } } @@ -221,19 +238,19 @@ sub check_files { if ($$archived{$fa} ne "OK") { my ($fn, $fp) = MPIWGStor::split_file_path($fa); if ($MPIWGStor::index_files{$fn}) { - logger('DEBUG', "$fa ignored\n"); + logger('DEBUG', "$fa ignored"); $na--; } else { - logger('WARNING', "$fa archived but not in list!\n"); + logger('WARNING', "$fa archived but not in list!"); $warncnt++; } } } if ($nt > $na) { - logger('WARNING', "less files were archived ($na vs. $nt)!\n"); + logger('WARNING', "less files were archived ($na vs. $nt)!"); } elsif ($na > $nt) { - logger('WARNING', "more files were archived ($na vs. 
$nt)!\n"); + logger('WARNING', "more files were archived ($na vs. $nt)!"); } } @@ -261,9 +278,9 @@ sub delete_files { next unless (-f $f); # delete files if (unlink $f) { - logger('INFO', "remove $f ($fn)\n"); + logger('DEBUG', "remove $f ($fn)"); } else { - logger('ERROR', "unable to delete $f!\n"); + logger('ERROR', "unable to delete $f!"); $errcnt++; } } @@ -275,7 +292,7 @@ sub delete_files { # dont't remove document dir (shouldn't be empty anyway) next if ($d eq $docdir); if (-d $d) { - logger('INFO', "remove dir $d\n"); + logger('DEBUG', "remove dir $d"); rmdir $d; } } @@ -292,7 +309,7 @@ sub delete_all_files { my ($files, $dir) = @_; if (! opendir DIR, $dir) { - logger('ERROR', "unable to read directory $dir!\n"); + logger('ERROR', "unable to read directory $dir!"); $errcnt++; return; } @@ -306,28 +323,28 @@ sub delete_all_files { if (-f "$dir/$f") { # $f is a file if (unlink "$dir/$f") { - logger('INFO', "removed $f\n"); + logger('DEBUG', "removed $f"); } else { - logger('ERROR', "unable to delete $f!\n"); + logger('ERROR', "unable to delete $f!"); $errcnt++; } } elsif (-d _) { # $f is a directory (unlink won't work) if ((system 'rm', '-r', "$dir/$f") == 0) { - logger('INFO', "removed directory $f\n"); + logger('DEBUG', "removed directory $f"); } else { - logger('ERROR', "unable to delete directory $f!\n"); + logger('ERROR', "unable to delete directory $f!"); $errcnt++; } } else { - logger('ERROR', "funny object $dir/$f!\n"); + logger('ERROR', "funny object $dir/$f!"); $errcnt++; } } else { # $f is not in the list if (-d "$dir/$f") { # recurse into directories - logger('DEBUG', "enter $dir/$f\n"); + logger('DEBUG', "enter $dir/$f"); delete_all_files($files, "$dir/$f"); } } @@ -339,22 +356,58 @@ sub delete_all_files { # main # -logger('START', "archiver $version at $archdate\n"); +logger('START', "archiver $version at $archdate"); # make shure the right user is running this program my $user = getlogin; -#if (($user ne "archive")||($user ne "root")) { -# 
logger("ABORT", "you ($user) must be archive or root user to run this program!"); -# exit 1; -#} +if (($user ne "archive")&&($user ne "root")) { + logger("WARNING", "you ($user) should be archive or root user to run this program!"); +} + +# check for .archived file +if (-f "$docdir/.archived") { + if (not $force_archive) { + logger('ABORT', "already archived! (.archived file exists)"); + exit 1; + } else { + logger('WARNING', "resource already archived? (.archived file exists)"); + $warncnt++; + } +} # use metacheck first -if (system("$checkprog $docdir >/dev/null") == 0) { - logger('INFO', "resource '$docdir' check OK\n"); +my $check_opts="-add-files"; +if ($rewrite_index) { + $check_opts = "-replace"; +} +if (open CHECK, "$checkprog $check_opts $docdir |") { + my @errors; + my $msg; + while (<CHECK>) { + chomp; + if (/^ERROR/) { + push @errors, $_; + } + $msg = $_; + } + if ($msg =~ /^DONE/) { + logger('DEBUG', "checking index file: $msg"); + logger('INFO', "resource '$docdir' check OK"); + } else { + logger('DEBUG', "errors checking index file:\n " . join("\n ", @errors) . "\n $msg"); + logger('ABORT', "resource '$docdir' check failed!"); + exit 1; + } } else { - logger('ABORT', "resource '$docdir' check failed!!\n"); + logger('ABORT', "unable to run $checkprog"); exit 1; } +# if (system("$checkprog $docdir >/dev/null") == 0) { +# logger('INFO', "resource '$docdir' check OK"); +# } else { +# logger('ABORT', "resource '$docdir' check failed!!"); +# exit 1; +# } # read index.meta file my ($document, $rootnode) = MPIWGStor::read_xml($metafile); @@ -362,15 +415,15 @@ my ($document, $rootnode) = MPIWGStor::r # check file and add archive date my $files_to_archive = read_resource_meta($rootnode); -print "INFO: ", scalar keys %$files_to_archive, " files to archive\n"; +logger('INFO', (scalar keys %$files_to_archive) . 
" files to archive"); -# check for .archived file +# remove .archived file if (-f "$docdir/.archived") { if (unlink "$docdir/.archived") { - logger('WARNING', "existing .archived file has been removed! Resource already archived?\n"); + logger('WARNING', "existing .archived file has been removed!"); $warncnt++; } else { - logger('ERROR', "unable to remove existing .archived file!\n"); + logger('ERROR', "unable to remove existing .archived file!"); $errcnt++; } } @@ -382,7 +435,7 @@ if ($delete_junk_files) { # write new index.meta if ($errcnt > 0) { - logger('ABORT', "there were errors!\n"); + logger('ABORT', "there were errors!"); exit 1; } else { if ($fix_xml) { @@ -394,7 +447,7 @@ if ($errcnt > 0) { my $archived_files = run_archive(); my $num_archfiles = scalar keys %$archived_files; -logger('INFO', "$num_archfiles files archived\n"); +logger('INFO', "$num_archfiles files archived"); # check list of archived files check_files($files_to_archive, $archived_files); @@ -412,8 +465,8 @@ if ($errcnt == 0) { } } -logger('INFO', "$warncnt warnings\n"); -logger('INFO', "$errcnt errors\n"); +logger('INFO', "$warncnt warnings"); +logger('INFO', "$errcnt errors"); if ($errcnt > 0) { logger('ABORT', "there were errors! ($num_archfiles files archived) at " . stime(time)); exit 1;