version 1.4, 2004/07/13 18:32:49
|
version 1.6, 2017/03/16 17:00:43
|
Line 1
|
Line 1
|
#!/usr/local/bin/perl -w |
#!/usr/bin/perl -w |
|
|
use strict; |
use strict; |
use XML::SAX; |
use XML::SAX; |
Line 17 $|=1;
|
Line 17 $|=1;
|
# |
# |
|
|
# program version |
# program version |
my $version = "0.2.1 (13.07.2004)"; |
my $version = "0.3 (27.9.2004)"; |
|
|
# read command line parameters |
# read command line parameters |
my $args = MPIWGStor::parseargs; |
my $args = MPIWGStor::parseargs; |
Line 229 sub readURLIndex {
|
Line 229 sub readURLIndex {
|
my ($tag, $val, $attr) = @$me; |
my ($tag, $val, $attr) = @$me; |
my $meta = ""; |
my $meta = ""; |
my $file = ""; |
my $file = ""; |
|
my $mtime = ""; |
if ($tag =~ /index\/resource$/) { |
if ($tag =~ /index\/resource$/) { |
if ($attr =~ /metaLink=\"([^\"]+)\"/) { |
if ($attr =~ /metaLink=\"([^\"]+)\"/) { |
$meta = $1; |
$meta = $1; |
Line 236 sub readURLIndex {
|
Line 237 sub readURLIndex {
|
if ($attr =~ /resourceLink=\"([^\"]+)\"/) { |
if ($attr =~ /resourceLink=\"([^\"]+)\"/) { |
$file = $1; |
$file = $1; |
} |
} |
|
if ($attr =~ /modificationDate=\"([^\"]+)\"/) { |
|
$mtime = $1; |
|
} |
if ($meta =~ /^http:/) { |
if ($meta =~ /^http:/) { |
harvestURL($meta, $file); |
harvestURL($meta, $file, $mtime); |
} |
} |
} |
} |
} |
} |
Line 251 sub readURLIndex {
|
Line 255 sub readURLIndex {
|
# in the database (under $filepath) |
# in the database (under $filepath) |
# |
# |
sub harvestURL { |
sub harvestURL { |
my ($metaurl, $fileurl) = @_; |
my ($metaurl, $fileurl, $filetime) = @_; |
logger('DEBUG', "fetching from url '$metaurl' for '$fileurl'"); |
logger('DEBUG', "fetching from url '$metaurl' for '$fileurl'"); |
|
# if no filetime then now |
|
$filetime = stime(time) unless ($filetime); |
|
# register file in db |
|
my $fid = registerFile("$fileurl", $filetime); |
|
if ($fid) { |
# try to parse index file |
# try to parse index file |
my $ret = eval{$metaParser->parse_uri($metaurl)}; |
my $ret = eval{$metaParser->parse_uri($metaurl)}; |
if ($@) { |
if ($@) { |
Line 269 sub harvestURL {
|
Line 278 sub harvestURL {
|
$warncnt++; |
$warncnt++; |
return; |
return; |
} |
} |
# filetime is now |
|
my $filetime = stime(time); |
|
# register file in db |
|
my $fid = registerFile("$fileurl", $filetime); |
|
if ($fid) { |
|
# file is new/modified |
# file is new/modified |
registerMeta($fid, @data); |
registerMeta($fid, @data); |
} |
} |