Annotation of foxridge-archiver/MPIWGStor.pm, revision 1.4
1.1 casties 1:
2: #
3: # Library with definitions and common routines for MPIWG storage system
4: # scripts
5: #
6:
7: package MPIWGStor;
8:
9: use strict;
10: use vars qw(@ISA @EXPORT $VERSION
11: $debug %junk_files %index_files $index_file_perm $archived_index_file_perm
12: $file_perm);
13: use Exporter;
14:
# Module version.  Kept as a quoted string on purpose: a bare 0.6.1 literal
# is parsed by Perl as a v-string (the three characters chr(0), chr(6),
# chr(1)), which prints as control characters instead of "0.6.1".
$VERSION = '0.6.1'; # ROC 8.8.2005

@ISA = qw(Exporter);

# Names exported by default into every package that uses this module:
# the configuration variables first, then the helper routines.
@EXPORT = qw($debug %junk_files %index_files $index_file_perm $archived_index_file_perm
             $file_perm
             &parseargs &logger &stime &s2stime &ymd_date &split_file_path &sstrip
             &valid_file_name &valid_dir_name &park_file &unpark_file
             &read_xml &write_xml &add_text_element &create_element_path &create_text_path);
1.1 casties 24:
# debug level; logger() only prints "DEBUG" messages when this is true
$debug = 0;

# junk files (every name maps to itself, so the hash can be used both as
# a lookup table and as a list of names)
%junk_files = map { $_ => $_ } (
    '.HSResource',
    '.HSancillary',
    '.HSicon',
    'Network Trash Folder',
    'TheVolumeSettingsFolder',
    '.DS_Store',
);

# filenames to not delete (but archive)
%index_files = map { $_ => $_ } (
    'index.meta',
    'index.meta.old',
);

# default permissions, given as octal mode literals:
#   normal index files   rw-rw-r--
#   archived index files rw-r--r--
#   all other files      rw-rw-r--
$index_file_perm          = 0664;
$archived_index_file_perm = 0644;
$file_perm                = 0664;
50:
51:
#
# $param_hash = parseargs;
#
# reads @ARGV and returns a reference to a hash with all options.
#
# An argument of the form "-option=value" is stored as option => value.
# An argument of the form "-option" (or "-option=" with an empty value)
# is stored as option => option, so that the flag tests as true.
# Any argument that does not start with "-" is stored under the key
# "path"; if there are several, the last one wins.
#
sub parseargs {
    my %opts;
    foreach my $arg (@ARGV) {
        if ($arg =~ /^-([^=]+)=*(.*)$/) {
            my ($name, $value) = ($1, $2);
            # test the length, not the truth, of the value: "-debug=0"
            # must yield "0" and not fall back to the option name
            $opts{$name} = length($value) ? $value : $name;
        } else {
            $opts{'path'} = $arg;
        }
    }
    return \%opts;
}
69:
70:
#
# logger($level, $message)
#
# prints "$level: $message" followed by a newline to the currently
# selected output handle (normally stdout).  Messages of level "DEBUG"
# are dropped unless the global $debug is true; all other levels are
# always printed.
#
sub logger {
    my ($severity, $text) = @_;
    my $suppressed = ($severity eq "DEBUG") && !$debug;
    print "$severity: $text\n" unless $suppressed;
}
82:
#
# $stime = stime($utime)
#
# formats $utime (seconds since the epoch) in the local time zone as
# the string "YYYY/MM/DD HH:MM:SS"
#
sub stime {
    my ($utime) = @_;
    # localtime yields (sec, min, hour, mday, mon, year, ...); pick the
    # fields in output order.  year counts from 1900, mon from 0.
    my ($year, $mon, $mday, $hour, $min, $sec) = (localtime($utime))[5, 4, 3, 2, 1, 0];
    return sprintf("%d/%02d/%02d %02d:%02d:%02d",
                   $year + 1900, $mon + 1, $mday, $hour, $min, $sec);
}
99:
#
# $stime = s2stime($stime2)
#
# converts a db-like time stamp (2003-09-19 12:43:32+02) into the
# string representation "YYYY/MM/DD HH:MM:SS".  Anything after the
# seconds (such as the time zone offset) is ignored.  Returns the empty
# string if $stime2 contains no such time stamp.
#
sub s2stime {
    my ($s2time) = @_;
    # captures, in order: year, month, day, hour, minute, second
    my @fields = $s2time =~ /(\d+)-(\d+)-(\d+) (\d+):(\d+):(\d+)/;
    return "" unless @fields;
    return sprintf("%d/%02d/%02d %02d:%02d:%02d", @fields);
}
116:
#
# $date = ymd_date($olddate)
#
# converts a date string in mm/dd/yy format to yyyy/mm/dd format.
# Two-digit years below 70 are taken as 20yy, other years below 100 as
# 19yy; larger years are used unchanged.  Returns undef if $olddate
# contains no mm/dd/yy date.
#
sub ymd_date {
    my ($mdy) = @_;
    my $ymd;
    if (my ($month, $day, $year) = $mdy =~ /(\d+)\/(\d+)\/(\d+)/) {
        # extend yy to yyyy
        if ($year < 70) {
            $year += 2000;
        } elsif ($year < 100) {
            $year += 1900;
        }
        $ymd = sprintf "%d/%02d/%02d", $year, $month, $day;
    }
    return $ymd;
}
135:
#
# ($name, $path) = split_file_path($fn)
#
# splits the file path $fn into
# file name (the last path element) and path (everything before the
# last "/").
#
# If $fn contains no "/" (or ends in "/"), the whole of $fn is returned
# as the name and the path is ".".  For a file directly below the root
# ("/name") the path is "/", so that the returned path always names a
# directory and never is the empty string.
#
sub split_file_path {
    my ($fn) = @_;

    if ($fn =~ /^(.*)\/([^\/]+)$/) {
        my ($dir, $name) = ($1, $2);
        # "/name": everything before the last slash is empty, but the
        # directory meant is the root
        $dir = '/' if $dir eq '';
        return ($name, $dir);
    }
    return ($fn, '.'); # only file name
}
150:
151:
#
# $name = sstrip($name)
#
# strips leading and trailing whitespace from $name and returns the
# result.  Whitespace inside the string (including newlines) is kept.
# An undefined $name yields the empty string.
#
sub sstrip {
    my ($name) = @_;

    return '' unless defined $name;
    # two anchored substitutions: a single /\s*(.*)\s*/ match cannot do
    # this, because the greedy (.*) swallows the trailing whitespace
    $name =~ s/\A\s+//;
    $name =~ s/\s+\z//;
    return $name;
}
165:
166:
#
# $valid = valid_file_name($name)
#
# checks if $name is a valid file name; this is valid_name() in file
# mode (mode 0).  Returns 1 if valid, 0 otherwise.
#
sub valid_file_name {
    my ($candidate) = @_;
    return valid_name($candidate, 0);
}
175:
176:
#
# $valid = valid_dir_name($name)
#
# checks if $name is a valid directory name; this is valid_name() in
# directory mode (mode 1).  Returns 1 if valid, 0 otherwise.
#
sub valid_dir_name {
    my ($candidate) = @_;
    return valid_name($candidate, 1);
}
185:
186:
#
# $valid = valid_name($name, $mode)
#
# checks if $name is a valid file ($mode=0) or directory name ($mode=1).
#
# A valid name contains no whitespace and consists only of word
# characters, "-", "." and "/".  A file name must in addition end in an
# extension: a "." followed by word characters or "-".
# Returns 1 if valid, 0 otherwise.
#
sub valid_name {
    my ($name, $mode) = @_;

    # whitespace?
    return 0 if $name =~ /\s+/;
    # invalid characters
    return 0 unless $name =~ /^[-\w.\/]+$/;
    # files have extension
    return 0 if $mode == 0 && $name !~ /\.[-\w]+$/;

    return 1;
}
1.2 casties 211:
212:
#
# $newfilename = park_file($filename)
#
# parks a file under a new name (*.bak) by renaming it.
#
# Returns the new name, or the empty string if $filename is not an
# existing plain file (nothing is done in that case).  If the rename
# fails, an ABORT message is logged and the program exits with status 1.
#
sub park_file {
    my ($filename) = @_;

    return "" unless -f $filename;

    my $parked = "$filename.bak";
    unless (rename $filename, $parked) {
        logger("ABORT", "unable to rename file $filename!");
        exit 1;
    }
    return $parked;
}
230:
#
# $filename = unpark_file($filename)
#
# unparks a file: renames "$filename.bak" back to $filename.
#
# Returns $filename, or the empty string if there is no plain file
# "$filename.bak".  If the rename fails, an ABORT message is logged and
# the program exits with status 1.
#
sub unpark_file {
    my ($filename) = @_;
    my $parked = $filename . ".bak";

    return "" unless -f $parked;

    unless (rename $parked, $filename) {
        logger("ABORT", "unable to rename file $parked!");
        exit 1;
    }
    return $filename;
}
248:
1.1 casties 249:
250:
#
# ($document, $rootnode) = read_xml($file)
#
# reads xml meta file $file
# returns the parsed document and its root node element.
#
# If the parser cannot be created or parse_file() fails on $file, an
# ABORT message is logged and the program exits with status 1.
#
sub read_xml {
    my ($file) = @_;
    my $document;

    # Load the parser class on demand: nothing else in this module
    # loads XML::LibXML, so without this the call below only works if
    # the calling script happens to have loaded it already.
    require XML::LibXML;

    my $parser = XML::LibXML->new();
    if (! $parser) {
        logger("ABORT", "unable to create parser for metadata index file!!");
        exit 1;
    }

    logger("DEBUG", "index file: $file");
    eval { $document = $parser->parse_file($file) };
    # catch parsing errors
    if ($@) {
        # keep a copy: $@ is a global that later code may overwrite
        my $parser_error = $@;
        logger("ABORT", "XML syntax error in file $file!!");
        # the parser's own text tells what actually went wrong
        logger("DEBUG", "parser message: $parser_error");
        exit 1;
    }
    my $rootnode = $document->documentElement;
    logger("DEBUG", "root element: \'" . $rootnode->nodeName . "\'");

    return ($document, $rootnode);
}
279:
280:
#
# write_xml($document, $file)
#
# saves the XML tree of $document to the file $file.
#
# An existing plain file $file is first renamed to "$file.old" as a
# backup copy.  After a successful write the file mode is set to
# $index_file_perm.  If the backup rename fails, the target directory
# does not exist or the write fails, an ABORT message is logged and the
# program exits with status 1.
#
sub write_xml {
    my ($document, $filename) = @_;

    # keep backup copy
    if (-f $filename) {
        unless (rename $filename, "$filename.old") {
            logger("ABORT", "unable to change file $filename!");
            exit 1;
        }
    }

    # write new file; only the directory part of the path is needed here
    my (undef, $dir) = split_file_path($filename);
    unless (-d $dir && $document->toFile($filename)) {
        logger("ABORT", "unable to write file $filename!");
        exit 1;
    }

    logger("INFO", "written new file $filename");
    return chmod $index_file_perm, $filename;
}
1.3 casties 305:
#
# $elem = add_text_element($node, $name, $value, $namespace)
#
# appends a new child element named $name (in namespace $namespace) to
# the node $node, gives it a text node with the content $value and
# returns the new element.
#
sub add_text_element {
    my ($node, $name, $value, $namespace) = @_;

    my $element = $node->addNewChild($namespace, $name);
    # text nodes are created by the document that owns $node
    my $content = $node->ownerDocument->createTextNode($value);
    $element->addChild($content);

    return $element;
}
322:
#
# $elem = create_element_path($path, $root, $namespace)
#
# creates and returns a DOM element at the given path from the
# given root. path is e.g. meta/bib@type=book. elements are separated
# by /, an additional attribute can be specified after the @.
#
# Path elements that already exist below $root are reused (the first
# match is taken); missing ones are created in namespace $namespace.
# The attribute is written as key=value; it is split at the first "=",
# so the value itself may contain "=".  The attribute is added to the
# last element of the path, which is the element returned.
#
sub create_element_path {
    my ($path, $root, $namespace) = @_;
    my $attribute = "";
    # get attribute (the part after the last @)
    if ($path =~ /^(.+)@(.+)$/) {
        ($path, $attribute) = ($1, $2);
    }
    my $point = $root;
    for my $step (split /\//, $path) {
        # check if the next path element exists
        my ($existing) = $point->findnodes($step);
        if ($existing) {
            $point = $existing;
        } else {
            # create if it doesn't exist
            $point = $point->addNewChild($namespace, $step);
        }
    }
    # add the attribute
    if ($attribute) {
        my $dom = $root->getOwner();
        # limit of 2: only the first "=" separates key and value
        my ($attkey, $attval) = split /=/, $attribute, 2;
        $point->addChild($dom->createAttributeNS($namespace, $attkey, $attval));
    }
    return $point;
}
357:
#
# $elem = create_text_path($path, $text, $root, $namespace)
#
# creates a DOM element at the given path from the given root (see
# create_element_path for the path syntax), appends the text $text to
# it and returns the element.
#
sub create_text_path {
    my ($path, $text, $root, $namespace) = @_;
    my $elem = create_element_path($path, $root, $namespace);
    # Return the element itself rather than the result of
    # appendTextNode, which has no documented return value.
    $elem->appendTextNode($text);
    return $elem;
}
369:
1.1 casties 370:
371:
# module init: a file loaded with "use" or "require" must end in a true
# value.  A plain "1;" is used rather than "return 1;" because a
# top-level return fails with "Can't return outside a subroutine" when
# the file is executed directly.
1;
FreeBSD-CVSweb <freebsd-cvsweb@FreeBSD.org>