annotate makemeta-vlp.pl @ 48:173e9823761e

fixed typo in mapping
author casties
date Thu, 14 Dec 2006 16:50:05 +0100
parents af4323868086
children 8e19bc5ca86a
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
21
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
1 #!/usr/local/bin/perl -w
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
2
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
3 use strict;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
4 use XML::LibXML;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
5
22
c3defe3e2780 corrected perl lib path
casties
parents: 21
diff changeset
6 use lib '/usr/local/mpiwg/archive';
21
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
7 use MPIWGStor;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
8
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
9 # make output unbuffered
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
10 $|=1;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
11
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
12 # program version
48
173e9823761e fixed typo in mapping
casties
parents: 44
diff changeset
13 my $version = "0.2.5 (14.12.2006 ROC)";
21
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
14 my $help =
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
15 "use: makemeta-vlp [options] file.xml
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
16 options:
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
17 -debug show debugging info
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
18 -dry-run simulate, dont'do anything
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
19 -replace replace existing index files
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
20 -online-mode mode for creating online/permanent files
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
21 -archive-mode mode for creating archive/data files
44
af4323868086 added production-comment, derived-from and access handling
casties
parents: 38
diff changeset
22 -access=free adds free access tag for online-mode
21
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
23 ";
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
24 logger("INFO", "makemeta-vlp $version");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
25
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
26 ###########################################
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
27 # mappings
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
28
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
29 # generic mappings at top level
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
30 my %gen_map = (
44
af4323868086 added production-comment, derived-from and access handling
casties
parents: 38
diff changeset
31 'Custom2_Language' => 'meta/lang',
48
173e9823761e fixed typo in mapping
casties
parents: 44
diff changeset
32 'productionComment' => 'meta/image-acquisition/production-comment',
44
af4323868086 added production-comment, derived-from and access handling
casties
parents: 38
diff changeset
33 'derivedFrom' => 'derived-from/archive-path'
21
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
34 );
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
35 # sub type switch tag
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
36 my %type_map = (
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
37 'ReferenceType' => 'meta/bib@type'
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
38 );
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
39 # sub type mappings
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
40 my %subtype_map = (
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
41 'Book' => {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
42 '_name' => 'book',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
43 'Author' => 'meta/bib/author',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
44 'Title' => 'meta/bib/title',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
45 'Year' => 'meta/bib/year',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
46 'Place_Published' => 'meta/bib/city',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
47 'Publisher' => 'meta/bib/publisher',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
48 'Edition' => 'meta/bib/edition',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
49 'Volume' => 'meta/bib/volume',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
50 'NumberOfVolumes' => 'meta/bib/number-of-volumes',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
51 'Pages' => 'meta/bib/number-of-pages'
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
52 },
31
de63fae5f483 added document type (Book)
casties
parents: 22
diff changeset
53 '(Book)' => {
de63fae5f483 added document type (Book)
casties
parents: 22
diff changeset
54 '_name' => 'book',
de63fae5f483 added document type (Book)
casties
parents: 22
diff changeset
55 'Author' => 'meta/bib/author',
de63fae5f483 added document type (Book)
casties
parents: 22
diff changeset
56 'Title' => 'meta/bib/title',
de63fae5f483 added document type (Book)
casties
parents: 22
diff changeset
57 'Year' => 'meta/bib/year',
de63fae5f483 added document type (Book)
casties
parents: 22
diff changeset
58 'Place_Published' => 'meta/bib/city',
de63fae5f483 added document type (Book)
casties
parents: 22
diff changeset
59 'Publisher' => 'meta/bib/publisher',
de63fae5f483 added document type (Book)
casties
parents: 22
diff changeset
60 'Edition' => 'meta/bib/edition',
de63fae5f483 added document type (Book)
casties
parents: 22
diff changeset
61 'Volume' => 'meta/bib/volume',
de63fae5f483 added document type (Book)
casties
parents: 22
diff changeset
62 'NumberOfVolumes' => 'meta/bib/number-of-volumes',
de63fae5f483 added document type (Book)
casties
parents: 22
diff changeset
63 'Pages' => 'meta/bib/number-of-pages',
de63fae5f483 added document type (Book)
casties
parents: 22
diff changeset
64 '#Cover pages only, book sections have been extracted' => 'meta/bib/comment'
de63fae5f483 added document type (Book)
casties
parents: 22
diff changeset
65 },
21
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
66 'Book Section' => {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
67 '_name' => 'inbook',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
68 'Author' => 'meta/bib/author',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
69 'Title' => 'meta/bib/title',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
70 'Year' => 'meta/bib/year',
31
de63fae5f483 added document type (Book)
casties
parents: 22
diff changeset
71 'SecondaryTitle' => 'meta/bib/book-title',
21
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
72 'SecondaryAuthor' => 'meta/bib/editor',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
73 'Volume' => 'meta/bib/volume',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
74 'NumberOfVolumes' => 'meta/bib/number-of-volumes',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
75 'Pages' => 'meta/bib/pages'
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
76 },
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
77 'Edited Book' => {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
78 '_name' => 'edited-book',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
79 'Author' => 'meta/bib/editor',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
80 'Title' => 'meta/bib/title',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
81 'Year' => 'meta/bib/year',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
82 'Place_Published' => 'meta/bib/city',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
83 'Publisher' => 'meta/bib/publisher',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
84 'Edition' => 'meta/bib/edition',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
85 'Volume' => 'meta/bib/volume',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
86 'NumberOfVolumes' => 'meta/bib/number-of-volumes',
33
9868f6ed9a54 added (Edited Book) type
casties
parents: 31
diff changeset
87 'Pages' => 'meta/bib/number-of-pages',
9868f6ed9a54 added (Edited Book) type
casties
parents: 31
diff changeset
88 '#Cover pages only, book sections have been extracted' => 'meta/bib/comment'
9868f6ed9a54 added (Edited Book) type
casties
parents: 31
diff changeset
89 },
9868f6ed9a54 added (Edited Book) type
casties
parents: 31
diff changeset
90 '(Edited Book)' => {
9868f6ed9a54 added (Edited Book) type
casties
parents: 31
diff changeset
91 '_name' => 'edited-book',
9868f6ed9a54 added (Edited Book) type
casties
parents: 31
diff changeset
92 'Author' => 'meta/bib/editor',
9868f6ed9a54 added (Edited Book) type
casties
parents: 31
diff changeset
93 'Title' => 'meta/bib/title',
9868f6ed9a54 added (Edited Book) type
casties
parents: 31
diff changeset
94 'Year' => 'meta/bib/year',
9868f6ed9a54 added (Edited Book) type
casties
parents: 31
diff changeset
95 'Place_Published' => 'meta/bib/city',
9868f6ed9a54 added (Edited Book) type
casties
parents: 31
diff changeset
96 'Publisher' => 'meta/bib/publisher',
9868f6ed9a54 added (Edited Book) type
casties
parents: 31
diff changeset
97 'Edition' => 'meta/bib/edition',
9868f6ed9a54 added (Edited Book) type
casties
parents: 31
diff changeset
98 'Volume' => 'meta/bib/volume',
9868f6ed9a54 added (Edited Book) type
casties
parents: 31
diff changeset
99 'NumberOfVolumes' => 'meta/bib/number-of-volumes',
21
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
100 'Pages' => 'meta/bib/number-of-pages'
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
101 },
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
102 'Journal Article' => {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
103 '_name' => 'journal-article',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
104 'Author' => 'meta/bib/author',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
105 'Title' => 'meta/bib/title',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
106 'Year' => 'meta/bib/year',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
107 'SecondaryTitle' => 'meta/bib/journal',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
108 'Volume' => 'meta/bib/volume',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
109 'Number_Issue' => 'meta/bib/issue',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
110 'Pages' => 'meta/bib/pages'
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
111 },
38
7bf843ac256b new bib type (JournalVolume)
casties
parents: 33
diff changeset
112 '(JournalVolume)' => {
7bf843ac256b new bib type (JournalVolume)
casties
parents: 33
diff changeset
113 '_name' => 'journal-volume',
7bf843ac256b new bib type (JournalVolume)
casties
parents: 33
diff changeset
114 'SecondaryTitle' => 'meta/bib/title',
7bf843ac256b new bib type (JournalVolume)
casties
parents: 33
diff changeset
115 'SecondaryAuthor' => 'meta/bib/editor',
7bf843ac256b new bib type (JournalVolume)
casties
parents: 33
diff changeset
116 'Publisher' => 'meta/bib/publisher',
7bf843ac256b new bib type (JournalVolume)
casties
parents: 33
diff changeset
117 'Place_Published' => 'meta/bib/city',
7bf843ac256b new bib type (JournalVolume)
casties
parents: 33
diff changeset
118 'Year' => 'meta/bib/year',
7bf843ac256b new bib type (JournalVolume)
casties
parents: 33
diff changeset
119 'Volume' => 'meta/bib/volume',
7bf843ac256b new bib type (JournalVolume)
casties
parents: 33
diff changeset
120 'Pages' => 'meta/bib/number-of-pages',
7bf843ac256b new bib type (JournalVolume)
casties
parents: 33
diff changeset
121 '#Cover pages only, articles have been extracted' => 'meta/bib/comment'
7bf843ac256b new bib type (JournalVolume)
casties
parents: 33
diff changeset
122 },
21
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
123 'Magazine Article' => {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
124 '_name' => 'magazine-article',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
125 'Author' => 'meta/bib/author',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
126 'Title' => 'meta/bib/title',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
127 'Year' => 'meta/bib/year',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
128 'Secondary_Title' => 'meta/bib/magazine',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
129 'Number_Issue' => 'meta/bib/issue-number',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
130 'Date' => 'meta/bib/issue-date',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
131 'Pages' => 'meta/bib/pages'
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
132 },
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
133 'Report' => {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
134 '_name' => 'report',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
135 'Author' => 'meta/bib/author',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
136 'Title' => 'meta/bib/title',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
137 'Year' => 'meta/bib/year',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
138 'Place_Published' => 'meta/bib/city',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
139 'Date' => 'meta/bib/date',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
140 'SecondaryTitle' => 'meta/bib/type',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
141 'Pages' => 'meta/bib/pages'
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
142 },
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
143 'Trade Catalogue' => {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
144 '_name' => 'report',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
145 'Author' => 'meta/bib/author',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
146 'Title' => 'meta/bib/title',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
147 'Year' => 'meta/bib/year',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
148 'Place_Published' => 'meta/bib/city',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
149 'Date' => 'meta/bib/date',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
150 'Volume' => 'meta/bib/volume',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
151 'NumberOfVolumes' => 'meta/bib/number-of-volumes',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
152 'ReferenceType' => 'meta/bib/type',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
153 'Pages' => 'meta/bib/pages'
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
154 },
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
155 'Thesis' => {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
156 '_name' => 'thesis',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
157 'Author' => 'meta/bib/author',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
158 'Title' => 'meta/bib/title',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
159 'Place_Published' => 'meta/bib/city',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
160 'Publisher' => 'meta/bib/university',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
161 'Date' => 'meta/bib/date',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
162 'TypeOfWork' => 'meta/bib/type',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
163 'Pages' => 'meta/bib/number-of-pages'
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
164 },
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
165 'Manuscript' => {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
166 '_name' => 'manuscript',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
167 'Author' => 'meta/bib/author',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
168 'Title' => 'meta/bib/title',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
169 'Year' => 'meta/bib/year',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
170 'Place_Published' => 'meta/bib/location',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
171 'Pages' => 'meta/bib/pages'
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
172 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
173 );
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
174 # language element
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
175 my $lang_field = 'Custom2_Language';
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
176 # languages to iso codes
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
177 my %lang_map = (
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
178 'German' => 'de',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
179 'English' => 'en',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
180 'Italian' => 'it',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
181 'French' => 'fr',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
182 'Latin' => 'la',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
183 'Japanese' => 'ja',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
184 'Dutch' => 'nl',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
185 'Spanish' => 'es',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
186 'Swedish' => 'sv'
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
187 );
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
188 # storage fields
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
189 my $arch_id_field = 'ID';
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
190
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
191 #######################################################
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
192 # internal parameters
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
193 #
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
194
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
195 # storage
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
196 my $lib_arch_dir = '/mpiwg/archive/data/vlp';
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
197 my $lib_online_dir = '/mpiwg/online/permanent/vlp';
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
198
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
199 # read command line parameters
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
200 my $args = MPIWGStor::parseargs;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
201 if (! scalar(%$args)) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
202 print $help, "\n";
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
203 exit 1;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
204 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
205
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
206 # debug level
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
207 $debug = (exists $$args{'debug'}) ? $$args{'debug'} : 0;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
208
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
209 # simulate action only
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
210 my $dry_run = (exists $$args{'dry-run'}) ? $$args{'dry-run'} : 0;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
211 logger('DEBUG', "dry-run: $dry_run");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
212
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
213 # replace existing index files
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
214 my $do_replace = (exists $$args{'replace'}) ? $$args{'replace'} : 0;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
215 logger('DEBUG', "replace: $do_replace");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
216
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
217 # use online mode
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
218 my $online_mode = (exists $$args{'online-mode'}) ? $$args{'online-mode'} : 0;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
219 logger('DEBUG', "online_mode: $online_mode");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
220
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
221 # use archive mode
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
222 my $archive_mode = (exists $$args{'archive-mode'}) ? $$args{'archive-mode'} : 0;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
223 logger('DEBUG', "archive_mode: $archive_mode");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
224
44
af4323868086 added production-comment, derived-from and access handling
casties
parents: 38
diff changeset
225 # access type
af4323868086 added production-comment, derived-from and access handling
casties
parents: 38
diff changeset
226 my $access_type = (exists $$args{'access'}) ? $$args{'access'} : "";
af4323868086 added production-comment, derived-from and access handling
casties
parents: 38
diff changeset
227
21
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
228 # index.meta namespace (not really implemented!)
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
229 my $namespace = "";
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
230
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
231
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
232 my $xml_changed = 0;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
233 my $errcnt = 0;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
234 my $warncnt = 0;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
235
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
236 #######################################################
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
237 # check parameters that were passed to the program
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
238 #
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
239 my $infile = $$args{'path'};
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
240 if (! $infile) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
241 logger("ABORT", "no input file given!");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
242 exit 1;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
243 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
244 # strip double slashes
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
245 $infile =~ s/\/\//\//;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
246 if (! -f $infile) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
247 logger("ABORT", "input file \'$infile\' doesn't exist!");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
248 exit 1;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
249 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
250
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
251
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
252 #######################################################
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
253 # subroutines
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
254 #
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
255
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
256
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
257 sub find_arch_dir {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
258 my ($input_node) = @_;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
259 my $dir = "";
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
260
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
261 my $bib_id = $input_node->findvalue("fm:$arch_id_field");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
262 #logger('DEBUG', "bibdir: $bib_dir");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
263 if ($bib_id) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
264 $dir = "$lib_arch_dir/lit$bib_id";
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
265 if (-d $dir) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
266 logger('DEBUG', "directory $dir exists");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
267 return $dir;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
268 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
269 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
270 return;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
271 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
272
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
273 sub find_permanent_dir {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
274 my ($input_node) = @_;
44
af4323868086 added production-comment, derived-from and access handling
casties
parents: 38
diff changeset
275 my $online_base = $lib_online_dir;
21
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
276 my $dest_id = sstrip($input_node->findvalue("fm:$arch_id_field"));
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
277 if (! $dest_id) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
278 logger('ERROR', "no ID field for online permanent entry");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
279 $errcnt++;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
280 return;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
281 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
282 my $dir = "$online_base/lit$dest_id";
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
283 return $dir;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
284 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
285
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
286
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
287 sub convert_bib {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
288 my ($input_node, $index_root, $index_doc) = @_;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
289 my $cnt = 0;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
290 my $type = "";
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
291 my $type_path = "";
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
292
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
293 # process general stuff first
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
294 foreach my $n ($input_node->getChildNodes()) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
295 my $name = $n->nodeName();
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
296 my $val = $n->textContent();
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
297 #logger('DEBUG', " NODE: $name = '$val'");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
298 if (exists $gen_map{$name}) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
299 # is a general field
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
300 if ($name eq $lang_field) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
301 # language field
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
302 if (not $val) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
303 logger('WARNING', "no language tag");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
304 $warncnt++;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
305 next;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
306 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
307 # convert to iso code
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
308 if (exists $lang_map{$val}) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
309 $val = $lang_map{$val};
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
310 } else {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
311 logger('ERROR', "unknown language: $val! skipping...");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
312 $errcnt++;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
313 return 0;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
314 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
315 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
316 create_element_path($gen_map{$name}, $index_root, $namespace)
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
317 ->appendTextNode($val);
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
318 $cnt++;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
319 } elsif (exists $type_map{$name}) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
320 # is a type field
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
321 $type_path = $type_map{$name};
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
322 $type = $val;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
323 # check with known types
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
324 if (exists $subtype_map{$val}) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
325 my $indextype = $subtype_map{$val}->{'_name'};
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
326 create_element_path("$type_path=$indextype", $index_root, $namespace);
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
327 $cnt++;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
328 } else {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
329 logger('ERROR', "unknown bib type $val! skipping...");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
330 $errcnt++;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
331 return 0;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
332 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
333 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
334 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
335 # process sub type fields
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
336 if ($type) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
337 foreach my $n ($input_node->getChildNodes()) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
338 my $name = $n->nodeName();
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
339 my $val = $n->textContent();
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
340 #logger('DEBUG', " NODE: $name = '$val'");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
341 if (exists $subtype_map{$type}->{$name}) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
342 create_element_path($subtype_map{$type}->{$name}, $index_root, $namespace)
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
343 ->appendTextNode($val);
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
344 $cnt++;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
345 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
346 }
31
de63fae5f483 added document type (Book)
casties
parents: 22
diff changeset
347 # append additional constant fields (beginning with #)
de63fae5f483 added document type (Book)
casties
parents: 22
diff changeset
348 foreach my $k (keys %{$subtype_map{$type}}) {
de63fae5f483 added document type (Book)
casties
parents: 22
diff changeset
349 if ($k =~ /^\#(.*)/) {
de63fae5f483 added document type (Book)
casties
parents: 22
diff changeset
350 my $val = $1;
de63fae5f483 added document type (Book)
casties
parents: 22
diff changeset
351 create_text_path($subtype_map{$type}->{$k}, $val, $index_root, $namespace);
de63fae5f483 added document type (Book)
casties
parents: 22
diff changeset
352 }
de63fae5f483 added document type (Book)
casties
parents: 22
diff changeset
353 }
21
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
354 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
355 return $cnt;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
356 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
357
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
358
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
359
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
360 sub process_all_fm_entries {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
361 my ($input_root) = @_;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
362 my $cnt = 0;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
363
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
364 foreach my $n ($input_root->findnodes('fm:ROW')) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
365 logger('INFO', "processing entry $cnt ...");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
366 process_fm_entry($n);
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
367 $cnt++;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
368 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
369 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
370
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
371
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
372 sub process_fm_entry {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
373 my ($input_node) = @_;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
374 my $index_doc = XML::LibXML::Document->createDocument('1.0', 'UTF-8');
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
375 my $index_root = $index_doc->createElementNS($namespace, 'resource');
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
376 $index_root->addChild($index_doc->createAttributeNS($namespace, 'version', '1.1'));
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
377 $index_root->addChild($index_doc->createAttributeNS($namespace, 'type', 'MPIWG'));
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
378 $index_doc->setDocumentElement($index_root);
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
379
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
380 # try to find the document directory
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
381 my $doc_dir = "";
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
382 if ($online_mode) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
383 $doc_dir = find_permanent_dir($input_node);
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
384 } elsif ($archive_mode) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
385 $doc_dir = find_arch_dir($input_node);
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
386 } else {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
387 $doc_dir = find_permanent_dir($input_node);
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
388 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
389 if (! $doc_dir) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
390 logger('ERROR', "document directory not found! skipping...");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
391 $errcnt++;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
392 return;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
393 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
394
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
395 # check if index.meta exists
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
396 if ( -f "$doc_dir/index.meta") {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
397 if (not $do_replace) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
398 logger('DEBUG', "index file in $doc_dir exists");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
399 return;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
400 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
401 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
402
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
403 # add standard stuff to index.meta
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
404 my ($docname, $docpath) = split_file_path($doc_dir);
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
405 # name and date
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
406 create_text_path('name', $docname, $index_root, $namespace);
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
407 create_text_path('archive-path', $doc_dir, $index_root, $namespace);
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
408 create_text_path('archive-creation-date', stime(time), $index_root, $namespace);
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
409 create_text_path('creator', 'vlp', $index_root, $namespace);
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
410 create_text_path('description', 'a scanned document', $index_root, $namespace);
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
411 if ($archive_mode) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
412 # acquisition
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
413 create_text_path('meta/acquisition/date', stime(time), $index_root, $namespace);
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
414 create_text_path('meta/acquisition/provider/provider-id', 'vlp', $index_root, $namespace);
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
415 create_text_path('meta/acquisition/provider/address', 'Max Planck Institute for the History of Science', $index_root, $namespace);
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
416 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
417 # media
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
418 create_text_path('media-type', 'image', $index_root, $namespace);
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
419 create_text_path('meta/content-type', 'scanned document', $index_root, $namespace);
44
af4323868086 added production-comment, derived-from and access handling
casties
parents: 38
diff changeset
420 # access
af4323868086 added production-comment, derived-from and access handling
casties
parents: 38
diff changeset
421 if ($access_type) {
af4323868086 added production-comment, derived-from and access handling
casties
parents: 38
diff changeset
422 if ($access_type eq "free") {
af4323868086 added production-comment, derived-from and access handling
casties
parents: 38
diff changeset
423 create_element_path('meta/access-conditions/access@type=free', $index_root, $namespace);
af4323868086 added production-comment, derived-from and access handling
casties
parents: 38
diff changeset
424 } else {
af4323868086 added production-comment, derived-from and access handling
casties
parents: 38
diff changeset
425 my $acc_tag = create_element_path('meta/access-conditions/access@type=institution', $index_root, $namespace);
af4323868086 added production-comment, derived-from and access handling
casties
parents: 38
diff changeset
426 create_text_path('name', $access_type, $acc_tag, $namespace);
af4323868086 added production-comment, derived-from and access handling
casties
parents: 38
diff changeset
427 }
af4323868086 added production-comment, derived-from and access handling
casties
parents: 38
diff changeset
428 }
21
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
429
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
430 # convert bib entries
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
431 my $cnt = convert_bib($input_node, $index_root, $index_doc);
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
432 if ($cnt == 0) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
433 # error or nothing to convert
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
434 logger('ERROR', "no bibliographic metadata!");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
435 $errcnt++;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
436 return;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
437 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
438
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
439 # write new index.meta file
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
440 if ($dry_run) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
441 logger('DEBUG', "would write $doc_dir/index.meta");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
442 logger('DEBUG', $index_doc->toString(1));
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
443 } else {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
444 write_xml($index_doc, "$doc_dir/index.meta");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
445 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
446
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
447 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
448
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
449
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
450
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
451
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
452
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
453 #######################################################
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
454 # Main
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
455 #
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
456
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
457 # load filemaker xml dump
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
458 my ($input_doc, $input_root) = read_xml($infile);
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
459 # set namespace prefix
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
460 my $fm_namespace = $input_root->namespaceURI();
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
461 $input_root->setNamespace($fm_namespace, 'fm', 1);
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
462
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
463
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
464 process_all_fm_entries($input_root);
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
465
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
466
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
467 logger("INFO", "$warncnt warnings");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
468 logger("INFO", "$errcnt errors");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
469 if ($errcnt > 0) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
470 logger("ABORT", "there were errors!");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
471 exit 1;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
472 } else {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
473 logger("DONE", "done something successfully!");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
474 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
475