annotate makemeta-vlp.pl @ 54:8e19bc5ca86a

added some more languages
author casties
date Mon, 02 Feb 2009 12:45:15 +0100
parents 173e9823761e
children 9d7df218f94c
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
21
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
1 #!/usr/local/bin/perl -w
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
2
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
3 use strict;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
4 use XML::LibXML;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
5
22
c3defe3e2780 corrected perl lib path
casties
parents: 21
diff changeset
6 use lib '/usr/local/mpiwg/archive';
21
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
7 use MPIWGStor;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
8
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
9 # make output unbuffered
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
10 $|=1;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
11
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
12 # program version
54
8e19bc5ca86a added some more languages
casties
parents: 48
diff changeset
13 my $version = "0.2.6 (1.2.2009 ROC)";
21
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
14 my $help =
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
15 "use: makemeta-vlp [options] file.xml
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
16 options:
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
17 -debug show debugging info
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
18 -dry-run simulate, dont'do anything
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
19 -replace replace existing index files
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
20 -online-mode mode for creating online/permanent files
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
21 -archive-mode mode for creating archive/data files
44
af4323868086 added production-comment, derived-from and access handling
casties
parents: 38
diff changeset
22 -access=free adds free access tag for online-mode
21
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
23 ";
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
24 logger("INFO", "makemeta-vlp $version");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
25
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
26 ###########################################
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
27 # mappings
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
28
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
29 # generic mappings at top level
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
30 my %gen_map = (
44
af4323868086 added production-comment, derived-from and access handling
casties
parents: 38
diff changeset
31 'Custom2_Language' => 'meta/lang',
48
173e9823761e fixed typo in mapping
casties
parents: 44
diff changeset
32 'productionComment' => 'meta/image-acquisition/production-comment',
44
af4323868086 added production-comment, derived-from and access handling
casties
parents: 38
diff changeset
33 'derivedFrom' => 'derived-from/archive-path'
21
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
34 );
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
35 # sub type switch tag
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
36 my %type_map = (
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
37 'ReferenceType' => 'meta/bib@type'
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
38 );
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
39 # sub type mappings
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
40 my %subtype_map = (
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
41 'Book' => {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
42 '_name' => 'book',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
43 'Author' => 'meta/bib/author',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
44 'Title' => 'meta/bib/title',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
45 'Year' => 'meta/bib/year',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
46 'Place_Published' => 'meta/bib/city',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
47 'Publisher' => 'meta/bib/publisher',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
48 'Edition' => 'meta/bib/edition',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
49 'Volume' => 'meta/bib/volume',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
50 'NumberOfVolumes' => 'meta/bib/number-of-volumes',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
51 'Pages' => 'meta/bib/number-of-pages'
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
52 },
31
de63fae5f483 added document type (Book)
casties
parents: 22
diff changeset
53 '(Book)' => {
de63fae5f483 added document type (Book)
casties
parents: 22
diff changeset
54 '_name' => 'book',
de63fae5f483 added document type (Book)
casties
parents: 22
diff changeset
55 'Author' => 'meta/bib/author',
de63fae5f483 added document type (Book)
casties
parents: 22
diff changeset
56 'Title' => 'meta/bib/title',
de63fae5f483 added document type (Book)
casties
parents: 22
diff changeset
57 'Year' => 'meta/bib/year',
de63fae5f483 added document type (Book)
casties
parents: 22
diff changeset
58 'Place_Published' => 'meta/bib/city',
de63fae5f483 added document type (Book)
casties
parents: 22
diff changeset
59 'Publisher' => 'meta/bib/publisher',
de63fae5f483 added document type (Book)
casties
parents: 22
diff changeset
60 'Edition' => 'meta/bib/edition',
de63fae5f483 added document type (Book)
casties
parents: 22
diff changeset
61 'Volume' => 'meta/bib/volume',
de63fae5f483 added document type (Book)
casties
parents: 22
diff changeset
62 'NumberOfVolumes' => 'meta/bib/number-of-volumes',
de63fae5f483 added document type (Book)
casties
parents: 22
diff changeset
63 'Pages' => 'meta/bib/number-of-pages',
de63fae5f483 added document type (Book)
casties
parents: 22
diff changeset
64 '#Cover pages only, book sections have been extracted' => 'meta/bib/comment'
de63fae5f483 added document type (Book)
casties
parents: 22
diff changeset
65 },
21
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
66 'Book Section' => {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
67 '_name' => 'inbook',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
68 'Author' => 'meta/bib/author',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
69 'Title' => 'meta/bib/title',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
70 'Year' => 'meta/bib/year',
31
de63fae5f483 added document type (Book)
casties
parents: 22
diff changeset
71 'SecondaryTitle' => 'meta/bib/book-title',
21
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
72 'SecondaryAuthor' => 'meta/bib/editor',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
73 'Volume' => 'meta/bib/volume',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
74 'NumberOfVolumes' => 'meta/bib/number-of-volumes',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
75 'Pages' => 'meta/bib/pages'
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
76 },
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
77 'Edited Book' => {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
78 '_name' => 'edited-book',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
79 'Author' => 'meta/bib/editor',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
80 'Title' => 'meta/bib/title',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
81 'Year' => 'meta/bib/year',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
82 'Place_Published' => 'meta/bib/city',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
83 'Publisher' => 'meta/bib/publisher',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
84 'Edition' => 'meta/bib/edition',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
85 'Volume' => 'meta/bib/volume',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
86 'NumberOfVolumes' => 'meta/bib/number-of-volumes',
33
9868f6ed9a54 added (Edited Book) type
casties
parents: 31
diff changeset
87 'Pages' => 'meta/bib/number-of-pages',
9868f6ed9a54 added (Edited Book) type
casties
parents: 31
diff changeset
88 '#Cover pages only, book sections have been extracted' => 'meta/bib/comment'
9868f6ed9a54 added (Edited Book) type
casties
parents: 31
diff changeset
89 },
9868f6ed9a54 added (Edited Book) type
casties
parents: 31
diff changeset
90 '(Edited Book)' => {
9868f6ed9a54 added (Edited Book) type
casties
parents: 31
diff changeset
91 '_name' => 'edited-book',
9868f6ed9a54 added (Edited Book) type
casties
parents: 31
diff changeset
92 'Author' => 'meta/bib/editor',
9868f6ed9a54 added (Edited Book) type
casties
parents: 31
diff changeset
93 'Title' => 'meta/bib/title',
9868f6ed9a54 added (Edited Book) type
casties
parents: 31
diff changeset
94 'Year' => 'meta/bib/year',
9868f6ed9a54 added (Edited Book) type
casties
parents: 31
diff changeset
95 'Place_Published' => 'meta/bib/city',
9868f6ed9a54 added (Edited Book) type
casties
parents: 31
diff changeset
96 'Publisher' => 'meta/bib/publisher',
9868f6ed9a54 added (Edited Book) type
casties
parents: 31
diff changeset
97 'Edition' => 'meta/bib/edition',
9868f6ed9a54 added (Edited Book) type
casties
parents: 31
diff changeset
98 'Volume' => 'meta/bib/volume',
9868f6ed9a54 added (Edited Book) type
casties
parents: 31
diff changeset
99 'NumberOfVolumes' => 'meta/bib/number-of-volumes',
21
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
100 'Pages' => 'meta/bib/number-of-pages'
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
101 },
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
102 'Journal Article' => {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
103 '_name' => 'journal-article',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
104 'Author' => 'meta/bib/author',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
105 'Title' => 'meta/bib/title',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
106 'Year' => 'meta/bib/year',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
107 'SecondaryTitle' => 'meta/bib/journal',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
108 'Volume' => 'meta/bib/volume',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
109 'Number_Issue' => 'meta/bib/issue',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
110 'Pages' => 'meta/bib/pages'
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
111 },
38
7bf843ac256b new bib type (JournalVolume)
casties
parents: 33
diff changeset
112 '(JournalVolume)' => {
7bf843ac256b new bib type (JournalVolume)
casties
parents: 33
diff changeset
113 '_name' => 'journal-volume',
7bf843ac256b new bib type (JournalVolume)
casties
parents: 33
diff changeset
114 'SecondaryTitle' => 'meta/bib/title',
7bf843ac256b new bib type (JournalVolume)
casties
parents: 33
diff changeset
115 'SecondaryAuthor' => 'meta/bib/editor',
7bf843ac256b new bib type (JournalVolume)
casties
parents: 33
diff changeset
116 'Publisher' => 'meta/bib/publisher',
7bf843ac256b new bib type (JournalVolume)
casties
parents: 33
diff changeset
117 'Place_Published' => 'meta/bib/city',
7bf843ac256b new bib type (JournalVolume)
casties
parents: 33
diff changeset
118 'Year' => 'meta/bib/year',
7bf843ac256b new bib type (JournalVolume)
casties
parents: 33
diff changeset
119 'Volume' => 'meta/bib/volume',
7bf843ac256b new bib type (JournalVolume)
casties
parents: 33
diff changeset
120 'Pages' => 'meta/bib/number-of-pages',
7bf843ac256b new bib type (JournalVolume)
casties
parents: 33
diff changeset
121 '#Cover pages only, articles have been extracted' => 'meta/bib/comment'
7bf843ac256b new bib type (JournalVolume)
casties
parents: 33
diff changeset
122 },
21
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
123 'Magazine Article' => {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
124 '_name' => 'magazine-article',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
125 'Author' => 'meta/bib/author',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
126 'Title' => 'meta/bib/title',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
127 'Year' => 'meta/bib/year',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
128 'Secondary_Title' => 'meta/bib/magazine',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
129 'Number_Issue' => 'meta/bib/issue-number',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
130 'Date' => 'meta/bib/issue-date',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
131 'Pages' => 'meta/bib/pages'
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
132 },
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
133 'Report' => {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
134 '_name' => 'report',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
135 'Author' => 'meta/bib/author',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
136 'Title' => 'meta/bib/title',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
137 'Year' => 'meta/bib/year',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
138 'Place_Published' => 'meta/bib/city',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
139 'Date' => 'meta/bib/date',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
140 'SecondaryTitle' => 'meta/bib/type',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
141 'Pages' => 'meta/bib/pages'
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
142 },
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
143 'Trade Catalogue' => {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
144 '_name' => 'report',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
145 'Author' => 'meta/bib/author',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
146 'Title' => 'meta/bib/title',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
147 'Year' => 'meta/bib/year',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
148 'Place_Published' => 'meta/bib/city',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
149 'Date' => 'meta/bib/date',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
150 'Volume' => 'meta/bib/volume',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
151 'NumberOfVolumes' => 'meta/bib/number-of-volumes',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
152 'ReferenceType' => 'meta/bib/type',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
153 'Pages' => 'meta/bib/pages'
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
154 },
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
155 'Thesis' => {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
156 '_name' => 'thesis',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
157 'Author' => 'meta/bib/author',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
158 'Title' => 'meta/bib/title',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
159 'Place_Published' => 'meta/bib/city',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
160 'Publisher' => 'meta/bib/university',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
161 'Date' => 'meta/bib/date',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
162 'TypeOfWork' => 'meta/bib/type',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
163 'Pages' => 'meta/bib/number-of-pages'
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
164 },
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
165 'Manuscript' => {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
166 '_name' => 'manuscript',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
167 'Author' => 'meta/bib/author',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
168 'Title' => 'meta/bib/title',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
169 'Year' => 'meta/bib/year',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
170 'Place_Published' => 'meta/bib/location',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
171 'Pages' => 'meta/bib/pages'
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
172 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
173 );
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
174 # language element
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
175 my $lang_field = 'Custom2_Language';
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
176 # languages to iso codes
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
177 my %lang_map = (
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
178 'German' => 'de',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
179 'English' => 'en',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
180 'Italian' => 'it',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
181 'French' => 'fr',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
182 'Latin' => 'la',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
183 'Japanese' => 'ja',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
184 'Dutch' => 'nl',
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
185 'Spanish' => 'es',
54
8e19bc5ca86a added some more languages
casties
parents: 48
diff changeset
186 'Swedish' => 'sv',
8e19bc5ca86a added some more languages
casties
parents: 48
diff changeset
187 'Russian' => 'ru',
8e19bc5ca86a added some more languages
casties
parents: 48
diff changeset
188 'Polish' => 'pl',
8e19bc5ca86a added some more languages
casties
parents: 48
diff changeset
189 'Greek' => 'el'
21
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
190 );
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
191 # storage fields
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
192 my $arch_id_field = 'ID';
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
193
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
194 #######################################################
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
195 # internal parameters
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
196 #
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
197
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
198 # storage
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
199 my $lib_arch_dir = '/mpiwg/archive/data/vlp';
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
200 my $lib_online_dir = '/mpiwg/online/permanent/vlp';
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
201
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
202 # read command line parameters
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
203 my $args = MPIWGStor::parseargs;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
204 if (! scalar(%$args)) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
205 print $help, "\n";
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
206 exit 1;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
207 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
208
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
209 # debug level
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
210 $debug = (exists $$args{'debug'}) ? $$args{'debug'} : 0;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
211
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
212 # simulate action only
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
213 my $dry_run = (exists $$args{'dry-run'}) ? $$args{'dry-run'} : 0;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
214 logger('DEBUG', "dry-run: $dry_run");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
215
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
216 # replace existing index files
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
217 my $do_replace = (exists $$args{'replace'}) ? $$args{'replace'} : 0;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
218 logger('DEBUG', "replace: $do_replace");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
219
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
220 # use online mode
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
221 my $online_mode = (exists $$args{'online-mode'}) ? $$args{'online-mode'} : 0;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
222 logger('DEBUG', "online_mode: $online_mode");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
223
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
224 # use archive mode
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
225 my $archive_mode = (exists $$args{'archive-mode'}) ? $$args{'archive-mode'} : 0;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
226 logger('DEBUG', "archive_mode: $archive_mode");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
227
44
af4323868086 added production-comment, derived-from and access handling
casties
parents: 38
diff changeset
228 # access type
af4323868086 added production-comment, derived-from and access handling
casties
parents: 38
diff changeset
229 my $access_type = (exists $$args{'access'}) ? $$args{'access'} : "";
af4323868086 added production-comment, derived-from and access handling
casties
parents: 38
diff changeset
230
21
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
231 # index.meta namespace (not really implemented!)
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
232 my $namespace = "";
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
233
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
234
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
235 my $xml_changed = 0;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
236 my $errcnt = 0;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
237 my $warncnt = 0;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
238
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
239 #######################################################
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
240 # check parameters that were passed to the program
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
241 #
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
242 my $infile = $$args{'path'};
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
243 if (! $infile) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
244 logger("ABORT", "no input file given!");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
245 exit 1;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
246 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
247 # strip double slashes
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
248 $infile =~ s/\/\//\//;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
249 if (! -f $infile) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
250 logger("ABORT", "input file \'$infile\' doesn't exist!");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
251 exit 1;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
252 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
253
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
254
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
255 #######################################################
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
256 # subroutines
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
257 #
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
258
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
259
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
260 sub find_arch_dir {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
261 my ($input_node) = @_;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
262 my $dir = "";
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
263
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
264 my $bib_id = $input_node->findvalue("fm:$arch_id_field");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
265 #logger('DEBUG', "bibdir: $bib_dir");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
266 if ($bib_id) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
267 $dir = "$lib_arch_dir/lit$bib_id";
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
268 if (-d $dir) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
269 logger('DEBUG', "directory $dir exists");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
270 return $dir;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
271 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
272 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
273 return;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
274 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
275
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
276 sub find_permanent_dir {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
277 my ($input_node) = @_;
44
af4323868086 added production-comment, derived-from and access handling
casties
parents: 38
diff changeset
278 my $online_base = $lib_online_dir;
21
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
279 my $dest_id = sstrip($input_node->findvalue("fm:$arch_id_field"));
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
280 if (! $dest_id) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
281 logger('ERROR', "no ID field for online permanent entry");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
282 $errcnt++;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
283 return;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
284 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
285 my $dir = "$online_base/lit$dest_id";
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
286 return $dir;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
287 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
288
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
289
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
290 sub convert_bib {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
291 my ($input_node, $index_root, $index_doc) = @_;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
292 my $cnt = 0;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
293 my $type = "";
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
294 my $type_path = "";
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
295
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
296 # process general stuff first
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
297 foreach my $n ($input_node->getChildNodes()) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
298 my $name = $n->nodeName();
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
299 my $val = $n->textContent();
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
300 #logger('DEBUG', " NODE: $name = '$val'");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
301 if (exists $gen_map{$name}) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
302 # is a general field
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
303 if ($name eq $lang_field) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
304 # language field
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
305 if (not $val) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
306 logger('WARNING', "no language tag");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
307 $warncnt++;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
308 next;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
309 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
310 # convert to iso code
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
311 if (exists $lang_map{$val}) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
312 $val = $lang_map{$val};
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
313 } else {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
314 logger('ERROR', "unknown language: $val! skipping...");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
315 $errcnt++;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
316 return 0;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
317 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
318 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
319 create_element_path($gen_map{$name}, $index_root, $namespace)
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
320 ->appendTextNode($val);
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
321 $cnt++;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
322 } elsif (exists $type_map{$name}) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
323 # is a type field
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
324 $type_path = $type_map{$name};
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
325 $type = $val;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
326 # check with known types
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
327 if (exists $subtype_map{$val}) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
328 my $indextype = $subtype_map{$val}->{'_name'};
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
329 create_element_path("$type_path=$indextype", $index_root, $namespace);
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
330 $cnt++;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
331 } else {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
332 logger('ERROR', "unknown bib type $val! skipping...");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
333 $errcnt++;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
334 return 0;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
335 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
336 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
337 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
338 # process sub type fields
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
339 if ($type) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
340 foreach my $n ($input_node->getChildNodes()) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
341 my $name = $n->nodeName();
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
342 my $val = $n->textContent();
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
343 #logger('DEBUG', " NODE: $name = '$val'");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
344 if (exists $subtype_map{$type}->{$name}) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
345 create_element_path($subtype_map{$type}->{$name}, $index_root, $namespace)
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
346 ->appendTextNode($val);
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
347 $cnt++;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
348 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
349 }
31
de63fae5f483 added document type (Book)
casties
parents: 22
diff changeset
350 # append additional constant fields (beginning with #)
de63fae5f483 added document type (Book)
casties
parents: 22
diff changeset
351 foreach my $k (keys %{$subtype_map{$type}}) {
de63fae5f483 added document type (Book)
casties
parents: 22
diff changeset
352 if ($k =~ /^\#(.*)/) {
de63fae5f483 added document type (Book)
casties
parents: 22
diff changeset
353 my $val = $1;
de63fae5f483 added document type (Book)
casties
parents: 22
diff changeset
354 create_text_path($subtype_map{$type}->{$k}, $val, $index_root, $namespace);
de63fae5f483 added document type (Book)
casties
parents: 22
diff changeset
355 }
de63fae5f483 added document type (Book)
casties
parents: 22
diff changeset
356 }
21
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
357 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
358 return $cnt;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
359 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
360
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
361
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
362
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
363 sub process_all_fm_entries {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
364 my ($input_root) = @_;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
365 my $cnt = 0;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
366
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
367 foreach my $n ($input_root->findnodes('fm:ROW')) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
368 logger('INFO', "processing entry $cnt ...");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
369 process_fm_entry($n);
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
370 $cnt++;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
371 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
372 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
373
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
374
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
375 sub process_fm_entry {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
376 my ($input_node) = @_;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
377 my $index_doc = XML::LibXML::Document->createDocument('1.0', 'UTF-8');
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
378 my $index_root = $index_doc->createElementNS($namespace, 'resource');
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
379 $index_root->addChild($index_doc->createAttributeNS($namespace, 'version', '1.1'));
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
380 $index_root->addChild($index_doc->createAttributeNS($namespace, 'type', 'MPIWG'));
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
381 $index_doc->setDocumentElement($index_root);
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
382
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
383 # try to find the document directory
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
384 my $doc_dir = "";
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
385 if ($online_mode) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
386 $doc_dir = find_permanent_dir($input_node);
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
387 } elsif ($archive_mode) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
388 $doc_dir = find_arch_dir($input_node);
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
389 } else {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
390 $doc_dir = find_permanent_dir($input_node);
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
391 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
392 if (! $doc_dir) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
393 logger('ERROR', "document directory not found! skipping...");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
394 $errcnt++;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
395 return;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
396 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
397
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
398 # check if index.meta exists
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
399 if ( -f "$doc_dir/index.meta") {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
400 if (not $do_replace) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
401 logger('DEBUG', "index file in $doc_dir exists");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
402 return;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
403 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
404 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
405
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
406 # add standard stuff to index.meta
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
407 my ($docname, $docpath) = split_file_path($doc_dir);
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
408 # name and date
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
409 create_text_path('name', $docname, $index_root, $namespace);
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
410 create_text_path('archive-path', $doc_dir, $index_root, $namespace);
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
411 create_text_path('archive-creation-date', stime(time), $index_root, $namespace);
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
412 create_text_path('creator', 'vlp', $index_root, $namespace);
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
413 create_text_path('description', 'a scanned document', $index_root, $namespace);
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
414 if ($archive_mode) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
415 # acquisition
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
416 create_text_path('meta/acquisition/date', stime(time), $index_root, $namespace);
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
417 create_text_path('meta/acquisition/provider/provider-id', 'vlp', $index_root, $namespace);
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
418 create_text_path('meta/acquisition/provider/address', 'Max Planck Institute for the History of Science', $index_root, $namespace);
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
419 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
420 # media
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
421 create_text_path('media-type', 'image', $index_root, $namespace);
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
422 create_text_path('meta/content-type', 'scanned document', $index_root, $namespace);
44
af4323868086 added production-comment, derived-from and access handling
casties
parents: 38
diff changeset
423 # access
af4323868086 added production-comment, derived-from and access handling
casties
parents: 38
diff changeset
424 if ($access_type) {
af4323868086 added production-comment, derived-from and access handling
casties
parents: 38
diff changeset
425 if ($access_type eq "free") {
af4323868086 added production-comment, derived-from and access handling
casties
parents: 38
diff changeset
426 create_element_path('meta/access-conditions/access@type=free', $index_root, $namespace);
af4323868086 added production-comment, derived-from and access handling
casties
parents: 38
diff changeset
427 } else {
af4323868086 added production-comment, derived-from and access handling
casties
parents: 38
diff changeset
428 my $acc_tag = create_element_path('meta/access-conditions/access@type=institution', $index_root, $namespace);
af4323868086 added production-comment, derived-from and access handling
casties
parents: 38
diff changeset
429 create_text_path('name', $access_type, $acc_tag, $namespace);
af4323868086 added production-comment, derived-from and access handling
casties
parents: 38
diff changeset
430 }
af4323868086 added production-comment, derived-from and access handling
casties
parents: 38
diff changeset
431 }
21
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
432
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
433 # convert bib entries
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
434 my $cnt = convert_bib($input_node, $index_root, $index_doc);
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
435 if ($cnt == 0) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
436 # error or nothing to convert
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
437 logger('ERROR', "no bibliographic metadata!");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
438 $errcnt++;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
439 return;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
440 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
441
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
442 # write new index.meta file
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
443 if ($dry_run) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
444 logger('DEBUG', "would write $doc_dir/index.meta");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
445 logger('DEBUG', $index_doc->toString(1));
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
446 } else {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
447 write_xml($index_doc, "$doc_dir/index.meta");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
448 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
449
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
450 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
451
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
452
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
453
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
454
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
455
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
456 #######################################################
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
457 # Main
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
458 #
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
459
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
460 # load filemaker xml dump
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
461 my ($input_doc, $input_root) = read_xml($infile);
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
462 # set namespace prefix
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
463 my $fm_namespace = $input_root->namespaceURI();
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
464 $input_root->setNamespace($fm_namespace, 'fm', 1);
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
465
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
466
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
467 process_all_fm_entries($input_root);
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
468
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
469
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
470 logger("INFO", "$warncnt warnings");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
471 logger("INFO", "$errcnt errors");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
472 if ($errcnt > 0) {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
473 logger("ABORT", "there were errors!");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
474 exit 1;
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
475 } else {
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
476 logger("DONE", "done something successfully!");
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
477 }
c8e4e8cb31dd new tool for createing index files for vlp documents
casties
parents:
diff changeset
478