annotate documentViewer.py @ 629:e36bf3226fde

text image viewer eingecheckt
author dwinter
date Tue, 26 May 2015 10:58:27 +0200
parents 7dafe8283312
children 0c3aab828864
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
dwinter
parents:
diff changeset
1 from OFS.Folder import Folder
dwinter
parents:
diff changeset
2 from Products.PageTemplates.ZopePageTemplate import ZopePageTemplate
486
f2c5417b7ff4 more new template stuff
casties
parents: 483
diff changeset
3 from Products.PageTemplates.PageTemplateFile import PageTemplateFile
487
8fd6f26fe29e more new templates
casties
parents: 486
diff changeset
4 from App.ImageFile import ImageFile
0
dwinter
parents:
diff changeset
5 from AccessControl import ClassSecurityInfo
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
6 from AccessControl import getSecurityManager
0
dwinter
parents:
diff changeset
7
453
beb7ccb92564 first version using elementtree instead of 4suite xml
casties
parents: 405
diff changeset
8 import xml.etree.ElementTree as ET
beb7ccb92564 first version using elementtree instead of 4suite xml
casties
parents: 405
diff changeset
9
489
55e3398e395e more new templates. monkey-patch for App.ImageFile.
casties
parents: 488
diff changeset
10 import os
0
dwinter
parents:
diff changeset
11 import urllib
50
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
12 import logging
61
f3d2f240692c fixed bug in calculation of group numbers
casties
parents: 59
diff changeset
13 import math
46
31059e3d9338 has now also a text mode viewMode=text
dwinter
parents: 45
diff changeset
14 import urlparse
526
3f375a048402 moved search and dict into separate layers.
casties
parents: 525
diff changeset
15 import json
231
a88ece9a5e74 *** empty log message ***
abukhman
parents: 230
diff changeset
16
541
c4cc01b104d7 better metadata display for index page.
casties
parents: 538
diff changeset
17 from Products.MetaDataProvider import MetaDataFolder
c4cc01b104d7 better metadata display for index page.
casties
parents: 538
diff changeset
18
623
6012fe93f78c better scheme-less URL code.
casties
parents: 622
diff changeset
19 from SrvTxtUtils import getInt, utf8ify, getText, getHttpData, refreshingImageFileIndexHtml, sslifyUrl
52
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
20
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
21
561
9255acc4518d CLOSED - # 256: display texts from different backends (sandbox)
casties
parents: 560
diff changeset
22 def getMDText(node):
9255acc4518d CLOSED - # 256: display texts from different backends (sandbox)
casties
parents: 560
diff changeset
23 """returns the @text content from the MetaDataProvider metadata node"""
9255acc4518d CLOSED - # 256: display texts from different backends (sandbox)
casties
parents: 560
diff changeset
24 if isinstance(node, dict):
9255acc4518d CLOSED - # 256: display texts from different backends (sandbox)
casties
parents: 560
diff changeset
25 return node.get('@text', None)
9255acc4518d CLOSED - # 256: display texts from different backends (sandbox)
casties
parents: 560
diff changeset
26
617
7aefbddddaf9 alpaha of hocr server support
dwinter
parents: 613
diff changeset
27 if isinstance(node,list): #more than one text file if there is an attribute don't choose it
7aefbddddaf9 alpaha of hocr server support
dwinter
parents: 613
diff changeset
28 for nodeInList in node:
7aefbddddaf9 alpaha of hocr server support
dwinter
parents: 613
diff changeset
29 attr = nodeInList.get("@attr",None)
7aefbddddaf9 alpaha of hocr server support
dwinter
parents: 613
diff changeset
30 if attr is None:
7aefbddddaf9 alpaha of hocr server support
dwinter
parents: 613
diff changeset
31 return node.get('@text',None)
7aefbddddaf9 alpaha of hocr server support
dwinter
parents: 613
diff changeset
32 return None
7aefbddddaf9 alpaha of hocr server support
dwinter
parents: 613
diff changeset
33
561
9255acc4518d CLOSED - # 256: display texts from different backends (sandbox)
casties
parents: 560
diff changeset
34 return node
9255acc4518d CLOSED - # 256: display texts from different backends (sandbox)
casties
parents: 560
diff changeset
35
464
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
36 def getParentPath(path, cnt=1):
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
37 """returns pathname shortened by cnt"""
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
38 # make sure path doesn't end with /
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
39 path = path.rstrip('/')
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
40 # split by /, shorten, and reassemble
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
41 return '/'.join(path.split('/')[0:-cnt])
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
42
589
d8d6975cebcb more fixes for pf-parameter
casties
parents: 587
diff changeset
43 def getPnForPf(docinfo, pf, default=0):
d8d6975cebcb more fixes for pf-parameter
casties
parents: 587
diff changeset
44 """returns image number for image file name or default"""
587
6000c7e24d8a new parameter "pf" to specify image file name. (still some issues)
casties
parents: 585
diff changeset
45 if 'imgFileNames' in docinfo:
6000c7e24d8a new parameter "pf" to specify image file name. (still some issues)
casties
parents: 585
diff changeset
46 pn = docinfo['imgFileNames'].get(pf, None)
6000c7e24d8a new parameter "pf" to specify image file name. (still some issues)
casties
parents: 585
diff changeset
47 if pn is None:
6000c7e24d8a new parameter "pf" to specify image file name. (still some issues)
casties
parents: 585
diff changeset
48 # try to cut extension
6000c7e24d8a new parameter "pf" to specify image file name. (still some issues)
casties
parents: 585
diff changeset
49 xi = pf.rfind('.')
6000c7e24d8a new parameter "pf" to specify image file name. (still some issues)
casties
parents: 585
diff changeset
50 if xi > 0:
6000c7e24d8a new parameter "pf" to specify image file name. (still some issues)
casties
parents: 585
diff changeset
51 pf = pf[:xi]
6000c7e24d8a new parameter "pf" to specify image file name. (still some issues)
casties
parents: 585
diff changeset
52 # try again, else return 0
589
d8d6975cebcb more fixes for pf-parameter
casties
parents: 587
diff changeset
53 pn = docinfo['imgFileNames'].get(pf, default)
d8d6975cebcb more fixes for pf-parameter
casties
parents: 587
diff changeset
54 else:
d8d6975cebcb more fixes for pf-parameter
casties
parents: 587
diff changeset
55 # no extension
d8d6975cebcb more fixes for pf-parameter
casties
parents: 587
diff changeset
56 pn = default
587
6000c7e24d8a new parameter "pf" to specify image file name. (still some issues)
casties
parents: 585
diff changeset
57
6000c7e24d8a new parameter "pf" to specify image file name. (still some issues)
casties
parents: 585
diff changeset
58 return pn
6000c7e24d8a new parameter "pf" to specify image file name. (still some issues)
casties
parents: 585
diff changeset
59
589
d8d6975cebcb more fixes for pf-parameter
casties
parents: 587
diff changeset
60 return default
587
6000c7e24d8a new parameter "pf" to specify image file name. (still some issues)
casties
parents: 585
diff changeset
61
591
5850689ecfac ocrsearch layer for images.
casties
parents: 590
diff changeset
62 def getPfForPn(docinfo, pn, default=None):
5850689ecfac ocrsearch layer for images.
casties
parents: 590
diff changeset
63 """returns image file name for image number or default"""
5850689ecfac ocrsearch layer for images.
casties
parents: 590
diff changeset
64 if 'imgFileIndexes' in docinfo:
5850689ecfac ocrsearch layer for images.
casties
parents: 590
diff changeset
65 pn = docinfo['imgFileIndexes'].get(pn, default)
5850689ecfac ocrsearch layer for images.
casties
parents: 590
diff changeset
66 return pn
5850689ecfac ocrsearch layer for images.
casties
parents: 590
diff changeset
67
5850689ecfac ocrsearch layer for images.
casties
parents: 590
diff changeset
68 return default
5850689ecfac ocrsearch layer for images.
casties
parents: 590
diff changeset
69
585
83eeed69793f new annotator layer for images.
casties
parents: 584
diff changeset
70
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
71 ##
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
72 ## documentViewer class
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
73 ##
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
74 class documentViewer(Folder):
0
dwinter
parents:
diff changeset
75 """document viewer"""
dwinter
parents:
diff changeset
76 meta_type="Document viewer"
dwinter
parents:
diff changeset
77
dwinter
parents:
diff changeset
78 security=ClassSecurityInfo()
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
79 manage_options=Folder.manage_options+(
507
3c01e8f4e72b renamed config tab in ZMI
casties
parents: 506
diff changeset
80 {'label':'Configuration','action':'changeDocumentViewerForm'},
0
dwinter
parents:
diff changeset
81 )
463
89ad327b4bbd more renovation
casties
parents: 462
diff changeset
82
89ad327b4bbd more renovation
casties
parents: 462
diff changeset
83 metadataService = None
89ad327b4bbd more renovation
casties
parents: 462
diff changeset
84 """MetaDataFolder instance"""
525
70c3ae5eac7c layers can have their own templates.
casties
parents: 518
diff changeset
85
0
dwinter
parents:
diff changeset
86
525
70c3ae5eac7c layers can have their own templates.
casties
parents: 518
diff changeset
87 #
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
88 # templates and forms
525
70c3ae5eac7c layers can have their own templates.
casties
parents: 518
diff changeset
89 #
70c3ae5eac7c layers can have their own templates.
casties
parents: 518
diff changeset
90 # viewMode templates
594
da7daa783df4 rearranged viewer templates into folder.
casties
parents: 593
diff changeset
91 viewer_text = PageTemplateFile('zpt/viewer/viewer_text', globals())
615
d6eca930a534 hocr viewer eingebaut
Dirk Wintergruen <dwinter@mpiwg-berlin.mpg.de>
parents: 613
diff changeset
92 viewer_hocr = PageTemplateFile('zpt/viewer/viewer_hocr', globals())
594
da7daa783df4 rearranged viewer templates into folder.
casties
parents: 593
diff changeset
93 viewer_xml = PageTemplateFile('zpt/viewer/viewer_xml', globals())
da7daa783df4 rearranged viewer templates into folder.
casties
parents: 593
diff changeset
94 viewer_image = PageTemplateFile('zpt/viewer/viewer_image', globals())
da7daa783df4 rearranged viewer templates into folder.
casties
parents: 593
diff changeset
95 viewer_index = PageTemplateFile('zpt/viewer/viewer_index', globals())
da7daa783df4 rearranged viewer templates into folder.
casties
parents: 593
diff changeset
96 viewer_thumbs = PageTemplateFile('zpt/viewer/viewer_thumbs', globals())
da7daa783df4 rearranged viewer templates into folder.
casties
parents: 593
diff changeset
97 viewer_indexonly = PageTemplateFile('zpt/viewer/viewer_indexonly', globals())
629
e36bf3226fde text image viewer eingecheckt
dwinter
parents: 626
diff changeset
98 viewer_text_image = PageTemplateFile('zpt/viewer/viewer_text_image', globals())
546
2928037f9a75 ASSIGNED - # 249: Annotations shared in groups
casties
parents: 543
diff changeset
99 # available layer types (annotator not default)
2928037f9a75 ASSIGNED - # 249: Annotations shared in groups
casties
parents: 543
diff changeset
100 builtinLayers = {'text': ['dict','search','gis'],
629
e36bf3226fde text image viewer eingecheckt
dwinter
parents: 626
diff changeset
101 'xml': None, 'image': None, 'index': ['extended'],'text_image': ['dict'],}
526
3f375a048402 moved search and dict into separate layers.
casties
parents: 525
diff changeset
102 availableLayers = builtinLayers;
525
70c3ae5eac7c layers can have their own templates.
casties
parents: 518
diff changeset
103 # layer templates
594
da7daa783df4 rearranged viewer templates into folder.
casties
parents: 593
diff changeset
104 layer_text_dict = PageTemplateFile('zpt/viewer/layer_text_dict', globals())
629
e36bf3226fde text image viewer eingecheckt
dwinter
parents: 626
diff changeset
105 layer_text_image_dict = PageTemplateFile('zpt/viewer/layer_text_image_dict', globals())
594
da7daa783df4 rearranged viewer templates into folder.
casties
parents: 593
diff changeset
106 layer_text_search = PageTemplateFile('zpt/viewer/layer_text_search', globals())
da7daa783df4 rearranged viewer templates into folder.
casties
parents: 593
diff changeset
107 layer_text_annotator = PageTemplateFile('zpt/viewer/layer_text_annotator', globals())
da7daa783df4 rearranged viewer templates into folder.
casties
parents: 593
diff changeset
108 layer_text_gis = PageTemplateFile('zpt/viewer/layer_text_gis', globals())
da7daa783df4 rearranged viewer templates into folder.
casties
parents: 593
diff changeset
109 layer_text_pundit = PageTemplateFile('zpt/viewer/layer_text_pundit', globals())
da7daa783df4 rearranged viewer templates into folder.
casties
parents: 593
diff changeset
110 layer_image_annotator = PageTemplateFile('zpt/viewer/layer_image_annotator', globals())
da7daa783df4 rearranged viewer templates into folder.
casties
parents: 593
diff changeset
111 layer_image_search = PageTemplateFile('zpt/viewer/layer_image_search', globals())
da7daa783df4 rearranged viewer templates into folder.
casties
parents: 593
diff changeset
112 layer_index_extended = PageTemplateFile('zpt/viewer/layer_index_extended', globals())
525
70c3ae5eac7c layers can have their own templates.
casties
parents: 518
diff changeset
113 # toc templates
594
da7daa783df4 rearranged viewer templates into folder.
casties
parents: 593
diff changeset
114 toc_thumbs = PageTemplateFile('zpt/viewer/toc_thumbs', globals())
da7daa783df4 rearranged viewer templates into folder.
casties
parents: 593
diff changeset
115 toc_text = PageTemplateFile('zpt/viewer/toc_text', globals())
da7daa783df4 rearranged viewer templates into folder.
casties
parents: 593
diff changeset
116 toc_figures = PageTemplateFile('zpt/viewer/toc_figures', globals())
da7daa783df4 rearranged viewer templates into folder.
casties
parents: 593
diff changeset
117 toc_concordance = PageTemplateFile('zpt/viewer/toc_concordance', globals())
609
7962e6891d99 works with new notes and notesHandwritten.
casties
parents: 608
diff changeset
118 toc_notes = PageTemplateFile('zpt/viewer/toc_notes', globals())
594
da7daa783df4 rearranged viewer templates into folder.
casties
parents: 593
diff changeset
119 toc_handwritten = PageTemplateFile('zpt/viewer/toc_handwritten', globals())
da7daa783df4 rearranged viewer templates into folder.
casties
parents: 593
diff changeset
120 toc_none = PageTemplateFile('zpt/viewer/toc_none', globals())
525
70c3ae5eac7c layers can have their own templates.
casties
parents: 518
diff changeset
121 # other templates
594
da7daa783df4 rearranged viewer templates into folder.
casties
parents: 593
diff changeset
122 common_template = PageTemplateFile('zpt/viewer/common_template', globals())
da7daa783df4 rearranged viewer templates into folder.
casties
parents: 593
diff changeset
123 info_xml = PageTemplateFile('zpt/viewer/info_xml', globals())
487
8fd6f26fe29e more new templates
casties
parents: 486
diff changeset
124 docuviewer_css = ImageFile('css/docuviewer.css',globals())
532
0b8bed1223ad new layout and styles.
casties
parents: 530
diff changeset
125 # make docuviewer_css refreshable for development
490
6f116b86a226 more new template stuff. moved ImageFile index method to SrvTxtUtils
casties
parents: 489
diff changeset
126 docuviewer_css.index_html = refreshingImageFileIndexHtml
535
510bae2b593b more fixes, e.g. IE support. first version of index page.
casties
parents: 532
diff changeset
127 docuviewer_ie_css = ImageFile('css/docuviewer_ie.css',globals())
510bae2b593b more fixes, e.g. IE support. first version of index page.
casties
parents: 532
diff changeset
128 # make docuviewer_ie_css refreshable for development
585
83eeed69793f new annotator layer for images.
casties
parents: 584
diff changeset
129 #docuviewer_ie_css.index_html = refreshingImageFileIndexHtml
501
29c6d09a506c more cleanup.
casties
parents: 499
diff changeset
130 jquery_js = ImageFile('js/jquery.js',globals())
130
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
131
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
132
95
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
133 def __init__(self,id,imageScalerUrl=None,textServerName=None,title="",digilibBaseUrl=None,thumbcols=2,thumbrows=5,authgroups="mpiwg"):
0
dwinter
parents:
diff changeset
134 """init document viewer"""
dwinter
parents:
diff changeset
135 self.id=id
dwinter
parents:
diff changeset
136 self.title=title
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
137 self.thumbcols = thumbcols
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
138 self.thumbrows = thumbrows
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
139 # authgroups is list of authorized groups (delimited by ,)
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
140 self.authgroups = [s.strip().lower() for s in authgroups.split(',')]
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
141 # create template folder so we can always use template.something
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
142
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
143 templateFolder = Folder('template')
498
3146b4e7b6a5 more clean up.
casties
parents: 491
diff changeset
144 self['template'] = templateFolder # Zope-2.12 style
3146b4e7b6a5 more clean up.
casties
parents: 491
diff changeset
145 #self._setObject('template',templateFolder) # old style
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
146 try:
130
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
147 import MpdlXmlTextServer
132
39167e96e582 fixed creation of text server on __init__
casties
parents: 130
diff changeset
148 textServer = MpdlXmlTextServer.MpdlXmlTextServer(id='fulltextclient',serverName=textServerName)
498
3146b4e7b6a5 more clean up.
casties
parents: 491
diff changeset
149 templateFolder['fulltextclient'] = textServer
3146b4e7b6a5 more clean up.
casties
parents: 491
diff changeset
150 #templateFolder._setObject('fulltextclient',textServer)
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
151 except Exception, e:
130
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
152 logging.error("Unable to create MpdlXmlTextServer for fulltextclient: "+str(e))
463
89ad327b4bbd more renovation
casties
parents: 462
diff changeset
153
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
154 try:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
155 from Products.zogiLib.zogiLib import zogiLib
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
156 zogilib = zogiLib(id="zogilib", title="zogilib for docuviewer", dlServerURL=imageScalerUrl, layout="book")
498
3146b4e7b6a5 more clean up.
casties
parents: 491
diff changeset
157 templateFolder['zogilib'] = zogilib
3146b4e7b6a5 more clean up.
casties
parents: 491
diff changeset
158 #templateFolder._setObject('zogilib',zogilib)
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
159 except Exception, e:
607
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
160 logging.error("Unable to create zogiLib for 'zogilib': "+str(e))
463
89ad327b4bbd more renovation
casties
parents: 462
diff changeset
161
89ad327b4bbd more renovation
casties
parents: 462
diff changeset
162 try:
89ad327b4bbd more renovation
casties
parents: 462
diff changeset
163 # assume MetaDataFolder instance is called metadata
89ad327b4bbd more renovation
casties
parents: 462
diff changeset
164 self.metadataService = getattr(self, 'metadata')
89ad327b4bbd more renovation
casties
parents: 462
diff changeset
165 except Exception, e:
89ad327b4bbd more renovation
casties
parents: 462
diff changeset
166 logging.error("Unable to find MetaDataFolder 'metadata': "+str(e))
89ad327b4bbd more renovation
casties
parents: 462
diff changeset
167
477
17f0290b2327 small fixes.
casties
parents: 476
diff changeset
168 if digilibBaseUrl is not None:
17f0290b2327 small fixes.
casties
parents: 476
diff changeset
169 self.digilibBaseUrl = digilibBaseUrl
566
4a31608f8b0e more new MpiwgXmlTextServer.
casties
parents: 565
diff changeset
170 self.digilibScalerUrl = digilibBaseUrl + '/servlet/Scaler'
4a31608f8b0e more new MpiwgXmlTextServer.
casties
parents: 565
diff changeset
171 self.digilibViewerUrl = digilibBaseUrl + '/jquery/digilib.html'
477
17f0290b2327 small fixes.
casties
parents: 476
diff changeset
172
623
6012fe93f78c better scheme-less URL code.
casties
parents: 622
diff changeset
173
130
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
174 # proxy text server methods to fulltextclient
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
175 def getTextPage(self, **args):
498
3146b4e7b6a5 more clean up.
casties
parents: 491
diff changeset
176 """returns full text content of page"""
130
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
177 return self.template.fulltextclient.getTextPage(**args)
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
178
508
d5a47f82e755 more cleanup.
casties
parents: 507
diff changeset
179 def getSearchResults(self, **args):
d5a47f82e755 more cleanup.
casties
parents: 507
diff changeset
180 """loads list of search results and stores XML in docinfo"""
d5a47f82e755 more cleanup.
casties
parents: 507
diff changeset
181 return self.template.fulltextclient.getSearchResults(**args)
d5a47f82e755 more cleanup.
casties
parents: 507
diff changeset
182
d5a47f82e755 more cleanup.
casties
parents: 507
diff changeset
183 def getResultsPage(self, **args):
d5a47f82e755 more cleanup.
casties
parents: 507
diff changeset
184 """returns one page of the search results"""
d5a47f82e755 more cleanup.
casties
parents: 507
diff changeset
185 return self.template.fulltextclient.getResultsPage(**args)
d5a47f82e755 more cleanup.
casties
parents: 507
diff changeset
186
516
7d7b639d7be7 add methods to use doc-info.xql.
casties
parents: 514
diff changeset
187 def getTextInfo(self, **args):
7d7b639d7be7 add methods to use doc-info.xql.
casties
parents: 514
diff changeset
188 """returns document info from the text server"""
7d7b639d7be7 add methods to use doc-info.xql.
casties
parents: 514
diff changeset
189 return self.template.fulltextclient.getTextInfo(**args)
7d7b639d7be7 add methods to use doc-info.xql.
casties
parents: 514
diff changeset
190
499
3f9703746fef more cleanup. new template for viewMode=index (not pretty so far).
casties
parents: 498
diff changeset
191 def getToc(self, **args):
508
d5a47f82e755 more cleanup.
casties
parents: 507
diff changeset
192 """loads table of contents and stores XML in docinfo"""
499
3f9703746fef more cleanup. new template for viewMode=index (not pretty so far).
casties
parents: 498
diff changeset
193 return self.template.fulltextclient.getToc(**args)
3f9703746fef more cleanup. new template for viewMode=index (not pretty so far).
casties
parents: 498
diff changeset
194
3f9703746fef more cleanup. new template for viewMode=index (not pretty so far).
casties
parents: 498
diff changeset
195 def getTocPage(self, **args):
3f9703746fef more cleanup. new template for viewMode=index (not pretty so far).
casties
parents: 498
diff changeset
196 """returns one page of the table of contents"""
3f9703746fef more cleanup. new template for viewMode=index (not pretty so far).
casties
parents: 498
diff changeset
197 return self.template.fulltextclient.getTocPage(**args)
3f9703746fef more cleanup. new template for viewMode=index (not pretty so far).
casties
parents: 498
diff changeset
198
561
9255acc4518d CLOSED - # 256: display texts from different backends (sandbox)
casties
parents: 560
diff changeset
199 def getRepositoryType(self, **args):
9255acc4518d CLOSED - # 256: display texts from different backends (sandbox)
casties
parents: 560
diff changeset
200 """get repository type"""
9255acc4518d CLOSED - # 256: display texts from different backends (sandbox)
casties
parents: 560
diff changeset
201 return self.template.fulltextclient.getRepositoryType(**args)
9255acc4518d CLOSED - # 256: display texts from different backends (sandbox)
casties
parents: 560
diff changeset
202
559
eabfbad6aeb4 "extended" layer for index view and some bugfixes.
casties
parents: 558
diff changeset
203 def getTextDownloadUrl(self, **args):
610
0488cd12355b gis mode works again.
casties
parents: 609
diff changeset
204 """get URL to download the full text"""
559
eabfbad6aeb4 "extended" layer for index view and some bugfixes.
casties
parents: 558
diff changeset
205 return self.template.fulltextclient.getTextDownloadUrl(**args)
eabfbad6aeb4 "extended" layer for index view and some bugfixes.
casties
parents: 558
diff changeset
206
506
67014399894d cleaned out all 4suite code and weird methods.
casties
parents: 503
diff changeset
207 def getPlacesOnPage(self, **args):
67014399894d cleaned out all 4suite code and weird methods.
casties
parents: 503
diff changeset
208 """get list of gis places on one page"""
67014399894d cleaned out all 4suite code and weird methods.
casties
parents: 503
diff changeset
209 return self.template.fulltextclient.getPlacesOnPage(**args)
307
ec5e920a61e6 *** empty log message ***
abukhman
parents: 256
diff changeset
210
548
7acc919f52ff mode=filepath works again
casties
parents: 546
diff changeset
211 # Thumb list for CoolIris Plugin
499
3f9703746fef more cleanup. new template for viewMode=index (not pretty so far).
casties
parents: 498
diff changeset
212 thumbs_main_rss = PageTemplateFile('zpt/thumbs_main_rss', globals())
68
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
213 security.declareProtected('View','thumbs_rss')
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
214 def thumbs_rss(self,mode,url,viewMode="auto",start=None,pn=1):
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
215 '''
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
216 view it
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
217 @param mode: defines how to access the document behind url
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
218 @param url: url which contains display information
590
ed4485d2748e viewMode "images" changed to "image".
casties
parents: 589
diff changeset
219 @param viewMode: image: display images, text: display text, default is auto (try text, else image)
68
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
220
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
221 '''
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
222
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
223 if not hasattr(self, 'template'):
590
ed4485d2748e viewMode "images" changed to "image".
casties
parents: 589
diff changeset
224 # this won't work
ed4485d2748e viewMode "images" changed to "image".
casties
parents: 589
diff changeset
225 logging.error("template folder missing!")
ed4485d2748e viewMode "images" changed to "image".
casties
parents: 589
diff changeset
226 return "ERROR: template folder missing!"
ed4485d2748e viewMode "images" changed to "image".
casties
parents: 589
diff changeset
227
68
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
228 if not self.digilibBaseUrl:
623
6012fe93f78c better scheme-less URL code.
casties
parents: 622
diff changeset
229 self.digilibBaseUrl = self.findDigilibUrl() or "http://digilib.mpiwg-berlin.mpg.de/digitallibrary"
68
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
230
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
231 docinfo = self.getDocinfo(mode=mode,url=url)
338
0576f524e2ee *** empty log message ***
abukhman
parents: 337
diff changeset
232 #pageinfo = self.getPageinfo(start=start,current=pn,docinfo=docinfo)
587
6000c7e24d8a new parameter "pf" to specify image file name. (still some issues)
casties
parents: 585
diff changeset
233 pageinfo = self.getPageinfo(start=start,pn=pn, docinfo=docinfo)
331
6cde7f02786e *** empty log message ***
abukhman
parents: 330
diff changeset
234 ''' ZDES '''
68
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
235 pt = getattr(self.template, 'thumbs_main_rss')
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
236
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
237 if viewMode=="auto": # automodus gewaehlt
453
beb7ccb92564 first version using elementtree instead of 4suite xml
casties
parents: 405
diff changeset
238 if docinfo.has_key("textURL") or docinfo.get('textURLPath',None): #texturl gesetzt und textViewer konfiguriert
68
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
239 viewMode="text"
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
240 else:
590
ed4485d2748e viewMode "images" changed to "image".
casties
parents: 589
diff changeset
241 viewMode="image"
68
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
242
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
243 return pt(docinfo=docinfo,pageinfo=pageinfo,viewMode=viewMode)
465
224aad394350 really works with new getDocinfo
casties
parents: 464
diff changeset
244
68
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
245
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
246 security.declareProtected('View','index_html')
589
d8d6975cebcb more fixes for pf-parameter
casties
parents: 587
diff changeset
247 def index_html(self, url, mode="texttool", viewMode="auto", viewLayer=None, tocMode=None, start=None, pn=None, pf=None):
464
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
248 """
543
6cdc31e9ed8e fixed problem with dict-mode in default view.
casties
parents: 541
diff changeset
249 show page
471
415a7026eeda split viewMode in viewMode and viewType
casties
parents: 469
diff changeset
250 @param url: url which contains display information
57
7cdb0fc34a92 added getInfo_xml method
casties
parents: 55
diff changeset
251 @param mode: defines how to access the document behind url
615
d6eca930a534 hocr viewer eingebaut
Dirk Wintergruen <dwinter@mpiwg-berlin.mpg.de>
parents: 613
diff changeset
252 @param viewMode: 'image': display images, 'text': display text, 'xml': display xml, default is 'auto', 'hocr' : hocr format
543
6cdc31e9ed8e fixed problem with dict-mode in default view.
casties
parents: 541
diff changeset
253 @param viewLayer: sub-type of viewMode, e.g. layer 'dict' for viewMode='text'
99
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
254 @param tocMode: type of 'table of contents' for navigation (thumbs, text, figures, none)
464
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
255 """
0
dwinter
parents:
diff changeset
256
587
6000c7e24d8a new parameter "pf" to specify image file name. (still some issues)
casties
parents: 585
diff changeset
257 logging.debug("documentViewer(index_html) mode=%s url=%s viewMode=%s viewLayer=%s start=%s pn=%s pf=%s"%(mode,url,viewMode,viewLayer,start,pn,pf))
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
258
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
259 if not hasattr(self, 'template'):
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
260 # this won't work
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
261 logging.error("template folder missing!")
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
262 return "ERROR: template folder missing!"
617
7aefbddddaf9 alpaha of hocr server support
dwinter
parents: 613
diff changeset
263
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
264 if not getattr(self, 'digilibBaseUrl', None):
132
39167e96e582 fixed creation of text server on __init__
casties
parents: 130
diff changeset
265 self.digilibBaseUrl = self.findDigilibUrl() or "http://digilib.mpiwg-berlin.mpg.de/digitallibrary"
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
266
548
7acc919f52ff mode=filepath works again
casties
parents: 546
diff changeset
267 # mode=filepath should not have toc-thumbs
7acc919f52ff mode=filepath works again
casties
parents: 546
diff changeset
268 if tocMode is None:
7acc919f52ff mode=filepath works again
casties
parents: 546
diff changeset
269 if mode == "filepath":
7acc919f52ff mode=filepath works again
casties
parents: 546
diff changeset
270 tocMode = "none"
7acc919f52ff mode=filepath works again
casties
parents: 546
diff changeset
271 else:
7acc919f52ff mode=filepath works again
casties
parents: 546
diff changeset
272 tocMode = "thumbs"
7acc919f52ff mode=filepath works again
casties
parents: 546
diff changeset
273
543
6cdc31e9ed8e fixed problem with dict-mode in default view.
casties
parents: 541
diff changeset
274 # docinfo: information about document (cached)
518
91051b36b9cc uses xml info from doc-info.xql for table of contents now.
casties
parents: 516
diff changeset
275 docinfo = self.getDocinfo(mode=mode,url=url,tocMode=tocMode)
97
2b8fd19432fb Last update
abukhman
parents: 96
diff changeset
276
543
6cdc31e9ed8e fixed problem with dict-mode in default view.
casties
parents: 541
diff changeset
277 # userinfo: user settings (cached)
6cdc31e9ed8e fixed problem with dict-mode in default view.
casties
parents: 541
diff changeset
278 userinfo = self.getUserinfo()
6cdc31e9ed8e fixed problem with dict-mode in default view.
casties
parents: 541
diff changeset
279
471
415a7026eeda split viewMode in viewMode and viewType
casties
parents: 469
diff changeset
280 # auto viewMode: text if there is a text else images
455
0a53fea83df7 more work renovating
casties
parents: 454
diff changeset
281 if viewMode=="auto":
530
5c7433c2515c fix problems with texttool/text
casties
parents: 528
diff changeset
282 if docinfo.get('textURLPath', None):
5c7433c2515c fix problems with texttool/text
casties
parents: 528
diff changeset
283 # docinfo.get('textURL', None) not implemented yet
471
415a7026eeda split viewMode in viewMode and viewType
casties
parents: 469
diff changeset
284 viewMode = "text"
543
6cdc31e9ed8e fixed problem with dict-mode in default view.
casties
parents: 541
diff changeset
285 if viewLayer is None and 'viewLayer' not in userinfo:
6cdc31e9ed8e fixed problem with dict-mode in default view.
casties
parents: 541
diff changeset
286 # use layer dict as default
508
d5a47f82e755 more cleanup.
casties
parents: 507
diff changeset
287 viewLayer = "dict"
51
c5d3aabbf61b textviewer now integrated, new modus auto introduced as standard for viewing
dwinter
parents: 50
diff changeset
288 else:
590
ed4485d2748e viewMode "images" changed to "image".
casties
parents: 589
diff changeset
289 viewMode = "image"
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
290
474
0bc4a153863a more cleanup (before reversing macro order)
casties
parents: 473
diff changeset
291 elif viewMode == "text_dict":
0bc4a153863a more cleanup (before reversing macro order)
casties
parents: 473
diff changeset
292 # legacy fix
0bc4a153863a more cleanup (before reversing macro order)
casties
parents: 473
diff changeset
293 viewMode = "text"
503
030251fe9dbc more cleanup.
casties
parents: 501
diff changeset
294 viewLayer = "dict"
474
0bc4a153863a more cleanup (before reversing macro order)
casties
parents: 473
diff changeset
295
590
ed4485d2748e viewMode "images" changed to "image".
casties
parents: 589
diff changeset
296 elif viewMode == 'images':
ed4485d2748e viewMode "images" changed to "image".
casties
parents: 589
diff changeset
297 # legacy fix
ed4485d2748e viewMode "images" changed to "image".
casties
parents: 589
diff changeset
298 viewMode = 'image'
ed4485d2748e viewMode "images" changed to "image".
casties
parents: 589
diff changeset
299 self.REQUEST['viewMode'] = 'image'
ed4485d2748e viewMode "images" changed to "image".
casties
parents: 589
diff changeset
300
543
6cdc31e9ed8e fixed problem with dict-mode in default view.
casties
parents: 541
diff changeset
301 # safe viewLayer in userinfo
6cdc31e9ed8e fixed problem with dict-mode in default view.
casties
parents: 541
diff changeset
302 userinfo['viewLayer'] = viewLayer
548
7acc919f52ff mode=filepath works again
casties
parents: 546
diff changeset
303
543
6cdc31e9ed8e fixed problem with dict-mode in default view.
casties
parents: 541
diff changeset
304 # pageinfo: information about page (not cached)
587
6000c7e24d8a new parameter "pf" to specify image file name. (still some issues)
casties
parents: 585
diff changeset
305 pageinfo = self.getPageinfo(start=start, pn=pn, pf=pf, docinfo=docinfo, userinfo=userinfo, viewMode=viewMode, viewLayer=viewLayer, tocMode=tocMode)
469
15394486ab75 working with new templates
casties
parents: 468
diff changeset
306
475
5a3ab27385ce more new template stuff
casties
parents: 474
diff changeset
307 # get template /template/viewer_$viewMode
5a3ab27385ce more new template stuff
casties
parents: 474
diff changeset
308 pt = getattr(self.template, 'viewer_%s'%viewMode, None)
5a3ab27385ce more new template stuff
casties
parents: 474
diff changeset
309 if pt is None:
5a3ab27385ce more new template stuff
casties
parents: 474
diff changeset
310 logging.error("No template for viewMode=%s!"%viewMode)
5a3ab27385ce more new template stuff
casties
parents: 474
diff changeset
311 # TODO: error page?
5a3ab27385ce more new template stuff
casties
parents: 474
diff changeset
312 return "No template for viewMode=%s!"%viewMode
5a3ab27385ce more new template stuff
casties
parents: 474
diff changeset
313
455
0a53fea83df7 more work renovating
casties
parents: 454
diff changeset
314 # and execute with parameters
471
415a7026eeda split viewMode in viewMode and viewType
casties
parents: 469
diff changeset
315 return pt(docinfo=docinfo, pageinfo=pageinfo)
0
dwinter
parents:
diff changeset
316
525
70c3ae5eac7c layers can have their own templates.
casties
parents: 518
diff changeset
317 def getAvailableLayers(self):
70c3ae5eac7c layers can have their own templates.
casties
parents: 518
diff changeset
318 """returns dict with list of available layers per viewMode"""
70c3ae5eac7c layers can have their own templates.
casties
parents: 518
diff changeset
319 return self.availableLayers
70c3ae5eac7c layers can have their own templates.
casties
parents: 518
diff changeset
320
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
321 def findDigilibUrl(self):
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
322 """try to get the digilib URL from zogilib"""
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
323 url = self.template.zogilib.getDLBaseUrl()
624
80a0191ae51c move sslification to only client-visible urls.
casties
parents: 623
diff changeset
324 return url
480
50a28442f21c more new template stuff
casties
parents: 479
diff changeset
325
50a28442f21c more new template stuff
casties
parents: 479
diff changeset
326 def getScalerUrl(self, fn=None, pn=None, dw=100, dh=100, docinfo=None):
50a28442f21c more new template stuff
casties
parents: 479
diff changeset
327 """returns URL to digilib Scaler with params"""
50a28442f21c more new template stuff
casties
parents: 479
diff changeset
328 url = None
50a28442f21c more new template stuff
casties
parents: 479
diff changeset
329 if docinfo is not None:
50a28442f21c more new template stuff
casties
parents: 479
diff changeset
330 url = docinfo.get('imageURL', None)
50a28442f21c more new template stuff
casties
parents: 479
diff changeset
331
50a28442f21c more new template stuff
casties
parents: 479
diff changeset
332 if url is None:
566
4a31608f8b0e more new MpiwgXmlTextServer.
casties
parents: 565
diff changeset
333 url = self.digilibScalerUrl
480
50a28442f21c more new template stuff
casties
parents: 479
diff changeset
334 if fn is None and docinfo is not None:
50a28442f21c more new template stuff
casties
parents: 479
diff changeset
335 fn = docinfo.get('imagePath','')
50a28442f21c more new template stuff
casties
parents: 479
diff changeset
336
50a28442f21c more new template stuff
casties
parents: 479
diff changeset
337 url += "fn=%s"%fn
50a28442f21c more new template stuff
casties
parents: 479
diff changeset
338
50a28442f21c more new template stuff
casties
parents: 479
diff changeset
339 if pn:
50a28442f21c more new template stuff
casties
parents: 479
diff changeset
340 url += "&pn=%s"%pn
50a28442f21c more new template stuff
casties
parents: 479
diff changeset
341
50a28442f21c more new template stuff
casties
parents: 479
diff changeset
342 url += "&dw=%s&dh=%s"%(dw,dh)
624
80a0191ae51c move sslification to only client-visible urls.
casties
parents: 623
diff changeset
343 return sslifyUrl(url, self, force=True)
126
c6dcf12e3807 added method to get url of viewer instance
casties
parents: 124
diff changeset
344
c6dcf12e3807 added method to get url of viewer instance
casties
parents: 124
diff changeset
345 def getDocumentViewerURL(self):
c6dcf12e3807 added method to get url of viewer instance
casties
parents: 124
diff changeset
346 """returns the URL of this instance"""
c6dcf12e3807 added method to get url of viewer instance
casties
parents: 124
diff changeset
347 return self.absolute_url()
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
348
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
349 def getStyle(self, idx, selected, style=""):
480
50a28442f21c more new template stuff
casties
parents: 479
diff changeset
350 """returns a string with the given style and append 'sel' if idx == selected."""
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
351 #logger("documentViewer (getstyle)", logging.INFO, "idx: %s selected: %s style: %s"%(idx,selected,style))
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
352 if idx == selected:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
353 return style + 'sel'
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
354 else:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
355 return style
74
dwinter
parents: 73
diff changeset
356
478
cd37d6f8d5e8 more cleanup
casties
parents: 477
diff changeset
357 def getParams(self, param=None, val=None, params=None, duplicates=None):
469
15394486ab75 working with new templates
casties
parents: 468
diff changeset
358 """returns dict with URL parameters.
15394486ab75 working with new templates
casties
parents: 468
diff changeset
359
15394486ab75 working with new templates
casties
parents: 468
diff changeset
360 Takes URL parameters and additionally param=val or dict params.
15394486ab75 working with new templates
casties
parents: 468
diff changeset
361 Deletes key if value is None."""
453
beb7ccb92564 first version using elementtree instead of 4suite xml
casties
parents: 405
diff changeset
362 # copy existing request params
469
15394486ab75 working with new templates
casties
parents: 468
diff changeset
363 newParams=self.REQUEST.form.copy()
453
beb7ccb92564 first version using elementtree instead of 4suite xml
casties
parents: 405
diff changeset
364 # change single param
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
365 if param is not None:
31
c6451e8d5d23 more small fixes - now version 0.2.2
casties
parents: 29
diff changeset
366 if val is None:
469
15394486ab75 working with new templates
casties
parents: 468
diff changeset
367 if newParams.has_key(param):
15394486ab75 working with new templates
casties
parents: 468
diff changeset
368 del newParams[param]
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
369 else:
469
15394486ab75 working with new templates
casties
parents: 468
diff changeset
370 newParams[param] = str(val)
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
371
453
beb7ccb92564 first version using elementtree instead of 4suite xml
casties
parents: 405
diff changeset
372 # change more params
beb7ccb92564 first version using elementtree instead of 4suite xml
casties
parents: 405
diff changeset
373 if params is not None:
478
cd37d6f8d5e8 more cleanup
casties
parents: 477
diff changeset
374 for (k, v) in params.items():
453
beb7ccb92564 first version using elementtree instead of 4suite xml
casties
parents: 405
diff changeset
375 if v is None:
beb7ccb92564 first version using elementtree instead of 4suite xml
casties
parents: 405
diff changeset
376 # val=None removes param
469
15394486ab75 working with new templates
casties
parents: 468
diff changeset
377 if newParams.has_key(k):
15394486ab75 working with new templates
casties
parents: 468
diff changeset
378 del newParams[k]
453
beb7ccb92564 first version using elementtree instead of 4suite xml
casties
parents: 405
diff changeset
379
beb7ccb92564 first version using elementtree instead of 4suite xml
casties
parents: 405
diff changeset
380 else:
469
15394486ab75 working with new templates
casties
parents: 468
diff changeset
381 newParams[k] = v
478
cd37d6f8d5e8 more cleanup
casties
parents: 477
diff changeset
382
cd37d6f8d5e8 more cleanup
casties
parents: 477
diff changeset
383 if duplicates:
cd37d6f8d5e8 more cleanup
casties
parents: 477
diff changeset
384 # eliminate lists (coming from duplicate keys)
cd37d6f8d5e8 more cleanup
casties
parents: 477
diff changeset
385 for (k,v) in newParams.items():
cd37d6f8d5e8 more cleanup
casties
parents: 477
diff changeset
386 if isinstance(v, list):
cd37d6f8d5e8 more cleanup
casties
parents: 477
diff changeset
387 if duplicates == 'comma':
cd37d6f8d5e8 more cleanup
casties
parents: 477
diff changeset
388 # make comma-separated list of non-empty entries
cd37d6f8d5e8 more cleanup
casties
parents: 477
diff changeset
389 newParams[k] = ','.join([t for t in v if t])
cd37d6f8d5e8 more cleanup
casties
parents: 477
diff changeset
390 elif duplicates == 'first':
cd37d6f8d5e8 more cleanup
casties
parents: 477
diff changeset
391 # take first non-empty entry
cd37d6f8d5e8 more cleanup
casties
parents: 477
diff changeset
392 newParams[k] = [t for t in v if t][0]
cd37d6f8d5e8 more cleanup
casties
parents: 477
diff changeset
393
469
15394486ab75 working with new templates
casties
parents: 468
diff changeset
394 return newParams
15394486ab75 working with new templates
casties
parents: 468
diff changeset
395
478
cd37d6f8d5e8 more cleanup
casties
parents: 477
diff changeset
396 def getLink(self, param=None, val=None, params=None, baseUrl=None, paramSep='&', duplicates='comma'):
469
15394486ab75 working with new templates
casties
parents: 468
diff changeset
397 """returns URL to documentviewer with parameter param set to val or from dict params"""
478
cd37d6f8d5e8 more cleanup
casties
parents: 477
diff changeset
398 urlParams = self.getParams(param=param, val=val, params=params, duplicates=duplicates)
453
beb7ccb92564 first version using elementtree instead of 4suite xml
casties
parents: 405
diff changeset
399 # quote values and assemble into query string (not escaping '/')
514
c55e376be01b search works even with unicode...
casties
parents: 513
diff changeset
400 ps = paramSep.join(["%s=%s"%(k, urllib.quote_plus(utf8ify(v), '/')) for (k, v) in urlParams.items()])
453
beb7ccb92564 first version using elementtree instead of 4suite xml
casties
parents: 405
diff changeset
401 if baseUrl is None:
469
15394486ab75 working with new templates
casties
parents: 468
diff changeset
402 baseUrl = self.getDocumentViewerURL()
453
beb7ccb92564 first version using elementtree instead of 4suite xml
casties
parents: 405
diff changeset
403
beb7ccb92564 first version using elementtree instead of 4suite xml
casties
parents: 405
diff changeset
404 url = "%s?%s"%(baseUrl, ps)
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
405 return url
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
406
478
cd37d6f8d5e8 more cleanup
casties
parents: 477
diff changeset
407 def getLinkAmp(self, param=None, val=None, params=None, baseUrl=None, duplicates='comma'):
68
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
408 """link to documentviewer with parameter param set to val"""
478
cd37d6f8d5e8 more cleanup
casties
parents: 477
diff changeset
409 return self.getLink(param=param, val=val, params=params, baseUrl=baseUrl, paramSep='&amp;', duplicates=duplicates)
81
fae97f071724 fixed problem with info.xml when url without index.meta
casties
parents: 79
diff changeset
410
526
3f375a048402 moved search and dict into separate layers.
casties
parents: 525
diff changeset
411
3f375a048402 moved search and dict into separate layers.
casties
parents: 525
diff changeset
412 def setAvailableLayers(self, newLayerString=None):
3f375a048402 moved search and dict into separate layers.
casties
parents: 525
diff changeset
413 """sets availableLayers to newLayerString or tries to autodetect available layers.
3f375a048402 moved search and dict into separate layers.
casties
parents: 525
diff changeset
414 assumes layer templates have the form layer_{m}_{l} for layer l in mode m.
3f375a048402 moved search and dict into separate layers.
casties
parents: 525
diff changeset
415 newLayerString is parsed as JSON."""
3f375a048402 moved search and dict into separate layers.
casties
parents: 525
diff changeset
416 if newLayerString is not None:
3f375a048402 moved search and dict into separate layers.
casties
parents: 525
diff changeset
417 try:
3f375a048402 moved search and dict into separate layers.
casties
parents: 525
diff changeset
418 layers = json.loads(newLayerString)
590
ed4485d2748e viewMode "images" changed to "image".
casties
parents: 589
diff changeset
419 if 'text' in layers and 'image' in layers:
526
3f375a048402 moved search and dict into separate layers.
casties
parents: 525
diff changeset
420 self.availableLayers = layers
3f375a048402 moved search and dict into separate layers.
casties
parents: 525
diff changeset
421 return
3f375a048402 moved search and dict into separate layers.
casties
parents: 525
diff changeset
422 except:
3f375a048402 moved search and dict into separate layers.
casties
parents: 525
diff changeset
423 pass
3f375a048402 moved search and dict into separate layers.
casties
parents: 525
diff changeset
424
3f375a048402 moved search and dict into separate layers.
casties
parents: 525
diff changeset
425 logging.error("invalid layers=%s! autodetecting..."%repr(newLayerString))
3f375a048402 moved search and dict into separate layers.
casties
parents: 525
diff changeset
426
3f375a048402 moved search and dict into separate layers.
casties
parents: 525
diff changeset
427 # start with builtin layers
3f375a048402 moved search and dict into separate layers.
casties
parents: 525
diff changeset
428 self.availableLayers = self.builtinLayers.copy()
3f375a048402 moved search and dict into separate layers.
casties
parents: 525
diff changeset
429 # add layers from templates
3f375a048402 moved search and dict into separate layers.
casties
parents: 525
diff changeset
430 for t in self.template:
3f375a048402 moved search and dict into separate layers.
casties
parents: 525
diff changeset
431 if t.startswith('layer_'):
3f375a048402 moved search and dict into separate layers.
casties
parents: 525
diff changeset
432 try:
3f375a048402 moved search and dict into separate layers.
casties
parents: 525
diff changeset
433 (x, m, l) = t.split('_', 3)
3f375a048402 moved search and dict into separate layers.
casties
parents: 525
diff changeset
434 if m not in self.availableLayers:
3f375a048402 moved search and dict into separate layers.
casties
parents: 525
diff changeset
435 # mode m doesn't exist -> new list
3f375a048402 moved search and dict into separate layers.
casties
parents: 525
diff changeset
436 self.availableLayers[m] = [l]
3f375a048402 moved search and dict into separate layers.
casties
parents: 525
diff changeset
437
3f375a048402 moved search and dict into separate layers.
casties
parents: 525
diff changeset
438 else:
3f375a048402 moved search and dict into separate layers.
casties
parents: 525
diff changeset
439 # m exists -> append
3f375a048402 moved search and dict into separate layers.
casties
parents: 525
diff changeset
440 if l not in self.availableLayers[m]:
3f375a048402 moved search and dict into separate layers.
casties
parents: 525
diff changeset
441 self.availableLayers[m].append()
3f375a048402 moved search and dict into separate layers.
casties
parents: 525
diff changeset
442
3f375a048402 moved search and dict into separate layers.
casties
parents: 525
diff changeset
443 except:
3f375a048402 moved search and dict into separate layers.
casties
parents: 525
diff changeset
444 pass
3f375a048402 moved search and dict into separate layers.
casties
parents: 525
diff changeset
445
3f375a048402 moved search and dict into separate layers.
casties
parents: 525
diff changeset
446 def getAvailableLayersJson(self):
3f375a048402 moved search and dict into separate layers.
casties
parents: 525
diff changeset
447 """returns available layers as JSON string."""
3f375a048402 moved search and dict into separate layers.
casties
parents: 525
diff changeset
448 return json.dumps(self.availableLayers)
3f375a048402 moved search and dict into separate layers.
casties
parents: 525
diff changeset
449
469
15394486ab75 working with new templates
casties
parents: 468
diff changeset
450
57
7cdb0fc34a92 added getInfo_xml method
casties
parents: 55
diff changeset
451 def getInfo_xml(self,url,mode):
7cdb0fc34a92 added getInfo_xml method
casties
parents: 55
diff changeset
452 """returns info about the document as XML"""
7cdb0fc34a92 added getInfo_xml method
casties
parents: 55
diff changeset
453 if not self.digilibBaseUrl:
514
c55e376be01b search works even with unicode...
casties
parents: 513
diff changeset
454 self.digilibBaseUrl = self.findDigilibUrl() or "http://digilib.mpiwg-berlin.mpg.de/digitallibrary"
57
7cdb0fc34a92 added getInfo_xml method
casties
parents: 55
diff changeset
455
7cdb0fc34a92 added getInfo_xml method
casties
parents: 55
diff changeset
456 docinfo = self.getDocinfo(mode=mode,url=url)
7cdb0fc34a92 added getInfo_xml method
casties
parents: 55
diff changeset
457 pt = getattr(self.template, 'info_xml')
7cdb0fc34a92 added getInfo_xml method
casties
parents: 55
diff changeset
458 return pt(docinfo=docinfo)
7cdb0fc34a92 added getInfo_xml method
casties
parents: 55
diff changeset
459
528
f8a5f63eafc0 new viewMode=thumbs.
casties
parents: 526
diff changeset
460 def getAuthenticatedUser(self, anon=None):
f8a5f63eafc0 new viewMode=thumbs.
casties
parents: 526
diff changeset
461 """returns the authenticated user object or None. (ignores Zopes anonymous user)"""
f8a5f63eafc0 new viewMode=thumbs.
casties
parents: 526
diff changeset
462 user = getSecurityManager().getUser()
f8a5f63eafc0 new viewMode=thumbs.
casties
parents: 526
diff changeset
463 if user is not None and user.getUserName() != "Anonymous User":
f8a5f63eafc0 new viewMode=thumbs.
casties
parents: 526
diff changeset
464 return user
f8a5f63eafc0 new viewMode=thumbs.
casties
parents: 526
diff changeset
465 else:
f8a5f63eafc0 new viewMode=thumbs.
casties
parents: 526
diff changeset
466 return anon
f8a5f63eafc0 new viewMode=thumbs.
casties
parents: 526
diff changeset
467
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
468 def isAccessible(self, docinfo):
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
469 """returns if access to the resource is granted"""
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
470 access = docinfo.get('accessType', None)
167
7e2b97941a66 characterNormalization
abukhman
parents: 166
diff changeset
471 logging.debug("documentViewer (accessOK) access type %s"%access)
465
224aad394350 really works with new getDocinfo
casties
parents: 464
diff changeset
472 if access == 'free':
167
7e2b97941a66 characterNormalization
abukhman
parents: 166
diff changeset
473 logging.debug("documentViewer (accessOK) access is free")
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
474 return True
465
224aad394350 really works with new getDocinfo
casties
parents: 464
diff changeset
475
45
0391fe75aef3 fixed handling of documents with missing access tag
casties
parents: 43
diff changeset
476 elif access is None or access in self.authgroups:
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
477 # only local access -- only logged in users
528
f8a5f63eafc0 new viewMode=thumbs.
casties
parents: 526
diff changeset
478 user = self.getAuthenticatedUser()
167
7e2b97941a66 characterNormalization
abukhman
parents: 166
diff changeset
479 logging.debug("documentViewer (accessOK) user=%s ip=%s"%(user,self.REQUEST.getClientAddr()))
528
f8a5f63eafc0 new viewMode=thumbs.
casties
parents: 526
diff changeset
480 return (user is not None)
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
481
167
7e2b97941a66 characterNormalization
abukhman
parents: 166
diff changeset
482 logging.error("documentViewer (accessOK) unknown access type %s"%access)
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
483 return False
464
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
484
543
6cdc31e9ed8e fixed problem with dict-mode in default view.
casties
parents: 541
diff changeset
485 def getUserinfo(self):
6cdc31e9ed8e fixed problem with dict-mode in default view.
casties
parents: 541
diff changeset
486 """returns userinfo object"""
6cdc31e9ed8e fixed problem with dict-mode in default view.
casties
parents: 541
diff changeset
487 logging.debug("getUserinfo")
6cdc31e9ed8e fixed problem with dict-mode in default view.
casties
parents: 541
diff changeset
488 userinfo = {}
6cdc31e9ed8e fixed problem with dict-mode in default view.
casties
parents: 541
diff changeset
489 # look for cached userinfo in session
6cdc31e9ed8e fixed problem with dict-mode in default view.
casties
parents: 541
diff changeset
490 if self.REQUEST.SESSION.has_key('userinfo'):
6cdc31e9ed8e fixed problem with dict-mode in default view.
casties
parents: 541
diff changeset
491 userinfo = self.REQUEST.SESSION['userinfo']
6cdc31e9ed8e fixed problem with dict-mode in default view.
casties
parents: 541
diff changeset
492 # check if its still current?
6cdc31e9ed8e fixed problem with dict-mode in default view.
casties
parents: 541
diff changeset
493 else:
6cdc31e9ed8e fixed problem with dict-mode in default view.
casties
parents: 541
diff changeset
494 # store in session
6cdc31e9ed8e fixed problem with dict-mode in default view.
casties
parents: 541
diff changeset
495 self.REQUEST.SESSION['userinfo'] = userinfo
6cdc31e9ed8e fixed problem with dict-mode in default view.
casties
parents: 541
diff changeset
496
6cdc31e9ed8e fixed problem with dict-mode in default view.
casties
parents: 541
diff changeset
497 return userinfo
6cdc31e9ed8e fixed problem with dict-mode in default view.
casties
parents: 541
diff changeset
498
612
a79e4e4b3e37 json schnittsellen
dwinter
parents: 610
diff changeset
499 def getDocinfoJSON(self, mode, url, tocMode=None):
a79e4e4b3e37 json schnittsellen
dwinter
parents: 610
diff changeset
500 """returns docinfo depending on mode"""
a79e4e4b3e37 json schnittsellen
dwinter
parents: 610
diff changeset
501 import json
a79e4e4b3e37 json schnittsellen
dwinter
parents: 610
diff changeset
502
a79e4e4b3e37 json schnittsellen
dwinter
parents: 610
diff changeset
503 dc = self.getDocinfo( mode, url, tocMode)
a79e4e4b3e37 json schnittsellen
dwinter
parents: 610
diff changeset
504
a79e4e4b3e37 json schnittsellen
dwinter
parents: 610
diff changeset
505 return json.dumps(dc)
a79e4e4b3e37 json schnittsellen
dwinter
parents: 610
diff changeset
506
a79e4e4b3e37 json schnittsellen
dwinter
parents: 610
diff changeset
507
518
91051b36b9cc uses xml info from doc-info.xql for table of contents now.
casties
parents: 516
diff changeset
508 def getDocinfo(self, mode, url, tocMode=None):
464
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
509 """returns docinfo depending on mode"""
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
510 logging.debug("getDocinfo: mode=%s, url=%s"%(mode,url))
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
511 # look for cached docinfo in session
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
512 if self.REQUEST.SESSION.has_key('docinfo'):
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
513 docinfo = self.REQUEST.SESSION['docinfo']
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
514 # check if its still current
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
515 if docinfo is not None and docinfo.get('mode', None) == mode and docinfo.get('url', None) == url:
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
516 logging.debug("getDocinfo: docinfo in session. keys=%s"%docinfo.keys())
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
517 return docinfo
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
518
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
519 # new docinfo
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
520 docinfo = {'mode': mode, 'url': url}
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
521 # add self url
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
522 docinfo['viewerUrl'] = self.getDocumentViewerURL()
625
80a3b1fa5705 more move sslification to only client-visible urls.
casties
parents: 624
diff changeset
523 docinfo['digilibBaseUrl'] = sslifyUrl(self.digilibBaseUrl, self, force=True)
80a3b1fa5705 more move sslification to only client-visible urls.
casties
parents: 624
diff changeset
524 docinfo['digilibScalerUrl'] = sslifyUrl(self.digilibScalerUrl, self, force=True)
80a3b1fa5705 more move sslification to only client-visible urls.
casties
parents: 624
diff changeset
525 docinfo['digilibViewerUrl'] = sslifyUrl(self.digilibViewerUrl, self, force=True)
464
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
526 # get index.meta DOM
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
527 docUrl = None
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
528 metaDom = None
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
529 if mode=="texttool":
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
530 # url points to document dir or index.meta
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
531 metaDom = self.metadataService.getDomFromPathOrUrl(url)
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
532 if metaDom is None:
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
533 raise IOError("Unable to find index.meta for mode=texttool!")
580
0806cb9061c1 fixed another bug when url starts with /mpiwg/online/
casties
parents: 578
diff changeset
534
0806cb9061c1 fixed another bug when url starts with /mpiwg/online/
casties
parents: 578
diff changeset
535 docUrl = url.replace('/index.meta', '')
0806cb9061c1 fixed another bug when url starts with /mpiwg/online/
casties
parents: 578
diff changeset
536 if url.startswith('/mpiwg/online/'):
0806cb9061c1 fixed another bug when url starts with /mpiwg/online/
casties
parents: 578
diff changeset
537 docUrl = url.replace('/mpiwg/online/', '', 1)
464
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
538
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
539 elif mode=="imagepath":
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
540 # url points to folder with images, index.meta optional
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
541 # asssume index.meta in parent dir
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
542 docUrl = getParentPath(url)
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
543 metaDom = self.metadataService.getDomFromPathOrUrl(docUrl)
599
3b79ae4a23ca normalize uri of annotated image.
casties
parents: 594
diff changeset
544 docinfo['imagePath'] = url.replace('/mpiwg/online', '', 1)
615
d6eca930a534 hocr viewer eingebaut
Dirk Wintergruen <dwinter@mpiwg-berlin.mpg.de>
parents: 613
diff changeset
545
d6eca930a534 hocr viewer eingebaut
Dirk Wintergruen <dwinter@mpiwg-berlin.mpg.de>
parents: 613
diff changeset
546 elif mode=="hocr":
d6eca930a534 hocr viewer eingebaut
Dirk Wintergruen <dwinter@mpiwg-berlin.mpg.de>
parents: 613
diff changeset
547 # url points to folder with images, index.meta optional
d6eca930a534 hocr viewer eingebaut
Dirk Wintergruen <dwinter@mpiwg-berlin.mpg.de>
parents: 613
diff changeset
548 # asssume index.meta in parent dir
d6eca930a534 hocr viewer eingebaut
Dirk Wintergruen <dwinter@mpiwg-berlin.mpg.de>
parents: 613
diff changeset
549 docUrl = getParentPath(url)
d6eca930a534 hocr viewer eingebaut
Dirk Wintergruen <dwinter@mpiwg-berlin.mpg.de>
parents: 613
diff changeset
550 metaDom = self.metadataService.getDomFromPathOrUrl(docUrl)
d6eca930a534 hocr viewer eingebaut
Dirk Wintergruen <dwinter@mpiwg-berlin.mpg.de>
parents: 613
diff changeset
551 docinfo['imagePath'] = url.replace('/mpiwg/online', '', 1)
d6eca930a534 hocr viewer eingebaut
Dirk Wintergruen <dwinter@mpiwg-berlin.mpg.de>
parents: 613
diff changeset
552 docinfo['textURLPath'] = url.replace('/mpiwg/online', '', 1)
d6eca930a534 hocr viewer eingebaut
Dirk Wintergruen <dwinter@mpiwg-berlin.mpg.de>
parents: 613
diff changeset
553 if docinfo.get("creator", None) is None:
d6eca930a534 hocr viewer eingebaut
Dirk Wintergruen <dwinter@mpiwg-berlin.mpg.de>
parents: 613
diff changeset
554 docinfo['creator'] = ""
d6eca930a534 hocr viewer eingebaut
Dirk Wintergruen <dwinter@mpiwg-berlin.mpg.de>
parents: 613
diff changeset
555
d6eca930a534 hocr viewer eingebaut
Dirk Wintergruen <dwinter@mpiwg-berlin.mpg.de>
parents: 613
diff changeset
556 if docinfo.get("title", None) is None:
d6eca930a534 hocr viewer eingebaut
Dirk Wintergruen <dwinter@mpiwg-berlin.mpg.de>
parents: 613
diff changeset
557 docinfo['title'] = ""
d6eca930a534 hocr viewer eingebaut
Dirk Wintergruen <dwinter@mpiwg-berlin.mpg.de>
parents: 613
diff changeset
558
d6eca930a534 hocr viewer eingebaut
Dirk Wintergruen <dwinter@mpiwg-berlin.mpg.de>
parents: 613
diff changeset
559 if docinfo.get("documentPath", None) is None:
d6eca930a534 hocr viewer eingebaut
Dirk Wintergruen <dwinter@mpiwg-berlin.mpg.de>
parents: 613
diff changeset
560 docinfo['documentPath'] = url.replace('/mpiwg/online', '', 1)
d6eca930a534 hocr viewer eingebaut
Dirk Wintergruen <dwinter@mpiwg-berlin.mpg.de>
parents: 613
diff changeset
561 docinfo['documentPath'] = url.replace('/pages', '', 1)
464
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
562
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
563 elif mode=="filepath":
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
564 # url points to image file, index.meta optional
566
4a31608f8b0e more new MpiwgXmlTextServer.
casties
parents: 565
diff changeset
565 docinfo['imageURL'] = "%s?fn=%s"%(self.digilibScalerUrl, url)
548
7acc919f52ff mode=filepath works again
casties
parents: 546
diff changeset
566 docinfo['numPages'] = 1
464
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
567 # asssume index.meta is two path segments up
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
568 docUrl = getParentPath(url, 2)
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
569 metaDom = self.metadataService.getDomFromPathOrUrl(docUrl)
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
570
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
571 else:
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
572 logging.error("documentViewer (getdocinfo) unknown mode: %s!"%mode)
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
573 raise ValueError("Unknown mode %s! Has to be one of 'texttool','imagepath','filepath'."%(mode))
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
574
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
575 docinfo['documentUrl'] = docUrl
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
576 # process index.meta contents
473
74e9e74277e9 smaller improvements
casties
parents: 472
diff changeset
577 if metaDom is not None and metaDom.tag == 'resource':
464
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
578 # document directory name and path
608
0c6056271654 show is-part-of relation in header.
casties
parents: 607
diff changeset
579 resource = self.metadataService.getResourceData(dom=metaDom, recursive=1)
464
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
580 if resource:
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
581 docinfo = self.getDocinfoFromResource(docinfo, resource)
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
582
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
583 # texttool info
561
9255acc4518d CLOSED - # 256: display texts from different backends (sandbox)
casties
parents: 560
diff changeset
584 texttool = self.metadataService.getTexttoolData(dom=metaDom, recursive=1, all=True)
464
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
585 if texttool:
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
586 docinfo = self.getDocinfoFromTexttool(docinfo, texttool)
568
694935574177 more new MpiwgXmlTextServer.
casties
parents: 566
diff changeset
587 # document info from full text server
516
7d7b639d7be7 add methods to use doc-info.xql.
casties
parents: 514
diff changeset
588 if docinfo.get('textURLPath', None):
565
1b483194901c more new MpiwgXmlTextServer.
casties
parents: 564
diff changeset
589 docinfo = self.getTextInfo(mode=None, docinfo=docinfo)
568
694935574177 more new MpiwgXmlTextServer.
casties
parents: 566
diff changeset
590 # include list of pages TODO: do we need this always?
694935574177 more new MpiwgXmlTextServer.
casties
parents: 566
diff changeset
591 docinfo = self.getTextInfo(mode='pages', docinfo=docinfo)
464
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
592
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
593 # bib info
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
594 bib = self.metadataService.getBibData(dom=metaDom)
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
595 if bib:
548
7acc919f52ff mode=filepath works again
casties
parents: 546
diff changeset
596 # save extended version as 'bibx' TODO: ugly
541
c4cc01b104d7 better metadata display for index page.
casties
parents: 538
diff changeset
597 bibx = self.metadataService.getBibData(dom=metaDom, all=True, recursive=1)
c4cc01b104d7 better metadata display for index page.
casties
parents: 538
diff changeset
598 if len(bibx) == 1:
c4cc01b104d7 better metadata display for index page.
casties
parents: 538
diff changeset
599 # unwrap list if possible
c4cc01b104d7 better metadata display for index page.
casties
parents: 538
diff changeset
600 bibx = bibx[0]
c4cc01b104d7 better metadata display for index page.
casties
parents: 538
diff changeset
601
c4cc01b104d7 better metadata display for index page.
casties
parents: 538
diff changeset
602 docinfo['bibx'] = bibx
c4cc01b104d7 better metadata display for index page.
casties
parents: 538
diff changeset
603 docinfo = self.getDocinfoFromBib(docinfo, bib, bibx)
465
224aad394350 really works with new getDocinfo
casties
parents: 464
diff changeset
604 else:
224aad394350 really works with new getDocinfo
casties
parents: 464
diff changeset
605 # no bib - try info.xml
224aad394350 really works with new getDocinfo
casties
parents: 464
diff changeset
606 docinfo = self.getDocinfoFromPresentationInfoXml(docinfo)
464
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
607
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
608 # auth info
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
609 access = self.metadataService.getAccessData(dom=metaDom)
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
610 if access:
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
611 docinfo = self.getDocinfoFromAccess(docinfo, access)
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
612
466
1641be8dc6b5 attribution works now
casties
parents: 465
diff changeset
613 # attribution info
1641be8dc6b5 attribution works now
casties
parents: 465
diff changeset
614 attribution = self.metadataService.getAttributionData(dom=metaDom)
1641be8dc6b5 attribution works now
casties
parents: 465
diff changeset
615 if attribution:
1641be8dc6b5 attribution works now
casties
parents: 465
diff changeset
616 logging.debug("getDocinfo: attribution=%s"%repr(attribution))
1641be8dc6b5 attribution works now
casties
parents: 465
diff changeset
617 docinfo['attribution'] = attribution
1641be8dc6b5 attribution works now
casties
parents: 465
diff changeset
618
1641be8dc6b5 attribution works now
casties
parents: 465
diff changeset
619 # copyright info
1641be8dc6b5 attribution works now
casties
parents: 465
diff changeset
620 copyright = self.metadataService.getCopyrightData(dom=metaDom)
1641be8dc6b5 attribution works now
casties
parents: 465
diff changeset
621 if copyright:
1641be8dc6b5 attribution works now
casties
parents: 465
diff changeset
622 logging.debug("getDocinfo: copyright=%s"%repr(copyright))
1641be8dc6b5 attribution works now
casties
parents: 465
diff changeset
623 docinfo['copyright'] = copyright
538
dbf25bd05fc6 digilib buttons get icons. pid on index page.
casties
parents: 536
diff changeset
624
dbf25bd05fc6 digilib buttons get icons. pid on index page.
casties
parents: 536
diff changeset
625 # DRI (permanent ID)
581
514902fb6b8a use dri repository=mpiwg as default
casties
parents: 580
diff changeset
626 dri = self.metadataService.getDRI(dom=metaDom, type='mpiwg')
538
dbf25bd05fc6 digilib buttons get icons. pid on index page.
casties
parents: 536
diff changeset
627 if dri:
dbf25bd05fc6 digilib buttons get icons. pid on index page.
casties
parents: 536
diff changeset
628 docinfo['DRI'] = dri
466
1641be8dc6b5 attribution works now
casties
parents: 465
diff changeset
629
578
024b75162437 displays context data on index page
casties
parents: 577
diff changeset
630 # (presentation) context
024b75162437 displays context data on index page
casties
parents: 577
diff changeset
631 ctx = self.metadataService.getContextData(dom=metaDom, all=True)
024b75162437 displays context data on index page
casties
parents: 577
diff changeset
632 if ctx:
024b75162437 displays context data on index page
casties
parents: 577
diff changeset
633 logging.debug("getcontext: ctx=%s"%repr(ctx))
024b75162437 displays context data on index page
casties
parents: 577
diff changeset
634 docinfo['presentationContext'] = ctx
024b75162437 displays context data on index page
casties
parents: 577
diff changeset
635
464
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
636 # image path
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
637 if mode != 'texttool':
532
0b8bed1223ad new layout and styles.
casties
parents: 530
diff changeset
638 # override image path from texttool with url parameter TODO: how about mode=auto?
599
3b79ae4a23ca normalize uri of annotated image.
casties
parents: 594
diff changeset
639 docinfo['imagePath'] = url.replace('/mpiwg/online', '', 1)
464
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
640
548
7acc919f52ff mode=filepath works again
casties
parents: 546
diff changeset
641 # check numPages
7acc919f52ff mode=filepath works again
casties
parents: 546
diff changeset
642 if docinfo.get('numPages', 0) == 0:
7acc919f52ff mode=filepath works again
casties
parents: 546
diff changeset
643 # number of images from digilib
7acc919f52ff mode=filepath works again
casties
parents: 546
diff changeset
644 if docinfo.get('imagePath', None):
599
3b79ae4a23ca normalize uri of annotated image.
casties
parents: 594
diff changeset
645 imgpath = docinfo['imagePath'].replace('/mpiwg/online', '', 1)
580
0806cb9061c1 fixed another bug when url starts with /mpiwg/online/
casties
parents: 578
diff changeset
646 logging.debug("imgpath=%s"%imgpath)
625
80a3b1fa5705 more move sslification to only client-visible urls.
casties
parents: 624
diff changeset
647 docinfo['imageURL'] = sslifyUrl("%s?fn=%s"%(self.digilibScalerUrl, imgpath), self, force=True)
562
60f5a636bc57 bugfixes for stability.
casties
parents: 561
diff changeset
648 docinfo = self.getDocinfoFromDigilib(docinfo, imgpath)
548
7acc919f52ff mode=filepath works again
casties
parents: 546
diff changeset
649 else:
7acc919f52ff mode=filepath works again
casties
parents: 546
diff changeset
650 # imagePath still missing? try "./pageimg"
7acc919f52ff mode=filepath works again
casties
parents: 546
diff changeset
651 imgPath = os.path.join(docUrl, 'pageimg')
7acc919f52ff mode=filepath works again
casties
parents: 546
diff changeset
652 docinfo = self.getDocinfoFromDigilib(docinfo, imgPath)
7acc919f52ff mode=filepath works again
casties
parents: 546
diff changeset
653 if docinfo.get('numPages', 0) > 0:
7acc919f52ff mode=filepath works again
casties
parents: 546
diff changeset
654 # there are pages
7acc919f52ff mode=filepath works again
casties
parents: 546
diff changeset
655 docinfo['imagePath'] = imgPath
625
80a3b1fa5705 more move sslification to only client-visible urls.
casties
parents: 624
diff changeset
656 docinfo['imageURL'] = sslifyUrl("%s?fn=%s"%(self.digilibScalerUrl, docinfo['imagePath']), self, force=True)
464
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
657
516
7d7b639d7be7 add methods to use doc-info.xql.
casties
parents: 514
diff changeset
658 # check numPages
7d7b639d7be7 add methods to use doc-info.xql.
casties
parents: 514
diff changeset
659 if docinfo.get('numPages', 0) == 0:
7d7b639d7be7 add methods to use doc-info.xql.
casties
parents: 514
diff changeset
660 if docinfo.get('numTextPages', 0) > 0:
7d7b639d7be7 add methods to use doc-info.xql.
casties
parents: 514
diff changeset
661 # replace with numTextPages (text-only?)
7d7b639d7be7 add methods to use doc-info.xql.
casties
parents: 514
diff changeset
662 docinfo['numPages'] = docinfo['numTextPages']
607
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
663
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
664 # min and max page no
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
665 docinfo['minPageNo'] = docinfo.get('minPageNo', 1)
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
666 docinfo['maxPageNo'] = docinfo.get('maxPageNo', docinfo['numPages'])
516
7d7b639d7be7 add methods to use doc-info.xql.
casties
parents: 514
diff changeset
667
608
0c6056271654 show is-part-of relation in header.
casties
parents: 607
diff changeset
668 # part-of information
0c6056271654 show is-part-of relation in header.
casties
parents: 607
diff changeset
669 partOfPath = docinfo.get('partOfPath', None)
0c6056271654 show is-part-of relation in header.
casties
parents: 607
diff changeset
670 if partOfPath is not None:
0c6056271654 show is-part-of relation in header.
casties
parents: 607
diff changeset
671 partOfDom = self.metadataService.getDomFromPathOrUrl(partOfPath)
0c6056271654 show is-part-of relation in header.
casties
parents: 607
diff changeset
672 if partOfDom is not None:
0c6056271654 show is-part-of relation in header.
casties
parents: 607
diff changeset
673 docinfo['partOfLabel'] = self.metadataService.getBibFormattedLabel(dom=partOfDom)
0c6056271654 show is-part-of relation in header.
casties
parents: 607
diff changeset
674 docinfo['partOfUrl'] = "%s?url=%s"%(self.getDocumentViewerURL(), partOfPath)
0c6056271654 show is-part-of relation in header.
casties
parents: 607
diff changeset
675 logging.debug("partOfLabel=%s partOfUrl=%s"%(docinfo['partOfLabel'],docinfo['partOfUrl']))
0c6056271654 show is-part-of relation in header.
casties
parents: 607
diff changeset
676
599
3b79ae4a23ca normalize uri of annotated image.
casties
parents: 594
diff changeset
677 # normalize path
3b79ae4a23ca normalize uri of annotated image.
casties
parents: 594
diff changeset
678 if 'imagePath' in docinfo and not docinfo['imagePath'].startswith('/'):
3b79ae4a23ca normalize uri of annotated image.
casties
parents: 594
diff changeset
679 docinfo['imagePath'] = '/' + docinfo['imagePath']
3b79ae4a23ca normalize uri of annotated image.
casties
parents: 594
diff changeset
680
464
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
681 logging.debug("documentViewer (getdocinfo) docinfo: keys=%s"%docinfo.keys())
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
682 # store in session
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
683 self.REQUEST.SESSION['docinfo'] = docinfo
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
684 return docinfo
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
685
516
7d7b639d7be7 add methods to use doc-info.xql.
casties
parents: 514
diff changeset
686
464
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
687 def getDocinfoFromResource(self, docinfo, resource):
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
688 """reads contents of resource element into docinfo"""
608
0c6056271654 show is-part-of relation in header.
casties
parents: 607
diff changeset
689 logging.debug("getDocinfoFromResource: resource=%s"%(repr(resource)))
0c6056271654 show is-part-of relation in header.
casties
parents: 607
diff changeset
690 docName = getMDText(resource.get('name', None))
464
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
691 docinfo['documentName'] = docName
608
0c6056271654 show is-part-of relation in header.
casties
parents: 607
diff changeset
692 docPath = getMDText(resource.get('archive-path', None))
464
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
693 if docPath:
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
694 # clean up document path
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
695 if docPath[0] != '/':
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
696 docPath = '/' + docPath
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
697
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
698 if docName and (not docPath.endswith(docName)):
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
699 docPath += "/" + docName
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
700
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
701 else:
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
702 # use docUrl as docPath
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
703 docUrl = docinfo['documentURL']
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
704 if not docUrl.startswith('http:'):
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
705 docPath = docUrl
608
0c6056271654 show is-part-of relation in header.
casties
parents: 607
diff changeset
706
465
224aad394350 really works with new getDocinfo
casties
parents: 464
diff changeset
707 if docPath:
224aad394350 really works with new getDocinfo
casties
parents: 464
diff changeset
708 # fix URLs starting with /mpiwg/online
224aad394350 really works with new getDocinfo
casties
parents: 464
diff changeset
709 docPath = docPath.replace('/mpiwg/online', '', 1)
224aad394350 really works with new getDocinfo
casties
parents: 464
diff changeset
710
464
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
711 docinfo['documentPath'] = docPath
608
0c6056271654 show is-part-of relation in header.
casties
parents: 607
diff changeset
712
0c6056271654 show is-part-of relation in header.
casties
parents: 607
diff changeset
713 # is this part-of?
0c6056271654 show is-part-of relation in header.
casties
parents: 607
diff changeset
714 partOf = resource.get('is-part-of', None)
0c6056271654 show is-part-of relation in header.
casties
parents: 607
diff changeset
715 if partOf is not None:
0c6056271654 show is-part-of relation in header.
casties
parents: 607
diff changeset
716 partOf = getMDText(partOf.get('archive-path', None))
0c6056271654 show is-part-of relation in header.
casties
parents: 607
diff changeset
717 if partOf is not None:
0c6056271654 show is-part-of relation in header.
casties
parents: 607
diff changeset
718 docinfo['partOfPath'] = partOf.strip()
0c6056271654 show is-part-of relation in header.
casties
parents: 607
diff changeset
719
464
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
720 return docinfo
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
721
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
722 def getDocinfoFromTexttool(self, docinfo, texttool):
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
723 """reads contents of texttool element into docinfo"""
561
9255acc4518d CLOSED - # 256: display texts from different backends (sandbox)
casties
parents: 560
diff changeset
724 logging.debug("texttool=%s"%repr(texttool))
9255acc4518d CLOSED - # 256: display texts from different backends (sandbox)
casties
parents: 560
diff changeset
725 # unpack list if necessary
9255acc4518d CLOSED - # 256: display texts from different backends (sandbox)
casties
parents: 560
diff changeset
726 if isinstance(texttool, list):
9255acc4518d CLOSED - # 256: display texts from different backends (sandbox)
casties
parents: 560
diff changeset
727 texttool = texttool[0]
9255acc4518d CLOSED - # 256: display texts from different backends (sandbox)
casties
parents: 560
diff changeset
728
464
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
729 # image dir
561
9255acc4518d CLOSED - # 256: display texts from different backends (sandbox)
casties
parents: 560
diff changeset
730 imageDir = getMDText(texttool.get('image', None))
9255acc4518d CLOSED - # 256: display texts from different backends (sandbox)
casties
parents: 560
diff changeset
731 docPath = getMDText(docinfo.get('documentPath', None))
607
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
732 if imageDir:
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
733 if imageDir.startswith('/'):
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
734 # absolute path
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
735 imageDir = imageDir.replace('/mpiwg/online', '', 1)
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
736 docinfo['imagePath'] = imageDir
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
737
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
738 elif docPath:
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
739 # relative path
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
740 imageDir = os.path.join(docPath, imageDir)
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
741 imageDir = imageDir.replace('/mpiwg/online', '', 1)
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
742 docinfo['imagePath'] = imageDir
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
743
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
744 # start and end page (for subdocuments of other documents)
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
745 imgStartNo = getMDText(texttool.get('image-start-no', None))
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
746 minPageNo = getInt(imgStartNo, 1)
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
747 docinfo['minPageNo'] = minPageNo
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
748
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
749 imgEndNo = getMDText(texttool.get('image-end-no', None))
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
750 if imgEndNo:
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
751 docinfo['maxPageNo'] = getInt(imgEndNo)
464
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
752
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
753 # old style text URL
561
9255acc4518d CLOSED - # 256: display texts from different backends (sandbox)
casties
parents: 560
diff changeset
754 textUrl = getMDText(texttool.get('text', None))
617
7aefbddddaf9 alpaha of hocr server support
dwinter
parents: 613
diff changeset
755
464
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
756 if textUrl and docPath:
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
757 if urlparse.urlparse(textUrl)[0] == "": #keine url
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
758 textUrl = os.path.join(docPath, textUrl)
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
759
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
760 docinfo['textURL'] = textUrl
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
761
561
9255acc4518d CLOSED - # 256: display texts from different backends (sandbox)
casties
parents: 560
diff changeset
762 # new style text-url-path (can be more than one with "repository" attribute)
9255acc4518d CLOSED - # 256: display texts from different backends (sandbox)
casties
parents: 560
diff changeset
763 textUrlNode = texttool.get('text-url-path', None)
9255acc4518d CLOSED - # 256: display texts from different backends (sandbox)
casties
parents: 560
diff changeset
764 if not isinstance(textUrlNode, list):
9255acc4518d CLOSED - # 256: display texts from different backends (sandbox)
casties
parents: 560
diff changeset
765 textUrlNode = [textUrlNode]
9255acc4518d CLOSED - # 256: display texts from different backends (sandbox)
casties
parents: 560
diff changeset
766
9255acc4518d CLOSED - # 256: display texts from different backends (sandbox)
casties
parents: 560
diff changeset
767 for tun in textUrlNode:
9255acc4518d CLOSED - # 256: display texts from different backends (sandbox)
casties
parents: 560
diff changeset
768 textUrl = getMDText(tun)
9255acc4518d CLOSED - # 256: display texts from different backends (sandbox)
casties
parents: 560
diff changeset
769 if textUrl:
9255acc4518d CLOSED - # 256: display texts from different backends (sandbox)
casties
parents: 560
diff changeset
770 textUrlAtts = tun.get('@attr')
9255acc4518d CLOSED - # 256: display texts from different backends (sandbox)
casties
parents: 560
diff changeset
771 if (textUrlAtts and 'repository' in textUrlAtts):
9255acc4518d CLOSED - # 256: display texts from different backends (sandbox)
casties
parents: 560
diff changeset
772 textRepo = textUrlAtts['repository']
9255acc4518d CLOSED - # 256: display texts from different backends (sandbox)
casties
parents: 560
diff changeset
773 # use matching repository
9255acc4518d CLOSED - # 256: display texts from different backends (sandbox)
casties
parents: 560
diff changeset
774 if self.getRepositoryType() == textRepo:
9255acc4518d CLOSED - # 256: display texts from different backends (sandbox)
casties
parents: 560
diff changeset
775 docinfo['textURLPath'] = textUrl
9255acc4518d CLOSED - # 256: display texts from different backends (sandbox)
casties
parents: 560
diff changeset
776 docinfo['textURLRepository'] = textRepo
564
31f562fa7214 first version of MpiwgXmlTextServer.
casties
parents: 562
diff changeset
777 break
561
9255acc4518d CLOSED - # 256: display texts from different backends (sandbox)
casties
parents: 560
diff changeset
778
9255acc4518d CLOSED - # 256: display texts from different backends (sandbox)
casties
parents: 560
diff changeset
779 else:
9255acc4518d CLOSED - # 256: display texts from different backends (sandbox)
casties
parents: 560
diff changeset
780 # no repo attribute - use always
9255acc4518d CLOSED - # 256: display texts from different backends (sandbox)
casties
parents: 560
diff changeset
781 docinfo['textURLPath'] = textUrl
468
dc7c48912110 attribution and copyright works mostly now
casties
parents: 467
diff changeset
782
dc7c48912110 attribution and copyright works mostly now
casties
parents: 467
diff changeset
783 # page flow
561
9255acc4518d CLOSED - # 256: display texts from different backends (sandbox)
casties
parents: 560
diff changeset
784 docinfo['pageFlow'] = getMDText(texttool.get('page-flow', 'ltr'))
468
dc7c48912110 attribution and copyright works mostly now
casties
parents: 467
diff changeset
785
dc7c48912110 attribution and copyright works mostly now
casties
parents: 467
diff changeset
786 # odd pages are left
561
9255acc4518d CLOSED - # 256: display texts from different backends (sandbox)
casties
parents: 560
diff changeset
787 docinfo['oddPage'] = getMDText(texttool.get('odd-scan-position', 'left'))
468
dc7c48912110 attribution and copyright works mostly now
casties
parents: 467
diff changeset
788
541
c4cc01b104d7 better metadata display for index page.
casties
parents: 538
diff changeset
789 # number of title page (default 1)
607
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
790 docinfo['titlePage'] = getMDText(texttool.get('title-scan-no', minPageNo))
464
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
791
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
792 # old presentation stuff
561
9255acc4518d CLOSED - # 256: display texts from different backends (sandbox)
casties
parents: 560
diff changeset
793 presentation = getMDText(texttool.get('presentation', None))
464
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
794 if presentation and docPath:
465
224aad394350 really works with new getDocinfo
casties
parents: 464
diff changeset
795 if presentation.startswith('http:'):
224aad394350 really works with new getDocinfo
casties
parents: 464
diff changeset
796 docinfo['presentationUrl'] = presentation
224aad394350 really works with new getDocinfo
casties
parents: 464
diff changeset
797 else:
224aad394350 really works with new getDocinfo
casties
parents: 464
diff changeset
798 docinfo['presentationUrl'] = os.path.join(docPath, presentation)
602
ef1d0a1fc9fa fix bug with no dc-metadata.
casties
parents: 599
diff changeset
799
ef1d0a1fc9fa fix bug with no dc-metadata.
casties
parents: 599
diff changeset
800 # make sure we have at least fake DC data
ef1d0a1fc9fa fix bug with no dc-metadata.
casties
parents: 599
diff changeset
801 if 'creator' not in docinfo:
ef1d0a1fc9fa fix bug with no dc-metadata.
casties
parents: 599
diff changeset
802 docinfo['creator'] = '[no author found]'
ef1d0a1fc9fa fix bug with no dc-metadata.
casties
parents: 599
diff changeset
803
ef1d0a1fc9fa fix bug with no dc-metadata.
casties
parents: 599
diff changeset
804 if 'title' not in docinfo:
ef1d0a1fc9fa fix bug with no dc-metadata.
casties
parents: 599
diff changeset
805 docinfo['title'] = '[no title found]'
ef1d0a1fc9fa fix bug with no dc-metadata.
casties
parents: 599
diff changeset
806
ef1d0a1fc9fa fix bug with no dc-metadata.
casties
parents: 599
diff changeset
807 if 'date' not in docinfo:
ef1d0a1fc9fa fix bug with no dc-metadata.
casties
parents: 599
diff changeset
808 docinfo['date'] = '[no date found]'
468
dc7c48912110 attribution and copyright works mostly now
casties
parents: 467
diff changeset
809
464
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
810 return docinfo
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
811
541
c4cc01b104d7 better metadata display for index page.
casties
parents: 538
diff changeset
812 def getDocinfoFromBib(self, docinfo, bib, bibx=None):
464
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
813 """reads contents of bib element into docinfo"""
465
224aad394350 really works with new getDocinfo
casties
parents: 464
diff changeset
814 logging.debug("getDocinfoFromBib bib=%s"%repr(bib))
464
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
815 # put all raw bib fields in dict "bib"
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
816 docinfo['bib'] = bib
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
817 bibtype = bib.get('@type', None)
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
818 docinfo['bibType'] = bibtype
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
819 # also store DC metadata for convenience
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
820 dc = self.metadataService.getDCMappedData(bib)
536
abd36d4d97b8 new version of index page. improvements for digilib page and thumbnail overview.
casties
parents: 535
diff changeset
821 docinfo['creator'] = dc.get('creator','')
abd36d4d97b8 new version of index page. improvements for digilib page and thumbnail overview.
casties
parents: 535
diff changeset
822 docinfo['title'] = dc.get('title','')
abd36d4d97b8 new version of index page. improvements for digilib page and thumbnail overview.
casties
parents: 535
diff changeset
823 docinfo['date'] = dc.get('date','')
464
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
824 return docinfo
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
825
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
826 def getDocinfoFromAccess(self, docinfo, acc):
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
827 """reads contents of access element into docinfo"""
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
828 #TODO: also read resource type
465
224aad394350 really works with new getDocinfo
casties
parents: 464
diff changeset
829 logging.debug("getDocinfoFromAccess acc=%s"%repr(acc))
464
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
830 try:
465
224aad394350 really works with new getDocinfo
casties
parents: 464
diff changeset
831 acctype = acc['@attr']['type']
464
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
832 if acctype:
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
833 access=acctype
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
834 if access in ['group', 'institution']:
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
835 access = acc['name'].lower()
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
836
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
837 docinfo['accessType'] = access
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
838
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
839 except:
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
840 pass
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
841
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
842 return docinfo
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
843
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
844 def getDocinfoFromDigilib(self, docinfo, path):
587
6000c7e24d8a new parameter "pf" to specify image file name. (still some issues)
casties
parents: 585
diff changeset
845 infoUrl=self.digilibBaseUrl+"/dirInfo-xml.jsp?fn="+path
464
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
846 # fetch data
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
847 txt = getHttpData(infoUrl)
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
848 if not txt:
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
849 logging.error("Unable to get dir-info from %s"%(infoUrl))
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
850 return docinfo
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
851
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
852 dom = ET.fromstring(txt)
587
6000c7e24d8a new parameter "pf" to specify image file name. (still some issues)
casties
parents: 585
diff changeset
853 dir = dom
6000c7e24d8a new parameter "pf" to specify image file name. (still some issues)
casties
parents: 585
diff changeset
854 # save size
6000c7e24d8a new parameter "pf" to specify image file name. (still some issues)
casties
parents: 585
diff changeset
855 size = dir.findtext('size')
464
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
856 logging.debug("getDocinfoFromDigilib: size=%s"%size)
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
857 if size:
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
858 docinfo['numPages'] = int(size)
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
859 else:
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
860 docinfo['numPages'] = 0
587
6000c7e24d8a new parameter "pf" to specify image file name. (still some issues)
casties
parents: 585
diff changeset
861 return docinfo
464
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
862
587
6000c7e24d8a new parameter "pf" to specify image file name. (still some issues)
casties
parents: 585
diff changeset
863 # save list of image names and numbers
6000c7e24d8a new parameter "pf" to specify image file name. (still some issues)
casties
parents: 585
diff changeset
864 imgNames = {}
591
5850689ecfac ocrsearch layer for images.
casties
parents: 590
diff changeset
865 imgIndexes = {}
587
6000c7e24d8a new parameter "pf" to specify image file name. (still some issues)
casties
parents: 585
diff changeset
866 for f in dir:
6000c7e24d8a new parameter "pf" to specify image file name. (still some issues)
casties
parents: 585
diff changeset
867 fn = f.findtext('name')
591
5850689ecfac ocrsearch layer for images.
casties
parents: 590
diff changeset
868 pn = getInt(f.findtext('index'))
5850689ecfac ocrsearch layer for images.
casties
parents: 590
diff changeset
869 imgNames[fn] = pn
5850689ecfac ocrsearch layer for images.
casties
parents: 590
diff changeset
870 imgIndexes[pn] = fn
587
6000c7e24d8a new parameter "pf" to specify image file name. (still some issues)
casties
parents: 585
diff changeset
871
6000c7e24d8a new parameter "pf" to specify image file name. (still some issues)
casties
parents: 585
diff changeset
872 docinfo['imgFileNames'] = imgNames
591
5850689ecfac ocrsearch layer for images.
casties
parents: 590
diff changeset
873 docinfo['imgFileIndexes'] = imgIndexes
464
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
874 return docinfo
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
875
19bd41d95f62 first version with new getdocinfo
casties
parents: 463
diff changeset
876
465
224aad394350 really works with new getDocinfo
casties
parents: 464
diff changeset
877 def getDocinfoFromPresentationInfoXml(self,docinfo):
224aad394350 really works with new getDocinfo
casties
parents: 464
diff changeset
878 """gets DC-like bibliographical information from the presentation entry in texttools"""
224aad394350 really works with new getDocinfo
casties
parents: 464
diff changeset
879 url = docinfo.get('presentationUrl', None)
224aad394350 really works with new getDocinfo
casties
parents: 464
diff changeset
880 if not url:
224aad394350 really works with new getDocinfo
casties
parents: 464
diff changeset
881 logging.error("getDocinfoFromPresentation: no URL!")
224aad394350 really works with new getDocinfo
casties
parents: 464
diff changeset
882 return docinfo
224aad394350 really works with new getDocinfo
casties
parents: 464
diff changeset
883
224aad394350 really works with new getDocinfo
casties
parents: 464
diff changeset
884 dom = None
224aad394350 really works with new getDocinfo
casties
parents: 464
diff changeset
885 metaUrl = None
224aad394350 really works with new getDocinfo
casties
parents: 464
diff changeset
886 if url.startswith("http://"):
224aad394350 really works with new getDocinfo
casties
parents: 464
diff changeset
887 # real URL
224aad394350 really works with new getDocinfo
casties
parents: 464
diff changeset
888 metaUrl = url
224aad394350 really works with new getDocinfo
casties
parents: 464
diff changeset
889 else:
224aad394350 really works with new getDocinfo
casties
parents: 464
diff changeset
890 # online path
224aad394350 really works with new getDocinfo
casties
parents: 464
diff changeset
891 server=self.digilibBaseUrl+"/servlet/Texter?fn="
224aad394350 really works with new getDocinfo
casties
parents: 464
diff changeset
892 metaUrl=server+url
224aad394350 really works with new getDocinfo
casties
parents: 464
diff changeset
893
224aad394350 really works with new getDocinfo
casties
parents: 464
diff changeset
894 txt=getHttpData(metaUrl)
224aad394350 really works with new getDocinfo
casties
parents: 464
diff changeset
895 if txt is None:
224aad394350 really works with new getDocinfo
casties
parents: 464
diff changeset
896 logging.error("Unable to read info.xml from %s"%(url))
224aad394350 really works with new getDocinfo
casties
parents: 464
diff changeset
897 return docinfo
224aad394350 really works with new getDocinfo
casties
parents: 464
diff changeset
898
224aad394350 really works with new getDocinfo
casties
parents: 464
diff changeset
899 dom = ET.fromstring(txt)
224aad394350 really works with new getDocinfo
casties
parents: 464
diff changeset
900 docinfo['creator']=getText(dom.find(".//author"))
224aad394350 really works with new getDocinfo
casties
parents: 464
diff changeset
901 docinfo['title']=getText(dom.find(".//title"))
224aad394350 really works with new getDocinfo
casties
parents: 464
diff changeset
902 docinfo['date']=getText(dom.find(".//date"))
224aad394350 really works with new getDocinfo
casties
parents: 464
diff changeset
903 return docinfo
224aad394350 really works with new getDocinfo
casties
parents: 464
diff changeset
904
224aad394350 really works with new getDocinfo
casties
parents: 464
diff changeset
905
587
6000c7e24d8a new parameter "pf" to specify image file name. (still some issues)
casties
parents: 585
diff changeset
906 def getPageinfo(self, pn=None, pf=None, start=None, rows=None, cols=None, docinfo=None, userinfo=None, viewMode=None, viewLayer=None, tocMode=None):
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
907 """returns pageinfo with the given parameters"""
587
6000c7e24d8a new parameter "pf" to specify image file name. (still some issues)
casties
parents: 585
diff changeset
908 logging.debug("getPageInfo(pn=%s, pf=%s, start=%s, rows=%s, cols=%s, viewMode=%s, viewLayer=%s, tocMode=%s)"%(pn,pf,start,rows,cols,viewMode,viewLayer,tocMode))
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
909 pageinfo = {}
471
415a7026eeda split viewMode in viewMode and viewType
casties
parents: 469
diff changeset
910 pageinfo['viewMode'] = viewMode
508
d5a47f82e755 more cleanup.
casties
parents: 507
diff changeset
911 # split viewLayer if necessary
d5a47f82e755 more cleanup.
casties
parents: 507
diff changeset
912 if isinstance(viewLayer,basestring):
d5a47f82e755 more cleanup.
casties
parents: 507
diff changeset
913 viewLayer = viewLayer.split(',')
d5a47f82e755 more cleanup.
casties
parents: 507
diff changeset
914
d5a47f82e755 more cleanup.
casties
parents: 507
diff changeset
915 if isinstance(viewLayer, list):
d5a47f82e755 more cleanup.
casties
parents: 507
diff changeset
916 logging.debug("getPageinfo: viewLayer is list:%s"%viewLayer)
d5a47f82e755 more cleanup.
casties
parents: 507
diff changeset
917 # save (unique) list in viewLayers
d5a47f82e755 more cleanup.
casties
parents: 507
diff changeset
918 seen = set()
d5a47f82e755 more cleanup.
casties
parents: 507
diff changeset
919 viewLayers = [l for l in viewLayer if l and l not in seen and not seen.add(l)]
d5a47f82e755 more cleanup.
casties
parents: 507
diff changeset
920 pageinfo['viewLayers'] = viewLayers
d5a47f82e755 more cleanup.
casties
parents: 507
diff changeset
921 # stringify viewLayer
d5a47f82e755 more cleanup.
casties
parents: 507
diff changeset
922 viewLayer = ','.join(viewLayers)
d5a47f82e755 more cleanup.
casties
parents: 507
diff changeset
923 else:
d5a47f82e755 more cleanup.
casties
parents: 507
diff changeset
924 #create list
d5a47f82e755 more cleanup.
casties
parents: 507
diff changeset
925 pageinfo['viewLayers'] = [viewLayer]
d5a47f82e755 more cleanup.
casties
parents: 507
diff changeset
926
503
030251fe9dbc more cleanup.
casties
parents: 501
diff changeset
927 pageinfo['viewLayer'] = viewLayer
471
415a7026eeda split viewMode in viewMode and viewType
casties
parents: 469
diff changeset
928 pageinfo['tocMode'] = tocMode
415a7026eeda split viewMode in viewMode and viewType
casties
parents: 469
diff changeset
929
607
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
930 minPageNo = docinfo.get('minPageNo', 1)
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
931
587
6000c7e24d8a new parameter "pf" to specify image file name. (still some issues)
casties
parents: 585
diff changeset
932 # pf takes precedence over pn
6000c7e24d8a new parameter "pf" to specify image file name. (still some issues)
casties
parents: 585
diff changeset
933 if pf:
6000c7e24d8a new parameter "pf" to specify image file name. (still some issues)
casties
parents: 585
diff changeset
934 pageinfo['pf'] = pf
6000c7e24d8a new parameter "pf" to specify image file name. (still some issues)
casties
parents: 585
diff changeset
935 pn = getPnForPf(docinfo, pf)
589
d8d6975cebcb more fixes for pf-parameter
casties
parents: 587
diff changeset
936 # replace pf in request params (used for creating new URLs)
d8d6975cebcb more fixes for pf-parameter
casties
parents: 587
diff changeset
937 self.REQUEST.form.pop('pf', None)
d8d6975cebcb more fixes for pf-parameter
casties
parents: 587
diff changeset
938 self.REQUEST.form['pn'] = pn
587
6000c7e24d8a new parameter "pf" to specify image file name. (still some issues)
casties
parents: 585
diff changeset
939 else:
607
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
940 pn = getInt(pn, minPageNo)
591
5850689ecfac ocrsearch layer for images.
casties
parents: 590
diff changeset
941 pf = getPfForPn(docinfo, pn)
5850689ecfac ocrsearch layer for images.
casties
parents: 590
diff changeset
942 pageinfo['pf'] = pf
587
6000c7e24d8a new parameter "pf" to specify image file name. (still some issues)
casties
parents: 585
diff changeset
943
6000c7e24d8a new parameter "pf" to specify image file name. (still some issues)
casties
parents: 585
diff changeset
944 pageinfo['pn'] = pn
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
945 rows = int(rows or self.thumbrows)
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
946 pageinfo['rows'] = rows
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
947 cols = int(cols or self.thumbcols)
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
948 pageinfo['cols'] = cols
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
949 grpsize = cols * rows
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
950 pageinfo['groupsize'] = grpsize
607
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
951 # if start is empty use one around pn
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
952 grouppn = math.ceil(float(pn)/float(grpsize))*grpsize-(grpsize-1)
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
953 # but not smaller than minPageNo
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
954 start = getInt(start, max(grouppn, minPageNo))
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
955 pageinfo['start'] = start
511
551ca1641a5e more cleanup.
casties
parents: 509
diff changeset
956 # get number of pages
607
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
957 numPages = int(docinfo.get('numPages', 0))
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
958 if numPages == 0:
518
91051b36b9cc uses xml info from doc-info.xql for table of contents now.
casties
parents: 516
diff changeset
959 # try numTextPages
607
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
960 numPages = docinfo.get('numTextPages', 0)
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
961 if numPages != 0:
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
962 docinfo['numPages'] = numPages
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
963
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
964 maxPageNo = docinfo.get('maxPageNo', numPages)
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
965 logging.debug("minPageNo=%s maxPageNo=%s start=%s numPages=%s"%(minPageNo,maxPageNo,start,numPages))
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
966 np = maxPageNo
518
91051b36b9cc uses xml info from doc-info.xql for table of contents now.
casties
parents: 516
diff changeset
967
511
551ca1641a5e more cleanup.
casties
parents: 509
diff changeset
968 # cache table of contents
551ca1641a5e more cleanup.
casties
parents: 509
diff changeset
969 pageinfo['tocPageSize'] = getInt(self.REQUEST.get('tocPageSize', 30))
469
15394486ab75 working with new templates
casties
parents: 468
diff changeset
970 pageinfo['numgroups'] = int(np / grpsize)
15394486ab75 working with new templates
casties
parents: 468
diff changeset
971 if np % grpsize > 0:
15394486ab75 working with new templates
casties
parents: 468
diff changeset
972 pageinfo['numgroups'] += 1
476
1d93a8cb2d8f more new template stuff
casties
parents: 475
diff changeset
973
1d93a8cb2d8f more new template stuff
casties
parents: 475
diff changeset
974 pageFlowLtr = docinfo.get('pageFlow', 'ltr') != 'rtl'
1d93a8cb2d8f more new template stuff
casties
parents: 475
diff changeset
975 oddScanLeft = docinfo.get('oddPage', 'left') != 'right'
1d93a8cb2d8f more new template stuff
casties
parents: 475
diff changeset
976 # add zeroth page for two columns
1d93a8cb2d8f more new template stuff
casties
parents: 475
diff changeset
977 pageZero = (cols == 2 and (pageFlowLtr != oddScanLeft))
1d93a8cb2d8f more new template stuff
casties
parents: 475
diff changeset
978 pageinfo['pageZero'] = pageZero
607
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
979 pageinfo['pageBatch'] = self.getPageBatch(start=start, rows=rows, cols=cols, pageFlowLtr=pageFlowLtr, pageZero=pageZero, minIdx=minPageNo, maxIdx=np)
516
7d7b639d7be7 add methods to use doc-info.xql.
casties
parents: 514
diff changeset
980 # more page parameters
629
e36bf3226fde text image viewer eingecheckt
dwinter
parents: 626
diff changeset
981 #pageinfo['characterNormalization'] = self.REQUEST.get('characterNormalization','reg')
e36bf3226fde text image viewer eingecheckt
dwinter
parents: 626
diff changeset
982 #becuase it is buggy this currently disabled and set to orig.
e36bf3226fde text image viewer eingecheckt
dwinter
parents: 626
diff changeset
983 pageinfo['characterNormalization'] = 'orig'
516
7d7b639d7be7 add methods to use doc-info.xql.
casties
parents: 514
diff changeset
984 if docinfo.get('pageNumbers'):
7d7b639d7be7 add methods to use doc-info.xql.
casties
parents: 514
diff changeset
985 # get original page numbers
587
6000c7e24d8a new parameter "pf" to specify image file name. (still some issues)
casties
parents: 585
diff changeset
986 pageNumber = docinfo['pageNumbers'].get(pn, None)
516
7d7b639d7be7 add methods to use doc-info.xql.
casties
parents: 514
diff changeset
987 if pageNumber is not None:
7d7b639d7be7 add methods to use doc-info.xql.
casties
parents: 514
diff changeset
988 pageinfo['pageNumberOrig'] = pageNumber['no']
7d7b639d7be7 add methods to use doc-info.xql.
casties
parents: 514
diff changeset
989 pageinfo['pageNumberOrigNorm'] = pageNumber['non']
158
4f4fe4e56ffe characterNormalization
abukhman
parents: 157
diff changeset
990
511
551ca1641a5e more cleanup.
casties
parents: 509
diff changeset
991 # cache search results
551ca1641a5e more cleanup.
casties
parents: 509
diff changeset
992 query = self.REQUEST.get('query',None)
551ca1641a5e more cleanup.
casties
parents: 509
diff changeset
993 pageinfo['query'] = query
591
5850689ecfac ocrsearch layer for images.
casties
parents: 590
diff changeset
994 if query and viewMode == 'text':
5850689ecfac ocrsearch layer for images.
casties
parents: 590
diff changeset
995 pageinfo['resultPageSize'] = getInt(self.REQUEST.get('resultPageSize', 10))
511
551ca1641a5e more cleanup.
casties
parents: 509
diff changeset
996 queryType = self.REQUEST.get('queryType', 'fulltextMorph')
551ca1641a5e more cleanup.
casties
parents: 509
diff changeset
997 pageinfo['queryType'] = queryType
551ca1641a5e more cleanup.
casties
parents: 509
diff changeset
998 pageinfo['resultStart'] = getInt(self.REQUEST.get('resultStart', '1'))
551ca1641a5e more cleanup.
casties
parents: 509
diff changeset
999 self.getSearchResults(mode=queryType, query=query, pageinfo=pageinfo, docinfo=docinfo)
551ca1641a5e more cleanup.
casties
parents: 509
diff changeset
1000
551ca1641a5e more cleanup.
casties
parents: 509
diff changeset
1001 # highlighting
551ca1641a5e more cleanup.
casties
parents: 509
diff changeset
1002 highlightQuery = self.REQUEST.get('highlightQuery', None)
551ca1641a5e more cleanup.
casties
parents: 509
diff changeset
1003 if highlightQuery:
551ca1641a5e more cleanup.
casties
parents: 509
diff changeset
1004 pageinfo['highlightQuery'] = highlightQuery
551ca1641a5e more cleanup.
casties
parents: 509
diff changeset
1005 pageinfo['highlightElement'] = self.REQUEST.get('highlightElement', '')
551ca1641a5e more cleanup.
casties
parents: 509
diff changeset
1006 pageinfo['highlightElementPos'] = self.REQUEST.get('highlightElementPos', '')
460
76bc2317146f more renovation
casties
parents: 459
diff changeset
1007
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
1008 return pageinfo
460
76bc2317146f more renovation
casties
parents: 459
diff changeset
1009
463
89ad327b4bbd more renovation
casties
parents: 462
diff changeset
1010
482
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1011 def getPageBatch(self, start=1, rows=10, cols=2, pageFlowLtr=True, pageZero=False, minIdx=1, maxIdx=0):
613
c57d80a649ea CLOSED - # 281: List of thumbnails verschluckt Seite, wenn odd-scan-position gesetzt ist
casties
parents: 612
diff changeset
1012 """Return dict with array of page information for one screenfull of thumbnails.
c57d80a649ea CLOSED - # 281: List of thumbnails verschluckt Seite, wenn odd-scan-position gesetzt ist
casties
parents: 612
diff changeset
1013
c57d80a649ea CLOSED - # 281: List of thumbnails verschluckt Seite, wenn odd-scan-position gesetzt ist
casties
parents: 612
diff changeset
1014 :param start: index of current page
c57d80a649ea CLOSED - # 281: List of thumbnails verschluckt Seite, wenn odd-scan-position gesetzt ist
casties
parents: 612
diff changeset
1015 :param rows: number of rows in one batch
c57d80a649ea CLOSED - # 281: List of thumbnails verschluckt Seite, wenn odd-scan-position gesetzt ist
casties
parents: 612
diff changeset
1016 :param cols: number of columns in one batch
c57d80a649ea CLOSED - # 281: List of thumbnails verschluckt Seite, wenn odd-scan-position gesetzt ist
casties
parents: 612
diff changeset
1017 :param pageFlowLtr: do indexes increase from left to right
c57d80a649ea CLOSED - # 281: List of thumbnails verschluckt Seite, wenn odd-scan-position gesetzt ist
casties
parents: 612
diff changeset
1018 :param pageZero: is there a zeroth non-visible page
c57d80a649ea CLOSED - # 281: List of thumbnails verschluckt Seite, wenn odd-scan-position gesetzt ist
casties
parents: 612
diff changeset
1019 :param minIdx: minimum index to use
c57d80a649ea CLOSED - # 281: List of thumbnails verschluckt Seite, wenn odd-scan-position gesetzt ist
casties
parents: 612
diff changeset
1020 :param maxIdx: maximum index to use
c57d80a649ea CLOSED - # 281: List of thumbnails verschluckt Seite, wenn odd-scan-position gesetzt ist
casties
parents: 612
diff changeset
1021 :returns: dict with
c57d80a649ea CLOSED - # 281: List of thumbnails verschluckt Seite, wenn odd-scan-position gesetzt ist
casties
parents: 612
diff changeset
1022 first: first page index
c57d80a649ea CLOSED - # 281: List of thumbnails verschluckt Seite, wenn odd-scan-position gesetzt ist
casties
parents: 612
diff changeset
1023 last: last page index
c57d80a649ea CLOSED - # 281: List of thumbnails verschluckt Seite, wenn odd-scan-position gesetzt ist
casties
parents: 612
diff changeset
1024 batches: list of all possible batches(dict: 'start': index, 'end': index)
c57d80a649ea CLOSED - # 281: List of thumbnails verschluckt Seite, wenn odd-scan-position gesetzt ist
casties
parents: 612
diff changeset
1025 pages: list for current batch of rows(list of cols(list of pages(dict: 'idx': index)))
c57d80a649ea CLOSED - # 281: List of thumbnails verschluckt Seite, wenn odd-scan-position gesetzt ist
casties
parents: 612
diff changeset
1026 nextStart: first index of next batch
c57d80a649ea CLOSED - # 281: List of thumbnails verschluckt Seite, wenn odd-scan-position gesetzt ist
casties
parents: 612
diff changeset
1027 prevStart: first index of previous batch
c57d80a649ea CLOSED - # 281: List of thumbnails verschluckt Seite, wenn odd-scan-position gesetzt ist
casties
parents: 612
diff changeset
1028 """
607
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
1029 logging.debug("getPageBatch start=%s minIdx=%s maxIdx=%s"%(start,minIdx,maxIdx))
482
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1030 batch = {}
480
50a28442f21c more new template stuff
casties
parents: 479
diff changeset
1031 grpsize = rows * cols
476
1d93a8cb2d8f more new template stuff
casties
parents: 475
diff changeset
1032 if maxIdx == 0:
480
50a28442f21c more new template stuff
casties
parents: 479
diff changeset
1033 maxIdx = start + grpsize
476
1d93a8cb2d8f more new template stuff
casties
parents: 475
diff changeset
1034
607
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
1035 np = maxIdx - minIdx + 1
613
c57d80a649ea CLOSED - # 281: List of thumbnails verschluckt Seite, wenn odd-scan-position gesetzt ist
casties
parents: 612
diff changeset
1036 if pageZero:
c57d80a649ea CLOSED - # 281: List of thumbnails verschluckt Seite, wenn odd-scan-position gesetzt ist
casties
parents: 612
diff changeset
1037 # correct number of pages for batching
c57d80a649ea CLOSED - # 281: List of thumbnails verschluckt Seite, wenn odd-scan-position gesetzt ist
casties
parents: 612
diff changeset
1038 np += 1
c57d80a649ea CLOSED - # 281: List of thumbnails verschluckt Seite, wenn odd-scan-position gesetzt ist
casties
parents: 612
diff changeset
1039
607
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
1040 nb = int(math.ceil(np / float(grpsize)))
613
c57d80a649ea CLOSED - # 281: List of thumbnails verschluckt Seite, wenn odd-scan-position gesetzt ist
casties
parents: 612
diff changeset
1041
482
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1042 # list of all batch start and end points
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1043 batches = []
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1044 if pageZero:
607
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
1045 ofs = minIdx - 1
482
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1046 else:
607
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
1047 ofs = minIdx
482
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1048
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1049 for i in range(nb):
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1050 s = i * grpsize + ofs
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1051 e = min((i + 1) * grpsize + ofs - 1, maxIdx)
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1052 batches.append({'start':s, 'end':e})
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1053
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1054 batch['batches'] = batches
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1055
613
c57d80a649ea CLOSED - # 281: List of thumbnails verschluckt Seite, wenn odd-scan-position gesetzt ist
casties
parents: 612
diff changeset
1056 # list of pages for current screen
476
1d93a8cb2d8f more new template stuff
casties
parents: 475
diff changeset
1057 pages = []
607
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
1058 if pageZero and start == minIdx:
476
1d93a8cb2d8f more new template stuff
casties
parents: 475
diff changeset
1059 # correct beginning
607
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
1060 idx = minIdx - 1
476
1d93a8cb2d8f more new template stuff
casties
parents: 475
diff changeset
1061 else:
1d93a8cb2d8f more new template stuff
casties
parents: 475
diff changeset
1062 idx = start
1d93a8cb2d8f more new template stuff
casties
parents: 475
diff changeset
1063
1d93a8cb2d8f more new template stuff
casties
parents: 475
diff changeset
1064 for r in range(rows):
1d93a8cb2d8f more new template stuff
casties
parents: 475
diff changeset
1065 row = []
1d93a8cb2d8f more new template stuff
casties
parents: 475
diff changeset
1066 for c in range(cols):
1d93a8cb2d8f more new template stuff
casties
parents: 475
diff changeset
1067 if idx < minIdx or idx > maxIdx:
1d93a8cb2d8f more new template stuff
casties
parents: 475
diff changeset
1068 page = {'idx':None}
1d93a8cb2d8f more new template stuff
casties
parents: 475
diff changeset
1069 else:
1d93a8cb2d8f more new template stuff
casties
parents: 475
diff changeset
1070 page = {'idx':idx}
1d93a8cb2d8f more new template stuff
casties
parents: 475
diff changeset
1071
1d93a8cb2d8f more new template stuff
casties
parents: 475
diff changeset
1072 idx += 1
1d93a8cb2d8f more new template stuff
casties
parents: 475
diff changeset
1073 if pageFlowLtr:
1d93a8cb2d8f more new template stuff
casties
parents: 475
diff changeset
1074 row.append(page)
1d93a8cb2d8f more new template stuff
casties
parents: 475
diff changeset
1075 else:
1d93a8cb2d8f more new template stuff
casties
parents: 475
diff changeset
1076 row.insert(0, page)
1d93a8cb2d8f more new template stuff
casties
parents: 475
diff changeset
1077
1d93a8cb2d8f more new template stuff
casties
parents: 475
diff changeset
1078 pages.append(row)
1d93a8cb2d8f more new template stuff
casties
parents: 475
diff changeset
1079
607
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
1080 if start > minIdx:
cb5a9c4f5e3a CLOSED - # 268: display of subdocuments
casties
parents: 602
diff changeset
1081 batch['prevStart'] = max(start - grpsize, minIdx)
480
50a28442f21c more new template stuff
casties
parents: 479
diff changeset
1082 else:
50a28442f21c more new template stuff
casties
parents: 479
diff changeset
1083 batch['prevStart'] = None
50a28442f21c more new template stuff
casties
parents: 479
diff changeset
1084
526
3f375a048402 moved search and dict into separate layers.
casties
parents: 525
diff changeset
1085 if start + grpsize <= maxIdx:
613
c57d80a649ea CLOSED - # 281: List of thumbnails verschluckt Seite, wenn odd-scan-position gesetzt ist
casties
parents: 612
diff changeset
1086 if pageZero and start == minIdx:
c57d80a649ea CLOSED - # 281: List of thumbnails verschluckt Seite, wenn odd-scan-position gesetzt ist
casties
parents: 612
diff changeset
1087 # correct nextStart for pageZero
c57d80a649ea CLOSED - # 281: List of thumbnails verschluckt Seite, wenn odd-scan-position gesetzt ist
casties
parents: 612
diff changeset
1088 batch['nextStart'] = grpsize
c57d80a649ea CLOSED - # 281: List of thumbnails verschluckt Seite, wenn odd-scan-position gesetzt ist
casties
parents: 612
diff changeset
1089 else:
c57d80a649ea CLOSED - # 281: List of thumbnails verschluckt Seite, wenn odd-scan-position gesetzt ist
casties
parents: 612
diff changeset
1090 batch['nextStart'] = start + grpsize
480
50a28442f21c more new template stuff
casties
parents: 479
diff changeset
1091 else:
50a28442f21c more new template stuff
casties
parents: 479
diff changeset
1092 batch['nextStart'] = None
50a28442f21c more new template stuff
casties
parents: 479
diff changeset
1093
50a28442f21c more new template stuff
casties
parents: 479
diff changeset
1094 batch['pages'] = pages
571
f1906951be2a nicer batching of tocs
casties
parents: 568
diff changeset
1095 batch['first'] = minIdx
f1906951be2a nicer batching of tocs
casties
parents: 568
diff changeset
1096 batch['last'] = maxIdx
613
c57d80a649ea CLOSED - # 281: List of thumbnails verschluckt Seite, wenn odd-scan-position gesetzt ist
casties
parents: 612
diff changeset
1097 logging.debug("batch: %s"%repr(batch))
482
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1098 return batch
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1099
613
c57d80a649ea CLOSED - # 281: List of thumbnails verschluckt Seite, wenn odd-scan-position gesetzt ist
casties
parents: 612
diff changeset
1100
482
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1101 def getBatch(self, start=1, size=10, end=0, data=None, fullData=True):
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1102 """returns dict with information for one screenfull of data."""
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1103 batch = {}
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1104 if end == 0:
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1105 end = start + size
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1106
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1107 nb = int(math.ceil(end / float(size)))
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1108 # list of all batch start and end points
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1109 batches = []
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1110 for i in range(nb):
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1111 s = i * size + 1
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1112 e = min((i + 1) * size, end)
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1113 batches.append({'start':s, 'end':e})
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1114
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1115 batch['batches'] = batches
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1116 # list of elements in this batch
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1117 this = []
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1118 j = 0
526
3f375a048402 moved search and dict into separate layers.
casties
parents: 525
diff changeset
1119 for i in range(start, min(start+size, end+1)):
482
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1120 if data:
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1121 if fullData:
526
3f375a048402 moved search and dict into separate layers.
casties
parents: 525
diff changeset
1122 d = data.get(i, None)
482
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1123 else:
526
3f375a048402 moved search and dict into separate layers.
casties
parents: 525
diff changeset
1124 d = data.get(j, None)
482
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1125 j += 1
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1126
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1127 else:
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1128 d = i+1
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1129
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1130 this.append(d)
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1131
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1132 batch['this'] = this
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1133 if start > 1:
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1134 batch['prevStart'] = max(start - size, 1)
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1135 else:
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1136 batch['prevStart'] = None
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1137
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1138 if start + size < end:
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1139 batch['nextStart'] = start + size
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1140 else:
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1141 batch['nextStart'] = None
7ca8ac7db06e more new template stuff. more batching methods in documentViewer.
casties
parents: 480
diff changeset
1142
571
f1906951be2a nicer batching of tocs
casties
parents: 568
diff changeset
1143 batch['first'] = start
f1906951be2a nicer batching of tocs
casties
parents: 568
diff changeset
1144 batch['last'] = end
480
50a28442f21c more new template stuff
casties
parents: 479
diff changeset
1145 return batch
476
1d93a8cb2d8f more new template stuff
casties
parents: 475
diff changeset
1146
1d93a8cb2d8f more new template stuff
casties
parents: 475
diff changeset
1147
546
2928037f9a75 ASSIGNED - # 249: Annotations shared in groups
casties
parents: 543
diff changeset
1148 def getAnnotatorGroupsForUser(self, user, annotationServerUrl="http://tuxserve03.mpiwg-berlin.mpg.de/AnnotationManager"):
2928037f9a75 ASSIGNED - # 249: Annotations shared in groups
casties
parents: 543
diff changeset
1149 """returns list of groups {name:*, id:*} on the annotation server for the user"""
2928037f9a75 ASSIGNED - # 249: Annotations shared in groups
casties
parents: 543
diff changeset
1150 groups = []
623
6012fe93f78c better scheme-less URL code.
casties
parents: 622
diff changeset
1151 # add matching http(s) from our URL
6012fe93f78c better scheme-less URL code.
casties
parents: 622
diff changeset
1152 annotationServerUrl = sslifyUrl(annotationServerUrl, self)
622
bc68ca0d2c0a make annotationServerUrl work with protocol-relative URL (//).
casties
parents: 618
diff changeset
1153
546
2928037f9a75 ASSIGNED - # 249: Annotations shared in groups
casties
parents: 543
diff changeset
1154 groupsUrl = "%s/annotator/groups?user=%s"%(annotationServerUrl,user)
2928037f9a75 ASSIGNED - # 249: Annotations shared in groups
casties
parents: 543
diff changeset
1155 data = getHttpData(url=groupsUrl, noExceptions=True)
2928037f9a75 ASSIGNED - # 249: Annotations shared in groups
casties
parents: 543
diff changeset
1156 if data:
2928037f9a75 ASSIGNED - # 249: Annotations shared in groups
casties
parents: 543
diff changeset
1157 res = json.loads(data)
2928037f9a75 ASSIGNED - # 249: Annotations shared in groups
casties
parents: 543
diff changeset
1158 rows = res.get('rows', None)
2928037f9a75 ASSIGNED - # 249: Annotations shared in groups
casties
parents: 543
diff changeset
1159 if rows is None:
2928037f9a75 ASSIGNED - # 249: Annotations shared in groups
casties
parents: 543
diff changeset
1160 return groups
2928037f9a75 ASSIGNED - # 249: Annotations shared in groups
casties
parents: 543
diff changeset
1161 for r in rows:
2928037f9a75 ASSIGNED - # 249: Annotations shared in groups
casties
parents: 543
diff changeset
1162 groups.append({'id': r.get('id', None), 'name': r.get('name', None), 'uri': r.get('uri', None)})
2928037f9a75 ASSIGNED - # 249: Annotations shared in groups
casties
parents: 543
diff changeset
1163
2928037f9a75 ASSIGNED - # 249: Annotations shared in groups
casties
parents: 543
diff changeset
1164 return groups
2928037f9a75 ASSIGNED - # 249: Annotations shared in groups
casties
parents: 543
diff changeset
1165
626
7dafe8283312 make sslify accessible for templates.
casties
parents: 625
diff changeset
1166 def sslifyUrl(self, url, **args):
7dafe8283312 make sslify accessible for templates.
casties
parents: 625
diff changeset
1167 """returns URL with http or https"""
7dafe8283312 make sslify accessible for templates.
casties
parents: 625
diff changeset
1168 return sslifyUrl(url, **args)
546
2928037f9a75 ASSIGNED - # 249: Annotations shared in groups
casties
parents: 543
diff changeset
1169
463
89ad327b4bbd more renovation
casties
parents: 462
diff changeset
1170 security.declareProtected('View management screens','changeDocumentViewerForm')
89ad327b4bbd more renovation
casties
parents: 462
diff changeset
1171 changeDocumentViewerForm = PageTemplateFile('zpt/changeDocumentViewer', globals())
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
1172
526
3f375a048402 moved search and dict into separate layers.
casties
parents: 525
diff changeset
1173 def changeDocumentViewer(self,title="",digilibBaseUrl=None,thumbrows=2,thumbcols=5,authgroups='mpiwg',availableLayers=None,RESPONSE=None):
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
1174 """init document viewer"""
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
1175 self.title=title
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
1176 self.digilibBaseUrl = digilibBaseUrl
566
4a31608f8b0e more new MpiwgXmlTextServer.
casties
parents: 565
diff changeset
1177 self.digilibScalerUrl = digilibBaseUrl + '/servlet/Scaler'
4a31608f8b0e more new MpiwgXmlTextServer.
casties
parents: 565
diff changeset
1178 self.digilibViewerUrl = digilibBaseUrl + '/jquery/digilib.html'
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
1179 self.thumbrows = thumbrows
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
1180 self.thumbcols = thumbcols
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
1181 self.authgroups = [s.strip().lower() for s in authgroups.split(',')]
463
89ad327b4bbd more renovation
casties
parents: 462
diff changeset
1182 try:
89ad327b4bbd more renovation
casties
parents: 462
diff changeset
1183 # assume MetaDataFolder instance is called metadata
89ad327b4bbd more renovation
casties
parents: 462
diff changeset
1184 self.metadataService = getattr(self, 'metadata')
89ad327b4bbd more renovation
casties
parents: 462
diff changeset
1185 except Exception, e:
89ad327b4bbd more renovation
casties
parents: 462
diff changeset
1186 logging.error("Unable to find MetaDataFolder 'metadata': "+str(e))
526
3f375a048402 moved search and dict into separate layers.
casties
parents: 525
diff changeset
1187
3f375a048402 moved search and dict into separate layers.
casties
parents: 525
diff changeset
1188 self.setAvailableLayers(availableLayers)
463
89ad327b4bbd more renovation
casties
parents: 462
diff changeset
1189
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
1190 if RESPONSE is not None:
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
1191 RESPONSE.redirect('manage_main')
623
6012fe93f78c better scheme-less URL code.
casties
parents: 622
diff changeset
1192
0
dwinter
parents:
diff changeset
1193
dwinter
parents:
diff changeset
1194 def manage_AddDocumentViewerForm(self):
dwinter
parents:
diff changeset
1195 """add the viewer form"""
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
1196 pt=PageTemplateFile('zpt/addDocumentViewer', globals()).__of__(self)
0
dwinter
parents:
diff changeset
1197 return pt()
dwinter
parents:
diff changeset
1198
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
1199 def manage_AddDocumentViewer(self,id,imageScalerUrl="",textServerName="",title="",RESPONSE=None):
0
dwinter
parents:
diff changeset
1200 """add the viewer"""
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
1201 newObj=documentViewer(id,imageScalerUrl=imageScalerUrl,title=title,textServerName=textServerName)
0
dwinter
parents:
diff changeset
1202 self._setObject(id,newObj)
dwinter
parents:
diff changeset
1203
dwinter
parents:
diff changeset
1204 if RESPONSE is not None:
dwinter
parents:
diff changeset
1205 RESPONSE.redirect('manage_main')