annotate documentViewer.py @ 96:a679c8c7148d

getTranslate, getLemma two functions
author abukhman
date Wed, 21 Apr 2010 15:50:59 +0200
parents db6d594aa4d9
children 2b8fd19432fb
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
46
31059e3d9338 has now also a text mode viewMode=text
dwinter
parents: 45
diff changeset
1
0
dwinter
parents:
diff changeset
2 from OFS.Folder import Folder
dwinter
parents:
diff changeset
3 from Products.PageTemplates.ZopePageTemplate import ZopePageTemplate
52
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
4 from Products.PageTemplates.PageTemplateFile import PageTemplateFile
0
dwinter
parents:
diff changeset
5 from AccessControl import ClassSecurityInfo
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
6 from AccessControl import getSecurityManager
0
dwinter
parents:
diff changeset
7 from Globals import package_home
dwinter
parents:
diff changeset
8
dwinter
parents:
diff changeset
9 from Ft.Xml.Domlette import NonvalidatingReader
dwinter
parents:
diff changeset
10 from Ft.Xml.Domlette import PrettyPrint, Print
38
025d3b6cba51 fixes by dirk
casties
parents: 37
diff changeset
11 from Ft.Xml import EMPTY_NAMESPACE, Parse
0
dwinter
parents:
diff changeset
12
83
ec12a2440daa My last update Bukhman Andrey
abukhman
parents: 82
diff changeset
13
0
dwinter
parents:
diff changeset
14 import Ft.Xml.XPath
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
15 import cStringIO
83
ec12a2440daa My last update Bukhman Andrey
abukhman
parents: 82
diff changeset
16 import xmlrpclib
0
dwinter
parents:
diff changeset
17 import os.path
31
c6451e8d5d23 more small fixes - now version 0.2.2
casties
parents: 29
diff changeset
18 import sys
0
dwinter
parents:
diff changeset
19 import cgi
dwinter
parents:
diff changeset
20 import urllib
50
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
21 import logging
61
f3d2f240692c fixed bug in calculation of group numbers
casties
parents: 59
diff changeset
22 import math
52
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
23
46
31059e3d9338 has now also a text mode viewMode=text
dwinter
parents: 45
diff changeset
24 import urlparse
75
9673218e155b minorCVS: ----------------------------------------------------------------------
dwinter
parents: 74
diff changeset
25 from types import *
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
26
52
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
27 def logger(txt,method,txt2):
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
28 """logging"""
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
29 logging.info(txt+ txt2)
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
30
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
31
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
32 def getInt(number, default=0):
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
33 """returns always an int (0 in case of problems)"""
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
34 try:
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
35 return int(number)
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
36 except:
62
8a16ea8db858 fixed bug in getInt
casties
parents: 61
diff changeset
37 return int(default)
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
38
0
dwinter
parents:
diff changeset
39 def getTextFromNode(nodename):
46
31059e3d9338 has now also a text mode viewMode=text
dwinter
parents: 45
diff changeset
40 """get the cdata content of a node"""
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
41 if nodename is None:
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
42 return ""
0
dwinter
parents:
diff changeset
43 nodelist=nodename.childNodes
dwinter
parents:
diff changeset
44 rc = ""
dwinter
parents:
diff changeset
45 for node in nodelist:
dwinter
parents:
diff changeset
46 if node.nodeType == node.TEXT_NODE:
dwinter
parents:
diff changeset
47 rc = rc + node.data
dwinter
parents:
diff changeset
48 return rc
dwinter
parents:
diff changeset
49
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
50 def serializeNode(node, encoding='utf-8'):
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
51 """returns a string containing node as XML"""
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
52 buf = cStringIO.StringIO()
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
53 Print(node, stream=buf, encoding=encoding)
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
54 s = buf.getvalue()
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
55 buf.close()
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
56 return s
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
57
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
58
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
59 def getParentDir(path):
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
60 """returns pathname shortened by one"""
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
61 return '/'.join(path.split('/')[0:-1])
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
62
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
63
0
dwinter
parents:
diff changeset
64 import socket
dwinter
parents:
diff changeset
65
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
66 def urlopen(url,timeout=2):
0
dwinter
parents:
diff changeset
67 """urlopen mit timeout"""
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
68 socket.setdefaulttimeout(timeout)
0
dwinter
parents:
diff changeset
69 ret=urllib.urlopen(url)
dwinter
parents:
diff changeset
70 socket.setdefaulttimeout(5)
dwinter
parents:
diff changeset
71 return ret
dwinter
parents:
diff changeset
72
dwinter
parents:
diff changeset
73
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
74 ##
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
75 ## documentViewer class
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
76 ##
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
77 class documentViewer(Folder):
0
dwinter
parents:
diff changeset
78 """document viewer"""
50
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
79 #textViewerUrl="http://127.0.0.1:8080/HFQP/testXSLT/getPage?"
46
31059e3d9338 has now also a text mode viewMode=text
dwinter
parents: 45
diff changeset
80
0
dwinter
parents:
diff changeset
81 meta_type="Document viewer"
dwinter
parents:
diff changeset
82
dwinter
parents:
diff changeset
83 security=ClassSecurityInfo()
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
84 manage_options=Folder.manage_options+(
0
dwinter
parents:
diff changeset
85 {'label':'main config','action':'changeDocumentViewerForm'},
dwinter
parents:
diff changeset
86 )
dwinter
parents:
diff changeset
87
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
88 # templates and forms
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
89 viewer_main = PageTemplateFile('zpt/viewer_main', globals())
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
90 toc_thumbs = PageTemplateFile('zpt/toc_thumbs', globals())
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
91 toc_text = PageTemplateFile('zpt/toc_text', globals())
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
92 toc_figures = PageTemplateFile('zpt/toc_figures', globals())
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
93 page_main_images = PageTemplateFile('zpt/page_main_images', globals())
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
94 page_main_text = PageTemplateFile('zpt/page_main_text', globals())
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
95 page_main_text_dict = PageTemplateFile('zpt/page_main_text_dict', globals())
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
96 head_main = PageTemplateFile('zpt/head_main', globals())
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
97 docuviewer_css = PageTemplateFile('css/docuviewer.css', globals())
57
7cdb0fc34a92 added getInfo_xml method
casties
parents: 55
diff changeset
98 info_xml = PageTemplateFile('zpt/info_xml', globals())
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
99
68
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
100 thumbs_main_rss = PageTemplateFile('zpt/thumbs_main_rss', globals())
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
101 security.declareProtected('View management screens','changeDocumentViewerForm')
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
102 changeDocumentViewerForm = PageTemplateFile('zpt/changeDocumentViewer', globals())
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
103
0
dwinter
parents:
diff changeset
104
95
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
105 def __init__(self,id,imageScalerUrl=None,textServerName=None,title="",digilibBaseUrl=None,thumbcols=2,thumbrows=5,authgroups="mpiwg"):
0
dwinter
parents:
diff changeset
106 """init document viewer"""
dwinter
parents:
diff changeset
107 self.id=id
dwinter
parents:
diff changeset
108 self.title=title
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
109 self.thumbcols = thumbcols
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
110 self.thumbrows = thumbrows
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
111 # authgroups is list of authorized groups (delimited by ,)
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
112 self.authgroups = [s.strip().lower() for s in authgroups.split(',')]
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
113 # create template folder so we can always use template.something
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
114
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
115 templateFolder = Folder('template')
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
116 #self['template'] = templateFolder # Zope-2.12 style
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
117 self._setObject('template',templateFolder) # old style
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
118 try:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
119 from Products.XMLRpcTools.XMLRpcTools import XMLRpcServerProxy
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
120 xmlRpcClient = XMLRpcServerProxy(id='fulltextclient', serverUrl=textServerName, use_xmlrpc=False)
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
121 #templateFolder['fulltextclient'] = xmlRpcClient
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
122 templateFolder._setObject('fulltextclient',xmlRpcClient)
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
123 except Exception, e:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
124 logging.error("Unable to create XMLRpcTools for fulltextclient: "+str(e))
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
125 try:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
126 from Products.zogiLib.zogiLib import zogiLib
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
127 zogilib = zogiLib(id="zogilib", title="zogilib for docuviewer", dlServerURL=imageScalerUrl, layout="book")
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
128 #templateFolder['zogilib'] = zogilib
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
129 templateFolder._setObject('zogilib',zogilib)
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
130 except Exception, e:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
131 logging.error("Unable to create zogiLib for zogilib: "+str(e))
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
132
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
133
68
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
134 security.declareProtected('View','thumbs_rss')
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
135 def thumbs_rss(self,mode,url,viewMode="auto",start=None,pn=1):
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
136 '''
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
137 view it
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
138 @param mode: defines how to access the document behind url
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
139 @param url: url which contains display information
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
140 @param viewMode: if images display images, if text display text, default is images (text,images or auto)
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
141
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
142 '''
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
143 logging.debug("HHHHHHHHHHHHHH:load the rss")
68
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
144 logger("documentViewer (index)", logging.INFO, "mode: %s url:%s start:%s pn:%s"%(mode,url,start,pn))
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
145
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
146 if not hasattr(self, 'template'):
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
147 # create template folder if it doesn't exist
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
148 self.manage_addFolder('template')
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
149
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
150 if not self.digilibBaseUrl:
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
151 self.digilibBaseUrl = self.findDigilibUrl() or "http://nausikaa.mpiwg-berlin.mpg.de/digitallibrary"
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
152
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
153 docinfo = self.getDocinfo(mode=mode,url=url)
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
154 pageinfo = self.getPageinfo(start=start,current=pn,docinfo=docinfo)
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
155 pt = getattr(self.template, 'thumbs_main_rss')
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
156
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
157 if viewMode=="auto": # automodus gewaehlt
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
158 if docinfo.get("textURL",'') and self.textViewerUrl: #texturl gesetzt und textViewer konfiguriert
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
159 viewMode="text"
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
160 else:
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
161 viewMode="images"
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
162
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
163 return pt(docinfo=docinfo,pageinfo=pageinfo,viewMode=viewMode)
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
164
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
165 security.declareProtected('View','index_html')
95
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
166 def index_html(self,url,mode="texttool",viewMode="auto",tocMode="thumbs",start=None,pn=1,mk=None, query=None, querySearch=None):
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
167 '''
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
168 view it
57
7cdb0fc34a92 added getInfo_xml method
casties
parents: 55
diff changeset
169 @param mode: defines how to access the document behind url
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
170 @param url: url which contains display information
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
171 @param viewMode: if images display images, if text display text, default is auto (text,images or auto)
95
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
172 @param tocMode: type of 'table of contents' for navigation (thumbs, text, figures, search)
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
173 @param querySearch: type of different search modes (fulltext, fulltextMorph, xpath, xquery, ftIndex, ftIndexMorph)
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
174 '''
0
dwinter
parents:
diff changeset
175
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
176 logging.debug("documentViewer (index) mode: %s url:%s start:%s pn:%s"%(mode,url,start,pn))
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
177
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
178 if not hasattr(self, 'template'):
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
179 # this won't work
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
180 logging.error("template folder missing!")
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
181 return "ERROR: template folder missing!"
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
182
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
183 if not getattr(self, 'digilibBaseUrl', None):
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
184 self.digilibBaseUrl = self.findDigilibUrl() or "http://nausikaa.mpiwg-berlin.mpg.de/digitallibrary"
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
185
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
186 docinfo = self.getDocinfo(mode=mode,url=url)
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
187 pageinfo = self.getPageinfo(start=start,current=pn,docinfo=docinfo,viewMode=viewMode,tocMode=tocMode)
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
188 if tocMode != "thumbs":
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
189 # get table of contents
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
190 docinfo = self.getToc(mode=tocMode, docinfo=docinfo)
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
191
51
c5d3aabbf61b textviewer now integrated, new modus auto introduced as standard for viewing
dwinter
parents: 50
diff changeset
192 if viewMode=="auto": # automodus gewaehlt
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
193 if docinfo.get("textURL",''): #texturl gesetzt und textViewer konfiguriert
51
c5d3aabbf61b textviewer now integrated, new modus auto introduced as standard for viewing
dwinter
parents: 50
diff changeset
194 viewMode="text"
c5d3aabbf61b textviewer now integrated, new modus auto introduced as standard for viewing
dwinter
parents: 50
diff changeset
195 else:
c5d3aabbf61b textviewer now integrated, new modus auto introduced as standard for viewing
dwinter
parents: 50
diff changeset
196 viewMode="images"
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
197
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
198 pt = getattr(self.template, 'viewer_main')
75
9673218e155b minorCVS: ----------------------------------------------------------------------
dwinter
parents: 74
diff changeset
199 return pt(docinfo=docinfo,pageinfo=pageinfo,viewMode=viewMode,mk=self.generateMarks(mk))
0
dwinter
parents:
diff changeset
200
74
dwinter
parents: 73
diff changeset
201 def generateMarks(self,mk):
dwinter
parents: 73
diff changeset
202 ret=""
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
203 if mk is None:
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
204 return ""
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
205 if type(mk) is not ListType:
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
206 mk=[mk]
74
dwinter
parents: 73
diff changeset
207 for m in mk:
75
9673218e155b minorCVS: ----------------------------------------------------------------------
dwinter
parents: 74
diff changeset
208 ret+="mk=%s"%m
74
dwinter
parents: 73
diff changeset
209 return ret
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
210
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
211
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
212 def findDigilibUrl(self):
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
213 """try to get the digilib URL from zogilib"""
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
214 url = self.template.zogilib.getDLBaseUrl()
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
215 return url
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
216
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
217 def getStyle(self, idx, selected, style=""):
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
218 """returns a string with the given style and append 'sel' if path == selected."""
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
219 #logger("documentViewer (getstyle)", logging.INFO, "idx: %s selected: %s style: %s"%(idx,selected,style))
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
220 if idx == selected:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
221 return style + 'sel'
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
222 else:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
223 return style
74
dwinter
parents: 73
diff changeset
224
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
225 def getLink(self,param=None,val=None):
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
226 """link to documentviewer with parameter param set to val"""
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
227 params=self.REQUEST.form.copy()
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
228 if param is not None:
31
c6451e8d5d23 more small fixes - now version 0.2.2
casties
parents: 29
diff changeset
229 if val is None:
c6451e8d5d23 more small fixes - now version 0.2.2
casties
parents: 29
diff changeset
230 if params.has_key(param):
c6451e8d5d23 more small fixes - now version 0.2.2
casties
parents: 29
diff changeset
231 del params[param]
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
232 else:
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
233 params[param] = str(val)
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
234
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
235 if params.get("mode", None) == "filepath": #wenn beim erst Aufruf filepath gesetzt wurde aendere das nun zu imagepath
78
70ab234a18dc bugs in filepath mode fixes
dwinter
parents: 75
diff changeset
236 params["mode"] = "imagepath"
70ab234a18dc bugs in filepath mode fixes
dwinter
parents: 75
diff changeset
237 params["url"] = getParentDir(params["url"])
31
c6451e8d5d23 more small fixes - now version 0.2.2
casties
parents: 29
diff changeset
238
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
239 # quote values and assemble into query string
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
240 ps = "&".join(["%s=%s"%(k,urllib.quote(v)) for (k, v) in params.items()])
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
241 url=self.REQUEST['URL1']+"?"+ps
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
242 return url
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
243
68
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
244 def getLinkAmp(self,param=None,val=None):
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
245 """link to documentviewer with parameter param set to val"""
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
246 params=self.REQUEST.form.copy()
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
247 if param is not None:
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
248 if val is None:
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
249 if params.has_key(param):
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
250 del params[param]
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
251 else:
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
252 params[param] = str(val)
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
253
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
254 # quote values and assemble into query string
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
255 logging.info("XYXXXXX: %s"%repr(params.items()))
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
256 ps = "&".join(["%s=%s"%(k,urllib.quote(v)) for (k, v) in params.items()])
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
257 url=self.REQUEST['URL1']+"?"+ps
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
258 return url
81
fae97f071724 fixed problem with info.xml when url without index.meta
casties
parents: 79
diff changeset
259
57
7cdb0fc34a92 added getInfo_xml method
casties
parents: 55
diff changeset
260 def getInfo_xml(self,url,mode):
7cdb0fc34a92 added getInfo_xml method
casties
parents: 55
diff changeset
261 """returns info about the document as XML"""
7cdb0fc34a92 added getInfo_xml method
casties
parents: 55
diff changeset
262
7cdb0fc34a92 added getInfo_xml method
casties
parents: 55
diff changeset
263 if not self.digilibBaseUrl:
7cdb0fc34a92 added getInfo_xml method
casties
parents: 55
diff changeset
264 self.digilibBaseUrl = self.findDigilibUrl() or "http://nausikaa.mpiwg-berlin.mpg.de/digitallibrary"
7cdb0fc34a92 added getInfo_xml method
casties
parents: 55
diff changeset
265
7cdb0fc34a92 added getInfo_xml method
casties
parents: 55
diff changeset
266 docinfo = self.getDocinfo(mode=mode,url=url)
7cdb0fc34a92 added getInfo_xml method
casties
parents: 55
diff changeset
267 pt = getattr(self.template, 'info_xml')
7cdb0fc34a92 added getInfo_xml method
casties
parents: 55
diff changeset
268 return pt(docinfo=docinfo)
7cdb0fc34a92 added getInfo_xml method
casties
parents: 55
diff changeset
269
0
dwinter
parents:
diff changeset
270
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
271 def isAccessible(self, docinfo):
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
272 """returns if access to the resource is granted"""
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
273 access = docinfo.get('accessType', None)
52
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
274 logger("documentViewer (accessOK)", logging.INFO, "access type %s"%access)
45
0391fe75aef3 fixed handling of documents with missing access tag
casties
parents: 43
diff changeset
275 if access is not None and access == 'free':
52
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
276 logger("documentViewer (accessOK)", logging.INFO, "access is free")
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
277 return True
45
0391fe75aef3 fixed handling of documents with missing access tag
casties
parents: 43
diff changeset
278 elif access is None or access in self.authgroups:
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
279 # only local access -- only logged in users
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
280 user = getSecurityManager().getUser()
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
281 if user is not None:
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
282 #print "user: ", user
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
283 return (user.getUserName() != "Anonymous User")
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
284 else:
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
285 return False
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
286
52
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
287 logger("documentViewer (accessOK)", logging.INFO, "unknown access type %s"%access)
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
288 return False
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
289
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
290
73
dwinter
parents: 71
diff changeset
291 def getDirinfoFromDigilib(self,path,docinfo=None,cut=0):
29
e1bed068b351 small fixes
casties
parents: 28
diff changeset
292 """gibt param von dlInfo aus"""
40
749ee5389892 try to ignore superfluous /mpiwg/online in urls
casties
parents: 39
diff changeset
293 num_retries = 3
31
c6451e8d5d23 more small fixes - now version 0.2.2
casties
parents: 29
diff changeset
294 if docinfo is None:
c6451e8d5d23 more small fixes - now version 0.2.2
casties
parents: 29
diff changeset
295 docinfo = {}
73
dwinter
parents: 71
diff changeset
296
dwinter
parents: 71
diff changeset
297 for x in range(cut):
78
70ab234a18dc bugs in filepath mode fixes
dwinter
parents: 75
diff changeset
298
73
dwinter
parents: 71
diff changeset
299 path=getParentDir(path)
78
70ab234a18dc bugs in filepath mode fixes
dwinter
parents: 75
diff changeset
300
40
749ee5389892 try to ignore superfluous /mpiwg/online in urls
casties
parents: 39
diff changeset
301 infoUrl=self.digilibBaseUrl+"/dirInfo-xml.jsp?mo=dir&fn="+path
29
e1bed068b351 small fixes
casties
parents: 28
diff changeset
302
52
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
303 logger("documentViewer (getparamfromdigilib)", logging.INFO, "dirInfo from %s"%(infoUrl))
29
e1bed068b351 small fixes
casties
parents: 28
diff changeset
304
40
749ee5389892 try to ignore superfluous /mpiwg/online in urls
casties
parents: 39
diff changeset
305 for cnt in range(num_retries):
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
306 try:
40
749ee5389892 try to ignore superfluous /mpiwg/online in urls
casties
parents: 39
diff changeset
307 # dom = NonvalidatingReader.parseUri(imageUrl)
749ee5389892 try to ignore superfluous /mpiwg/online in urls
casties
parents: 39
diff changeset
308 txt=urllib.urlopen(infoUrl).read()
749ee5389892 try to ignore superfluous /mpiwg/online in urls
casties
parents: 39
diff changeset
309 dom = Parse(txt)
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
310 break
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
311 except:
52
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
312 logger("documentViewer (getdirinfofromdigilib)", logging.ERROR, "error reading %s (try %d)"%(infoUrl,cnt))
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
313 else:
40
749ee5389892 try to ignore superfluous /mpiwg/online in urls
casties
parents: 39
diff changeset
314 raise IOError("Unable to get dir-info from %s"%(infoUrl))
29
e1bed068b351 small fixes
casties
parents: 28
diff changeset
315
37
ead830ce45d6 better error messages
casties
parents: 35
diff changeset
316 sizes=dom.xpath("//dir/size")
52
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
317 logger("documentViewer (getparamfromdigilib)", logging.INFO, "dirInfo:size"%sizes)
29
e1bed068b351 small fixes
casties
parents: 28
diff changeset
318
37
ead830ce45d6 better error messages
casties
parents: 35
diff changeset
319 if sizes:
ead830ce45d6 better error messages
casties
parents: 35
diff changeset
320 docinfo['numPages'] = int(getTextFromNode(sizes[0]))
31
c6451e8d5d23 more small fixes - now version 0.2.2
casties
parents: 29
diff changeset
321 else:
c6451e8d5d23 more small fixes - now version 0.2.2
casties
parents: 29
diff changeset
322 docinfo['numPages'] = 0
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
323
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
324 # TODO: produce and keep list of image names and numbers
31
c6451e8d5d23 more small fixes - now version 0.2.2
casties
parents: 29
diff changeset
325
c6451e8d5d23 more small fixes - now version 0.2.2
casties
parents: 29
diff changeset
326 return docinfo
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
327
29
e1bed068b351 small fixes
casties
parents: 28
diff changeset
328
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
329 def getIndexMeta(self, url):
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
330 """returns dom of index.meta document at url"""
39
1dd90aabd366 added retry when reading index meta from texter applet
casties
parents: 38
diff changeset
331 num_retries = 3
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
332 dom = None
39
1dd90aabd366 added retry when reading index meta from texter applet
casties
parents: 38
diff changeset
333 metaUrl = None
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
334 if url.startswith("http://"):
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
335 # real URL
39
1dd90aabd366 added retry when reading index meta from texter applet
casties
parents: 38
diff changeset
336 metaUrl = url
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
337 else:
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
338 # online path
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
339 server=self.digilibBaseUrl+"/servlet/Texter?fn="
40
749ee5389892 try to ignore superfluous /mpiwg/online in urls
casties
parents: 39
diff changeset
340 metaUrl=server+url.replace("/mpiwg/online","")
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
341 if not metaUrl.endswith("index.meta"):
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
342 metaUrl += "/index.meta"
75
9673218e155b minorCVS: ----------------------------------------------------------------------
dwinter
parents: 74
diff changeset
343 logging.debug("METAURL: %s"%metaUrl)
40
749ee5389892 try to ignore superfluous /mpiwg/online in urls
casties
parents: 39
diff changeset
344 for cnt in range(num_retries):
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
345 try:
39
1dd90aabd366 added retry when reading index meta from texter applet
casties
parents: 38
diff changeset
346 # patch dirk encoding fehler treten dann nicht mehr auf
38
025d3b6cba51 fixes by dirk
casties
parents: 37
diff changeset
347 # dom = NonvalidatingReader.parseUri(metaUrl)
39
1dd90aabd366 added retry when reading index meta from texter applet
casties
parents: 38
diff changeset
348 txt=urllib.urlopen(metaUrl).read()
1dd90aabd366 added retry when reading index meta from texter applet
casties
parents: 38
diff changeset
349 dom = Parse(txt)
40
749ee5389892 try to ignore superfluous /mpiwg/online in urls
casties
parents: 39
diff changeset
350 break
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
351 except:
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
352 logger("ERROR documentViewer (getIndexMeta)", logging.INFO,"%s (%s)"%sys.exc_info()[0:2])
39
1dd90aabd366 added retry when reading index meta from texter applet
casties
parents: 38
diff changeset
353
1dd90aabd366 added retry when reading index meta from texter applet
casties
parents: 38
diff changeset
354 if dom is None:
1dd90aabd366 added retry when reading index meta from texter applet
casties
parents: 38
diff changeset
355 raise IOError("Unable to read index meta from %s"%(url))
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
356
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
357 return dom
50
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
358
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
359 def getPresentationInfoXML(self, url):
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
360 """returns dom of info.xml document at url"""
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
361 num_retries = 3
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
362 dom = None
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
363 metaUrl = None
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
364 if url.startswith("http://"):
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
365 # real URL
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
366 metaUrl = url
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
367 else:
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
368 # online path
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
369 server=self.digilibBaseUrl+"/servlet/Texter?fn="
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
370 metaUrl=server+url.replace("/mpiwg/online","")
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
371
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
372 for cnt in range(num_retries):
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
373 try:
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
374 # patch dirk encoding fehler treten dann nicht mehr auf
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
375 # dom = NonvalidatingReader.parseUri(metaUrl)
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
376 txt=urllib.urlopen(metaUrl).read()
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
377 dom = Parse(txt)
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
378 break
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
379 except:
52
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
380 logger("ERROR documentViewer (getPresentationInfoXML)", logging.INFO,"%s (%s)"%sys.exc_info()[0:2])
50
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
381
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
382 if dom is None:
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
383 raise IOError("Unable to read infoXMLfrom %s"%(url))
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
384
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
385 return dom
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
386
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
387
70
0049d64aa464 filepath introduced
dwinter
parents: 68
diff changeset
388 def getAuthinfoFromIndexMeta(self,path,docinfo=None,dom=None,cut=0):
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
389 """gets authorization info from the index.meta file at path or given by dom"""
52
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
390 logger("documentViewer (getauthinfofromindexmeta)", logging.INFO,"path: %s"%(path))
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
391
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
392 access = None
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
393
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
394 if docinfo is None:
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
395 docinfo = {}
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
396
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
397 if dom is None:
78
70ab234a18dc bugs in filepath mode fixes
dwinter
parents: 75
diff changeset
398 for x in range(cut):
70
0049d64aa464 filepath introduced
dwinter
parents: 68
diff changeset
399 path=getParentDir(path)
0049d64aa464 filepath introduced
dwinter
parents: 68
diff changeset
400 dom = self.getIndexMeta(path)
46
31059e3d9338 has now also a text mode viewMode=text
dwinter
parents: 45
diff changeset
401
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
402 acctype = dom.xpath("//access-conditions/access/@type")
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
403 if acctype and (len(acctype)>0):
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
404 access=acctype[0].value
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
405 if access in ['group', 'institution']:
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
406 access = getTextFromNode(dom.xpath("//access-conditions/access/name")[0]).lower()
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
407
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
408 docinfo['accessType'] = access
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
409 return docinfo
29
e1bed068b351 small fixes
casties
parents: 28
diff changeset
410
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
411
70
0049d64aa464 filepath introduced
dwinter
parents: 68
diff changeset
412 def getBibinfoFromIndexMeta(self,path,docinfo=None,dom=None,cut=0):
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
413 """gets bibliographical info from the index.meta file at path or given by dom"""
59
996b61d71351 added all fields from bib tag to docinfo
casties
parents: 57
diff changeset
414 logging.debug("documentViewer (getbibinfofromindexmeta) path: %s"%(path))
20
9884703dae70 new modi
dwinter
parents: 0
diff changeset
415
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
416 if docinfo is None:
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
417 docinfo = {}
78
70ab234a18dc bugs in filepath mode fixes
dwinter
parents: 75
diff changeset
418
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
419 if dom is None:
78
70ab234a18dc bugs in filepath mode fixes
dwinter
parents: 75
diff changeset
420 for x in range(cut):
70
0049d64aa464 filepath introduced
dwinter
parents: 68
diff changeset
421 path=getParentDir(path)
0049d64aa464 filepath introduced
dwinter
parents: 68
diff changeset
422 dom = self.getIndexMeta(path)
79
df6952ac93e9 bug in getDocInforFromImagePath, relative lage der index.meta zu path war falsch.
dwinter
parents: 78
diff changeset
423
df6952ac93e9 bug in getDocInforFromImagePath, relative lage der index.meta zu path war falsch.
dwinter
parents: 78
diff changeset
424 logging.debug("documentViewer (getbibinfofromindexmeta cutted) path: %s"%(path))
59
996b61d71351 added all fields from bib tag to docinfo
casties
parents: 57
diff changeset
425 # put in all raw bib fields as dict "bib"
996b61d71351 added all fields from bib tag to docinfo
casties
parents: 57
diff changeset
426 bib = dom.xpath("//bib/*")
996b61d71351 added all fields from bib tag to docinfo
casties
parents: 57
diff changeset
427 if bib and len(bib)>0:
996b61d71351 added all fields from bib tag to docinfo
casties
parents: 57
diff changeset
428 bibinfo = {}
996b61d71351 added all fields from bib tag to docinfo
casties
parents: 57
diff changeset
429 for e in bib:
996b61d71351 added all fields from bib tag to docinfo
casties
parents: 57
diff changeset
430 bibinfo[e.localName] = getTextFromNode(e)
996b61d71351 added all fields from bib tag to docinfo
casties
parents: 57
diff changeset
431 docinfo['bib'] = bibinfo
996b61d71351 added all fields from bib tag to docinfo
casties
parents: 57
diff changeset
432
996b61d71351 added all fields from bib tag to docinfo
casties
parents: 57
diff changeset
433 # extract some fields (author, title, year) according to their mapping
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
434 metaData=self.metadata.main.meta.bib
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
435 bibtype=dom.xpath("//bib/@type")
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
436 if bibtype and (len(bibtype)>0):
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
437 bibtype=bibtype[0].value
20
9884703dae70 new modi
dwinter
parents: 0
diff changeset
438 else:
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
439 bibtype="generic"
59
996b61d71351 added all fields from bib tag to docinfo
casties
parents: 57
diff changeset
440
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
441 bibtype=bibtype.replace("-"," ") # wrong typesiin index meta "-" instead of " " (not wrong! ROC)
59
996b61d71351 added all fields from bib tag to docinfo
casties
parents: 57
diff changeset
442 docinfo['bib_type'] = bibtype
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
443 bibmap=metaData.generateMappingForType(bibtype)
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
444 # if there is no mapping bibmap is empty (mapping sometimes has empty fields)
31
c6451e8d5d23 more small fixes - now version 0.2.2
casties
parents: 29
diff changeset
445 if len(bibmap) > 0 and len(bibmap['author'][0]) > 0:
63
4a17b755bfc7 added more try/excepts to bib-meta reading code
casties
parents: 62
diff changeset
446 try:
4a17b755bfc7 added more try/excepts to bib-meta reading code
casties
parents: 62
diff changeset
447 docinfo['author']=getTextFromNode(dom.xpath("//bib/%s"%bibmap['author'][0])[0])
4a17b755bfc7 added more try/excepts to bib-meta reading code
casties
parents: 62
diff changeset
448 except: pass
4a17b755bfc7 added more try/excepts to bib-meta reading code
casties
parents: 62
diff changeset
449 try:
4a17b755bfc7 added more try/excepts to bib-meta reading code
casties
parents: 62
diff changeset
450 docinfo['title']=getTextFromNode(dom.xpath("//bib/%s"%bibmap['title'][0])[0])
4a17b755bfc7 added more try/excepts to bib-meta reading code
casties
parents: 62
diff changeset
451 except: pass
4a17b755bfc7 added more try/excepts to bib-meta reading code
casties
parents: 62
diff changeset
452 try:
4a17b755bfc7 added more try/excepts to bib-meta reading code
casties
parents: 62
diff changeset
453 docinfo['year']=getTextFromNode(dom.xpath("//bib/%s"%bibmap['year'][0])[0])
4a17b755bfc7 added more try/excepts to bib-meta reading code
casties
parents: 62
diff changeset
454 except: pass
59
996b61d71351 added all fields from bib tag to docinfo
casties
parents: 57
diff changeset
455 logging.debug("documentViewer (getbibinfofromindexmeta) using mapping for %s"%bibtype)
52
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
456 try:
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
457 docinfo['lang']=getTextFromNode(dom.xpath("//bib/lang")[0])
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
458 except:
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
459 docinfo['lang']=''
59
996b61d71351 added all fields from bib tag to docinfo
casties
parents: 57
diff changeset
460
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
461 return docinfo
83
ec12a2440daa My last update Bukhman Andrey
abukhman
parents: 82
diff changeset
462
ec12a2440daa My last update Bukhman Andrey
abukhman
parents: 82
diff changeset
463
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
464 def getDocinfoFromTextTool(self, url, dom=None, docinfo=None):
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
465 """parse texttool tag in index meta"""
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
466 logger("documentViewer (getdocinfofromtexttool)", logging.INFO, "url: %s" % (url))
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
467 if docinfo is None:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
468 docinfo = {}
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
469 if docinfo.get('lang', None) is None:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
470 docinfo['lang'] = '' # default keine Sprache gesetzt
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
471 if dom is None:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
472 dom = self.getIndexMeta(url)
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
473
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
474 archivePath = None
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
475 archiveName = None
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
476
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
477 archiveNames = dom.xpath("//resource/name")
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
478 if archiveNames and (len(archiveNames) > 0):
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
479 archiveName = getTextFromNode(archiveNames[0])
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
480 else:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
481 logger("documentViewer (getdocinfofromtexttool)", logging.WARNING, "resource/name missing in: %s" % (url))
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
482
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
483 archivePaths = dom.xpath("//resource/archive-path")
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
484 if archivePaths and (len(archivePaths) > 0):
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
485 archivePath = getTextFromNode(archivePaths[0])
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
486 # clean up archive path
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
487 if archivePath[0] != '/':
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
488 archivePath = '/' + archivePath
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
489 if archiveName and (not archivePath.endswith(archiveName)):
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
490 archivePath += "/" + archiveName
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
491 else:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
492 # try to get archive-path from url
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
493 logger("documentViewer (getdocinfofromtexttool)", logging.WARNING, "resource/archive-path missing in: %s" % (url))
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
494 if (not url.startswith('http')):
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
495 archivePath = url.replace('index.meta', '')
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
496
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
497 if archivePath is None:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
498 # we balk without archive-path
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
499 raise IOError("Missing archive-path (for text-tool) in %s" % (url))
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
500
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
501 imageDirs = dom.xpath("//texttool/image")
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
502 if imageDirs and (len(imageDirs) > 0):
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
503 imageDir = getTextFromNode(imageDirs[0])
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
504
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
505 else:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
506 # we balk with no image tag / not necessary anymore because textmode is now standard
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
507 #raise IOError("No text-tool info in %s"%(url))
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
508 imageDir = ""
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
509 #xquery="//pb"
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
510 docinfo['imagePath'] = "" # keine Bilder
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
511 docinfo['imageURL'] = ""
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
512
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
513 if imageDir and archivePath:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
514 #print "image: ", imageDir, " archivepath: ", archivePath
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
515 imageDir = os.path.join(archivePath, imageDir)
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
516 imageDir = imageDir.replace("/mpiwg/online", '')
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
517 docinfo = self.getDirinfoFromDigilib(imageDir, docinfo=docinfo)
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
518 docinfo['imagePath'] = imageDir
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
519
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
520 docinfo['imageURL'] = self.digilibBaseUrl + "/servlet/Scaler?fn=" + imageDir
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
521
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
522 viewerUrls = dom.xpath("//texttool/digiliburlprefix")
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
523 if viewerUrls and (len(viewerUrls) > 0):
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
524 viewerUrl = getTextFromNode(viewerUrls[0])
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
525 docinfo['viewerURL'] = viewerUrl
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
526
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
527 textUrls = dom.xpath("//texttool/text")
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
528 if textUrls and (len(textUrls) > 0):
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
529 textUrl = getTextFromNode(textUrls[0])
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
530 if urlparse.urlparse(textUrl)[0] == "": #keine url
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
531 textUrl = os.path.join(archivePath, textUrl)
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
532 # fix URLs starting with /mpiwg/online
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
533 if textUrl.startswith("/mpiwg/online"):
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
534 textUrl = textUrl.replace("/mpiwg/online", '', 1)
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
535
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
536 docinfo['textURL'] = textUrl
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
537
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
538 textUrls = dom.xpath("//texttool/text-url-path")
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
539 if textUrls and (len(textUrls) > 0):
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
540 textUrl = getTextFromNode(textUrls[0])
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
541 docinfo['textURLPath'] = textUrl
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
542
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
543 presentationUrls = dom.xpath("//texttool/presentation")
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
544 docinfo = self.getBibinfoFromIndexMeta(url, docinfo=docinfo, dom=dom) # get info von bib tag
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
545
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
546 if presentationUrls and (len(presentationUrls) > 0): # ueberschreibe diese durch presentation informationen
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
547 # presentation url ergiebt sich ersetzen von index.meta in der url der fuer die Metadaten
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
548 # durch den relativen Pfad auf die presentation infos
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
549 presentationPath = getTextFromNode(presentationUrls[0])
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
550 if url.endswith("index.meta"):
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
551 presentationUrl = url.replace('index.meta', presentationPath)
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
552 else:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
553 presentationUrl = url + "/" + presentationPath
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
554 docinfo = self.getNumPages(docinfo) #im moment einfach auf eins setzen, navigation ueber die thumbs geht natuerlich nicht
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
555 docinfo = self.getBibinfoFromTextToolPresentation(presentationUrl, docinfo=docinfo, dom=dom)
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
556
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
557 docinfo = self.getAuthinfoFromIndexMeta(url, docinfo=docinfo, dom=dom) # get access info
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
558
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
559 return docinfo
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
560
50
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
561
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
562 def getBibinfoFromTextToolPresentation(self,url,docinfo=None,dom=None):
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
563 """gets the bibliographical information from the preseantion entry in texttools
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
564 """
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
565 dom=self.getPresentationInfoXML(url)
62
8a16ea8db858 fixed bug in getInt
casties
parents: 61
diff changeset
566 try:
8a16ea8db858 fixed bug in getInt
casties
parents: 61
diff changeset
567 docinfo['author']=getTextFromNode(dom.xpath("//author")[0])
8a16ea8db858 fixed bug in getInt
casties
parents: 61
diff changeset
568 except:
8a16ea8db858 fixed bug in getInt
casties
parents: 61
diff changeset
569 pass
8a16ea8db858 fixed bug in getInt
casties
parents: 61
diff changeset
570 try:
8a16ea8db858 fixed bug in getInt
casties
parents: 61
diff changeset
571 docinfo['title']=getTextFromNode(dom.xpath("//title")[0])
8a16ea8db858 fixed bug in getInt
casties
parents: 61
diff changeset
572 except:
8a16ea8db858 fixed bug in getInt
casties
parents: 61
diff changeset
573 pass
8a16ea8db858 fixed bug in getInt
casties
parents: 61
diff changeset
574 try:
8a16ea8db858 fixed bug in getInt
casties
parents: 61
diff changeset
575 docinfo['year']=getTextFromNode(dom.xpath("//date")[0])
8a16ea8db858 fixed bug in getInt
casties
parents: 61
diff changeset
576 except:
8a16ea8db858 fixed bug in getInt
casties
parents: 61
diff changeset
577 pass
50
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
578 return docinfo
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
579
70
0049d64aa464 filepath introduced
dwinter
parents: 68
diff changeset
580 def getDocinfoFromImagePath(self,path,docinfo=None,cut=0):
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
581 """path ist the path to the images it assumes that the index.meta file is one level higher."""
52
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
582 logger("documentViewer (getdocinfofromimagepath)", logging.INFO,"path: %s"%(path))
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
583 if docinfo is None:
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
584 docinfo = {}
29
e1bed068b351 small fixes
casties
parents: 28
diff changeset
585 path=path.replace("/mpiwg/online","")
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
586 docinfo['imagePath'] = path
73
dwinter
parents: 71
diff changeset
587 docinfo=self.getDirinfoFromDigilib(path,docinfo=docinfo,cut=cut)
78
70ab234a18dc bugs in filepath mode fixes
dwinter
parents: 75
diff changeset
588
79
df6952ac93e9 bug in getDocInforFromImagePath, relative lage der index.meta zu path war falsch.
dwinter
parents: 78
diff changeset
589 pathorig=path
78
70ab234a18dc bugs in filepath mode fixes
dwinter
parents: 75
diff changeset
590 for x in range(cut):
70ab234a18dc bugs in filepath mode fixes
dwinter
parents: 75
diff changeset
591 path=getParentDir(path)
70ab234a18dc bugs in filepath mode fixes
dwinter
parents: 75
diff changeset
592 logging.error("PATH:"+path)
31
c6451e8d5d23 more small fixes - now version 0.2.2
casties
parents: 29
diff changeset
593 imageUrl=self.digilibBaseUrl+"/servlet/Scaler?fn="+path
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
594 docinfo['imageURL'] = imageUrl
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
595
79
df6952ac93e9 bug in getDocInforFromImagePath, relative lage der index.meta zu path war falsch.
dwinter
parents: 78
diff changeset
596 #path ist the path to the images it assumes that the index.meta file is one level higher.
df6952ac93e9 bug in getDocInforFromImagePath, relative lage der index.meta zu path war falsch.
dwinter
parents: 78
diff changeset
597 docinfo = self.getBibinfoFromIndexMeta(pathorig,docinfo=docinfo,cut=cut+1)
df6952ac93e9 bug in getDocInforFromImagePath, relative lage der index.meta zu path war falsch.
dwinter
parents: 78
diff changeset
598 docinfo = self.getAuthinfoFromIndexMeta(pathorig,docinfo=docinfo,cut=cut+1)
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
599 return docinfo
20
9884703dae70 new modi
dwinter
parents: 0
diff changeset
600
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
601
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
602 def getDocinfo(self, mode, url):
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
603 """returns docinfo depending on mode"""
52
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
604 logger("documentViewer (getdocinfo)", logging.INFO,"mode: %s, url: %s"%(mode,url))
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
605 # look for cached docinfo in session
51
c5d3aabbf61b textviewer now integrated, new modus auto introduced as standard for viewing
dwinter
parents: 50
diff changeset
606 if self.REQUEST.SESSION.has_key('docinfo'):
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
607 docinfo = self.REQUEST.SESSION['docinfo']
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
608 # check if its still current
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
609 if docinfo is not None and docinfo.get('mode') == mode and docinfo.get('url') == url:
52
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
610 logger("documentViewer (getdocinfo)", logging.INFO,"docinfo in session: %s"%docinfo)
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
611 return docinfo
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
612 # new docinfo
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
613 docinfo = {'mode': mode, 'url': url}
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
614 if mode=="texttool": #index.meta with texttool information
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
615 docinfo = self.getDocinfoFromTextTool(url, docinfo=docinfo)
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
616 elif mode=="imagepath":
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
617 docinfo = self.getDocinfoFromImagePath(url, docinfo=docinfo)
70
0049d64aa464 filepath introduced
dwinter
parents: 68
diff changeset
618 elif mode=="filepath":
75
9673218e155b minorCVS: ----------------------------------------------------------------------
dwinter
parents: 74
diff changeset
619 docinfo = self.getDocinfoFromImagePath(url, docinfo=docinfo,cut=1)
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
620 else:
52
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
621 logger("documentViewer (getdocinfo)", logging.ERROR,"unknown mode!")
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
622 raise ValueError("Unknown mode %s! Has to be one of 'texttool','imagepath','filepath'."%(mode))
37
ead830ce45d6 better error messages
casties
parents: 35
diff changeset
623
52
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
624 logger("documentViewer (getdocinfo)", logging.INFO,"docinfo: %s"%docinfo)
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
625 self.REQUEST.SESSION['docinfo'] = docinfo
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
626 return docinfo
20
9884703dae70 new modi
dwinter
parents: 0
diff changeset
627
9884703dae70 new modi
dwinter
parents: 0
diff changeset
628
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
629 def getPageinfo(self, current, start=None, rows=None, cols=None, docinfo=None, viewMode=None, tocMode=None):
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
630 """returns pageinfo with the given parameters"""
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
631 pageinfo = {}
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
632 current = getInt(current)
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
633 pageinfo['current'] = current
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
634 rows = int(rows or self.thumbrows)
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
635 pageinfo['rows'] = rows
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
636 cols = int(cols or self.thumbcols)
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
637 pageinfo['cols'] = cols
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
638 grpsize = cols * rows
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
639 pageinfo['groupsize'] = grpsize
61
f3d2f240692c fixed bug in calculation of group numbers
casties
parents: 59
diff changeset
640 start = getInt(start, default=(math.ceil(float(current)/float(grpsize))*grpsize-(grpsize-1)))
f3d2f240692c fixed bug in calculation of group numbers
casties
parents: 59
diff changeset
641 # int(current / grpsize) * grpsize +1))
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
642 pageinfo['start'] = start
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
643 pageinfo['end'] = start + grpsize
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
644 if (docinfo is not None) and ('numPages' in docinfo):
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
645 np = int(docinfo['numPages'])
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
646 pageinfo['end'] = min(pageinfo['end'], np)
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
647 pageinfo['numgroups'] = int(np / grpsize)
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
648 if np % grpsize > 0:
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
649 pageinfo['numgroups'] += 1
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
650
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
651 pageinfo['viewMode'] = viewMode
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
652 pageinfo['tocMode'] = tocMode
95
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
653 pageinfo['query'] = self.REQUEST.get('query',' ')
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
654 pageinfo['queryType'] = self.REQUEST.get('queryType',' ')
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
655 pageinfo['querySearch'] =self.REQUEST.get('querySearch', 'fulltext')
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
656 pageinfo['tocPageSize'] = self.REQUEST.get('tocPageSize', '30')
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
657 pageinfo['queryPageSize'] =self.REQUEST.get('queryPageSize', '20')
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
658 pageinfo['tocPN'] = self.REQUEST.get('tocPN', '1')
95
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
659 pageinfo['searchPN'] =self.REQUEST.get('searchPN','1')
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
660 pageinfo['sn'] =self.REQUEST.get('sn','1')
78
70ab234a18dc bugs in filepath mode fixes
dwinter
parents: 75
diff changeset
661
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
662 return pageinfo
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
663
95
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
664 def getSearch(self, pn=1, pageinfo=None, docinfo=None, query=None, queryType=None):
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
665 """get search list"""
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
666 docpath = docinfo['textURLPath']
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
667 pagesize = pageinfo['queryPageSize']
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
668 pn = pageinfo['searchPN']
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
669 sn = pageinfo['sn']
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
670 query =pageinfo['query']
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
671 queryType =pageinfo['queryType']
96
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
672 viewMode= pageinfo['viewMode']
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
673 tocMode = pageinfo['tocMode']
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
674 tocPN = pageinfo['tocPN']
95
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
675 pagexml=self.template.fulltextclient.eval("/mpdl/interface/doc-query.xql","document=%s&mode=%s&queryType=%s&query=%s&queryResultPageSize=%s&queryResultPN=%s&sn=%s"%(docpath, 'text', queryType, query, pagesize, pn, sn) ,outputUnicode=False)
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
676 pagedom = Parse(pagexml)
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
677 #pagedivs = pagedom.xpath("//div[@class='queryResultPage']")
96
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
678 selfurl = self.absolute_url()
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
679 page = pagexml.replace('page-fragment.xql?document=/echo/la/Benedetti_1585.xml','%s?url=/mpiwg/online/permanent/library/163127KK&viewMode=%s&tocMode=%s&tocPN=%s&query=%s&queryType=%s'%(selfurl, viewMode, tocMode, tocPN, query, queryType))
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
680 text =page.replace('mode=text','mode=texttool')
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
681 return text
95
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
682 #if len(pagedivs) > 0:
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
683 # pagenode = pagedom[0]
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
684 # return serializeNode(pagenode)
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
685 #else:
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
686 # return "xaxa"
0
dwinter
parents:
diff changeset
687
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
688 def getNumPages(self,docinfo=None):
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
689 """get list of pages from fulltext and put in docinfo"""
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
690 xquery = '//pb'
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
691 text = self.template.fulltextclient.eval("/mpdl/interface/xquery.xql", "document=%s&xquery=%s"%(docinfo['textURLPath'],xquery))
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
692 # TODO: better processing of the page list. do we need the info somewhere else also?
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
693 docinfo['numPages'] = text.count("<pb ")
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
694 return docinfo
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
695
96
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
696 def getTextPage(self, mode="text", pn=1, docinfo=None, pageinfo=None,):
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
697 """returns single page from fulltext"""
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
698 docpath = docinfo['textURLPath']
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
699 if mode == "text_dict":
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
700 textmode = "textPollux"
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
701 else:
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
702 textmode = mode
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
703
96
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
704 #selfurl = self.absolute_url()
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
705 #viewMode= pageinfo['viewMode']
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
706 #tocMode = pageinfo['tocMode']
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
707 #tocPN = pageinfo['tocPN']
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
708
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
709 pagexml=self.template.fulltextclient.eval("/mpdl/interface/page-fragment.xql", "document=%s&mode=%s&pn=%s"%(docpath,textmode,pn), outputUnicode=False)
95
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
710 #######
96
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
711 #page = pagexml.replace('page-fragment.xql?document=/echo/la/Benedetti_1585.xml','%s?url=/mpiwg/online/permanent/library/163127KK&viewMode=%s&tocMode=%s&tocPN=%s'%(selfurl, viewMode, tocMode, tocPN))
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
712 #text =page.replace('mode=text','mode=texttool')
95
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
713 #######
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
714 # post-processing downloaded xml
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
715 pagedom = Parse(pagexml)
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
716 # plain text mode
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
717 if mode == "text":
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
718 # first div contains text
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
719 pagedivs = pagedom.xpath("/div")
95
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
720 #queryResultPage
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
721 if len(pagedivs) > 0:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
722 pagenode = pagedivs[0]
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
723 return serializeNode(pagenode)
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
724
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
725 # text-with-links mode
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
726 if mode == "text_dict":
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
727 # first div contains text
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
728 pagedivs = pagedom.xpath("/div")
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
729 if len(pagedivs) > 0:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
730 pagenode = pagedivs[0]
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
731 # check all a-tags
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
732 links = pagenode.xpath("//a")
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
733 for l in links:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
734 hrefNode = l.getAttributeNodeNS(None, u"href")
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
735 if hrefNode:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
736 # is link with href
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
737 href = hrefNode.nodeValue
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
738 if href.startswith('lt/lex.xql'):
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
739 # is pollux link
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
740 selfurl = self.absolute_url()
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
741 # change href
96
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
742 hrefNode.nodeValue = href.replace('lt/lex.xql','%s/template/head_main_voc'%selfurl)
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
743 # add target
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
744 l.setAttributeNS(None, 'target', '_blank')
96
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
745
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
746 if href.startswith('lt/lemma.xql'):
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
747 selfurl = self.absolute_url()
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
748 hrefNode.nodeValue = href.replace('lt/lemma.xql','%s/template/head_main_lemma'%selfurl)
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
749 l.setAttributeNS(None, 'target', '_blank')
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
750 return serializeNode(pagenode)
0
dwinter
parents:
diff changeset
751
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
752 return "no text here"
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
753
96
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
754 def getTranslate(self, query=None, language=None):
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
755 """translate into another languages"""
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
756 pagexml=self.template.fulltextclient.eval("/mpdl/interface/lt/lex.xql","query=%s&language=%s"%(query,language),outputUnicode=False)
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
757 return pagexml
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
758
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
759 def getLemma(self):
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
760 """lemma"""
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
761 pagexml=self.template.fulltextclient.eval("/mpdl/interface/lt/lemma.xql","query=%s&language=%s"%(query,language),outputUnicode=False)
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
762 return pagexml
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
763
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
764 def getToc(self, mode="text", docinfo=None):
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
765 """loads table of contents and stores in docinfo"""
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
766 logging.debug("documentViewer (gettoc) mode: %s"%(mode))
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
767 if 'tocSize_%s'%mode in docinfo:
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
768 # cached toc
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
769 return docinfo
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
770
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
771 docpath = docinfo['textURLPath']
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
772 # we need to set a result set size
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
773 pagesize = 1000
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
774 pn = 1
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
775 if mode == "text":
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
776 queryType = "toc"
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
777 else:
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
778 queryType = mode
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
779 # number of entries in toc
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
780 tocSize = 0
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
781 tocDiv = None
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
782 pagexml=self.template.fulltextclient.eval("/mpdl/interface/doc-query.xql", "document=%s&queryType=%s&queryResultPageSize=%s&queryResultPN=%s"%(docpath,queryType,pagesize,pn), outputUnicode=False)
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
783 # post-processing downloaded xml
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
784 pagedom = Parse(pagexml)
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
785 # get number of entries
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
786 numdivs = pagedom.xpath("//div[@class='queryResultHits']")
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
787 if len(numdivs) > 0:
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
788 tocSize = int(getTextFromNode(numdivs[0]))
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
789 # div contains text
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
790 #pagedivs = pagedom.xpath("//div[@class='queryResultPage']")
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
791 #if len(pagedivs) > 0:
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
792 # tocDiv = pagedivs[0]
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
793
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
794 docinfo['tocSize_%s'%mode] = tocSize
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
795 #docinfo['tocDiv_%s'%mode] = tocDiv
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
796 return docinfo
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
797
95
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
798 def getTocPage(self, mode="text", pn=1, pageinfo=None, docinfo=None):
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
799 """returns single page from the table of contents"""
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
800 # TODO: this should use the cached TOC
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
801 if mode == "text":
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
802 queryType = "toc"
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
803 else:
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
804 queryType = mode
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
805 docpath = docinfo['textURLPath']
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
806 pagesize = pageinfo['tocPageSize']
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
807 pn = pageinfo['tocPN']
96
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
808
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
809 selfurl = self.absolute_url()
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
810 viewMode= pageinfo['viewMode']
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
811 tocMode = pageinfo['tocMode']
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
812 tocPN = pageinfo['tocPN']
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
813
95
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
814 pagexml=self.template.fulltextclient.eval("/mpdl/interface/doc-query.xql", "document=%s&queryType=%s&queryResultPageSize=%s&queryResultPN=%s"%(docpath,queryType, pagesize, pn), outputUnicode=False)
96
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
815 page = pagexml.replace('page-fragment.xql?document=/echo/la/Benedetti_1585.xml','%s?url=/mpiwg/online/permanent/library/163127KK&viewMode=%s&tocMode=%s&tocPN=%s'%(selfurl, viewMode, tocMode, tocPN))
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
816 text = page.replace('mode=image','mode=texttool')
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
817 return text
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
818 # post-processing downloaded xml
96
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
819 #pagedom = Parse(text)
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
820 # div contains text
96
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
821 #pagedivs = pagedom.xpath("//div[@class='queryResultPage']")
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
822 #if len(pagedivs) > 0:
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
823 # pagenode = pagedivs[0]
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
824 # return serializeNode(pagenode)
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
825 #else:
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
826 # return "No TOC!"
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
827
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
828
95
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
829 def changeDocumentViewer(self,title="",digilibBaseUrl=None,thumbrows=2,thumbcols=5,authgroups='mpiwg',RESPONSE=None):
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
830 """init document viewer"""
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
831 self.title=title
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
832 self.digilibBaseUrl = digilibBaseUrl
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
833 self.thumbrows = thumbrows
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
834 self.thumbcols = thumbcols
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
835 self.authgroups = [s.strip().lower() for s in authgroups.split(',')]
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
836 if RESPONSE is not None:
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
837 RESPONSE.redirect('manage_main')
0
dwinter
parents:
diff changeset
838
dwinter
parents:
diff changeset
839
dwinter
parents:
diff changeset
840
dwinter
parents:
diff changeset
841 def manage_AddDocumentViewerForm(self):
dwinter
parents:
diff changeset
842 """add the viewer form"""
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
843 pt=PageTemplateFile('zpt/addDocumentViewer', globals()).__of__(self)
0
dwinter
parents:
diff changeset
844 return pt()
dwinter
parents:
diff changeset
845
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
846 def manage_AddDocumentViewer(self,id,imageScalerUrl="",textServerName="",title="",RESPONSE=None):
0
dwinter
parents:
diff changeset
847 """add the viewer"""
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
848 newObj=documentViewer(id,imageScalerUrl=imageScalerUrl,title=title,textServerName=textServerName)
0
dwinter
parents:
diff changeset
849 self._setObject(id,newObj)
dwinter
parents:
diff changeset
850
dwinter
parents:
diff changeset
851 if RESPONSE is not None:
dwinter
parents:
diff changeset
852 RESPONSE.redirect('manage_main')
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
853
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
854
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
855 ##
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
856 ## DocumentViewerTemplate class
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
857 ##
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
858 class DocumentViewerTemplate(ZopePageTemplate):
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
859 """Template for document viewer"""
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
860 meta_type="DocumentViewer Template"
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
861
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
862
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
863 def manage_addDocumentViewerTemplateForm(self):
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
864 """Form for adding"""
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
865 pt=PageTemplateFile('zpt/addDocumentViewerTemplate', globals()).__of__(self)
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
866 return pt()
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
867
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
868 def manage_addDocumentViewerTemplate(self, id='viewer_main', title=None, text=None,
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
869 REQUEST=None, submit=None):
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
870 "Add a Page Template with optional file content."
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
871
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
872 self._setObject(id, DocumentViewerTemplate(id))
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
873 ob = getattr(self, id)
53
f4e0af8c281d NEW - # 44: ECHO - vollst?ndige bibliographische Angabe
dwinter
parents: 52
diff changeset
874 txt=file(os.path.join(package_home(globals()),'zpt/viewer_main.zpt'),'r').read()
f4e0af8c281d NEW - # 44: ECHO - vollst?ndige bibliographische Angabe
dwinter
parents: 52
diff changeset
875 logging.info("txt %s:"%txt)
f4e0af8c281d NEW - # 44: ECHO - vollst?ndige bibliographische Angabe
dwinter
parents: 52
diff changeset
876 ob.pt_edit(txt,"text/html")
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
877 if title:
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
878 ob.pt_setTitle(title)
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
879 try:
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
880 u = self.DestinationURL()
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
881 except AttributeError:
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
882 u = REQUEST['URL1']
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
883
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
884 u = "%s/%s" % (u, urllib.quote(id))
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
885 REQUEST.RESPONSE.redirect(u+'/manage_main')
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
886 return ''
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
887
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
888
41
0c8ee8fcfd76 some more logging
casties
parents: 40
diff changeset
889