annotate documentViewer.py @ 124:10d10e0db919

*** empty log message ***
author abukhman
date Tue, 01 Jun 2010 16:31:26 +0200
parents f1fc821f88a9
children c6dcf12e3807
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
46
31059e3d9338 has now also a text mode viewMode=text
dwinter
parents: 45
diff changeset
1
0
dwinter
parents:
diff changeset
2 from OFS.Folder import Folder
dwinter
parents:
diff changeset
3 from Products.PageTemplates.ZopePageTemplate import ZopePageTemplate
52
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
4 from Products.PageTemplates.PageTemplateFile import PageTemplateFile
101
a839579233c3 Update for all Books(not for only Benedetti)
abukhman
parents: 100
diff changeset
5 from Products.PythonScripts.standard import url_quote
0
dwinter
parents:
diff changeset
6 from AccessControl import ClassSecurityInfo
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
7 from AccessControl import getSecurityManager
0
dwinter
parents:
diff changeset
8 from Globals import package_home
dwinter
parents:
diff changeset
9
dwinter
parents:
diff changeset
10 from Ft.Xml.Domlette import NonvalidatingReader
dwinter
parents:
diff changeset
11 from Ft.Xml.Domlette import PrettyPrint, Print
38
025d3b6cba51 fixes by dirk
casties
parents: 37
diff changeset
12 from Ft.Xml import EMPTY_NAMESPACE, Parse
0
dwinter
parents:
diff changeset
13
97
2b8fd19432fb Last update
abukhman
parents: 96
diff changeset
14 from xml.dom.minidom import parse, parseString
2b8fd19432fb Last update
abukhman
parents: 96
diff changeset
15
2b8fd19432fb Last update
abukhman
parents: 96
diff changeset
16
83
ec12a2440daa My last update Bukhman Andrey
abukhman
parents: 82
diff changeset
17
0
dwinter
parents:
diff changeset
18 import Ft.Xml.XPath
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
19 import cStringIO
83
ec12a2440daa My last update Bukhman Andrey
abukhman
parents: 82
diff changeset
20 import xmlrpclib
0
dwinter
parents:
diff changeset
21 import os.path
31
c6451e8d5d23 more small fixes - now version 0.2.2
casties
parents: 29
diff changeset
22 import sys
0
dwinter
parents:
diff changeset
23 import cgi
dwinter
parents:
diff changeset
24 import urllib
50
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
25 import logging
61
f3d2f240692c fixed bug in calculation of group numbers
casties
parents: 59
diff changeset
26 import math
52
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
27
46
31059e3d9338 has now also a text mode viewMode=text
dwinter
parents: 45
diff changeset
28 import urlparse
75
9673218e155b minorCVS: ----------------------------------------------------------------------
dwinter
parents: 74
diff changeset
29 from types import *
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
30
52
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
31 def logger(txt,method,txt2):
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
32 """logging"""
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
33 logging.info(txt+ txt2)
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
34
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
35
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
36 def getInt(number, default=0):
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
37 """returns always an int (0 in case of problems)"""
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
38 try:
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
39 return int(number)
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
40 except:
62
8a16ea8db858 fixed bug in getInt
casties
parents: 61
diff changeset
41 return int(default)
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
42
0
dwinter
parents:
diff changeset
43 def getTextFromNode(nodename):
46
31059e3d9338 has now also a text mode viewMode=text
dwinter
parents: 45
diff changeset
44 """get the cdata content of a node"""
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
45 if nodename is None:
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
46 return ""
0
dwinter
parents:
diff changeset
47 nodelist=nodename.childNodes
dwinter
parents:
diff changeset
48 rc = ""
dwinter
parents:
diff changeset
49 for node in nodelist:
dwinter
parents:
diff changeset
50 if node.nodeType == node.TEXT_NODE:
dwinter
parents:
diff changeset
51 rc = rc + node.data
dwinter
parents:
diff changeset
52 return rc
dwinter
parents:
diff changeset
53
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
54 def serializeNode(node, encoding='utf-8'):
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
55 """returns a string containing node as XML"""
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
56 buf = cStringIO.StringIO()
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
57 Print(node, stream=buf, encoding=encoding)
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
58 s = buf.getvalue()
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
59 buf.close()
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
60 return s
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
61
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
62
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
63 def getParentDir(path):
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
64 """returns pathname shortened by one"""
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
65 return '/'.join(path.split('/')[0:-1])
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
66
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
67
0
dwinter
parents:
diff changeset
68 import socket
dwinter
parents:
diff changeset
69
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
70 def urlopen(url,timeout=2):
0
dwinter
parents:
diff changeset
71 """urlopen mit timeout"""
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
72 socket.setdefaulttimeout(timeout)
0
dwinter
parents:
diff changeset
73 ret=urllib.urlopen(url)
dwinter
parents:
diff changeset
74 socket.setdefaulttimeout(5)
dwinter
parents:
diff changeset
75 return ret
dwinter
parents:
diff changeset
76
dwinter
parents:
diff changeset
77
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
78 ##
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
79 ## documentViewer class
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
80 ##
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
81 class documentViewer(Folder):
0
dwinter
parents:
diff changeset
82 """document viewer"""
50
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
83 #textViewerUrl="http://127.0.0.1:8080/HFQP/testXSLT/getPage?"
46
31059e3d9338 has now also a text mode viewMode=text
dwinter
parents: 45
diff changeset
84
0
dwinter
parents:
diff changeset
85 meta_type="Document viewer"
dwinter
parents:
diff changeset
86
dwinter
parents:
diff changeset
87 security=ClassSecurityInfo()
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
88 manage_options=Folder.manage_options+(
0
dwinter
parents:
diff changeset
89 {'label':'main config','action':'changeDocumentViewerForm'},
dwinter
parents:
diff changeset
90 )
dwinter
parents:
diff changeset
91
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
92 # templates and forms
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
93 viewer_main = PageTemplateFile('zpt/viewer_main', globals())
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
94 toc_thumbs = PageTemplateFile('zpt/toc_thumbs', globals())
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
95 toc_text = PageTemplateFile('zpt/toc_text', globals())
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
96 toc_figures = PageTemplateFile('zpt/toc_figures', globals())
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
97 page_main_images = PageTemplateFile('zpt/page_main_images', globals())
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
98 page_main_text = PageTemplateFile('zpt/page_main_text', globals())
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
99 page_main_text_dict = PageTemplateFile('zpt/page_main_text_dict', globals())
99
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
100 page_main_xml = PageTemplateFile('zpt/page_main_xml', globals())
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
101 head_main = PageTemplateFile('zpt/head_main', globals())
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
102 docuviewer_css = PageTemplateFile('css/docuviewer.css', globals())
57
7cdb0fc34a92 added getInfo_xml method
casties
parents: 55
diff changeset
103 info_xml = PageTemplateFile('zpt/info_xml', globals())
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
104
68
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
105 thumbs_main_rss = PageTemplateFile('zpt/thumbs_main_rss', globals())
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
106 security.declareProtected('View management screens','changeDocumentViewerForm')
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
107 changeDocumentViewerForm = PageTemplateFile('zpt/changeDocumentViewer', globals())
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
108
0
dwinter
parents:
diff changeset
109
95
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
110 def __init__(self,id,imageScalerUrl=None,textServerName=None,title="",digilibBaseUrl=None,thumbcols=2,thumbrows=5,authgroups="mpiwg"):
0
dwinter
parents:
diff changeset
111 """init document viewer"""
dwinter
parents:
diff changeset
112 self.id=id
dwinter
parents:
diff changeset
113 self.title=title
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
114 self.thumbcols = thumbcols
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
115 self.thumbrows = thumbrows
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
116 # authgroups is list of authorized groups (delimited by ,)
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
117 self.authgroups = [s.strip().lower() for s in authgroups.split(',')]
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
118 # create template folder so we can always use template.something
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
119
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
120 templateFolder = Folder('template')
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
121 #self['template'] = templateFolder # Zope-2.12 style
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
122 self._setObject('template',templateFolder) # old style
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
123 try:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
124 from Products.XMLRpcTools.XMLRpcTools import XMLRpcServerProxy
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
125 xmlRpcClient = XMLRpcServerProxy(id='fulltextclient', serverUrl=textServerName, use_xmlrpc=False)
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
126 #templateFolder['fulltextclient'] = xmlRpcClient
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
127 templateFolder._setObject('fulltextclient',xmlRpcClient)
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
128 except Exception, e:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
129 logging.error("Unable to create XMLRpcTools for fulltextclient: "+str(e))
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
130 try:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
131 from Products.zogiLib.zogiLib import zogiLib
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
132 zogilib = zogiLib(id="zogilib", title="zogilib for docuviewer", dlServerURL=imageScalerUrl, layout="book")
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
133 #templateFolder['zogilib'] = zogilib
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
134 templateFolder._setObject('zogilib',zogilib)
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
135 except Exception, e:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
136 logging.error("Unable to create zogiLib for zogilib: "+str(e))
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
137
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
138
68
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
139 security.declareProtected('View','thumbs_rss')
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
140 def thumbs_rss(self,mode,url,viewMode="auto",start=None,pn=1):
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
141 '''
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
142 view it
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
143 @param mode: defines how to access the document behind url
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
144 @param url: url which contains display information
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
145 @param viewMode: if images display images, if text display text, default is images (text,images or auto)
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
146
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
147 '''
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
148 logging.debug("HHHHHHHHHHHHHH:load the rss")
68
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
149 logger("documentViewer (index)", logging.INFO, "mode: %s url:%s start:%s pn:%s"%(mode,url,start,pn))
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
150
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
151 if not hasattr(self, 'template'):
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
152 # create template folder if it doesn't exist
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
153 self.manage_addFolder('template')
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
154
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
155 if not self.digilibBaseUrl:
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
156 self.digilibBaseUrl = self.findDigilibUrl() or "http://nausikaa.mpiwg-berlin.mpg.de/digitallibrary"
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
157
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
158 docinfo = self.getDocinfo(mode=mode,url=url)
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
159 pageinfo = self.getPageinfo(start=start,current=pn,docinfo=docinfo)
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
160 pt = getattr(self.template, 'thumbs_main_rss')
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
161
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
162 if viewMode=="auto": # automodus gewaehlt
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
163 if docinfo.get("textURL",'') and self.textViewerUrl: #texturl gesetzt und textViewer konfiguriert
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
164 viewMode="text"
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
165 else:
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
166 viewMode="images"
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
167
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
168 return pt(docinfo=docinfo,pageinfo=pageinfo,viewMode=viewMode)
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
169
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
170 security.declareProtected('View','index_html')
95
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
171 def index_html(self,url,mode="texttool",viewMode="auto",tocMode="thumbs",start=None,pn=1,mk=None, query=None, querySearch=None):
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
172 '''
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
173 view it
57
7cdb0fc34a92 added getInfo_xml method
casties
parents: 55
diff changeset
174 @param mode: defines how to access the document behind url
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
175 @param url: url which contains display information
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
176 @param viewMode: if images display images, if text display text, default is auto (text,images or auto)
99
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
177 @param tocMode: type of 'table of contents' for navigation (thumbs, text, figures, none)
100
137459e3b378 Last update
abukhman
parents: 99
diff changeset
178 @param querySearch: type of different search modes (fulltext, fulltextMorph, xpath, xquery, ftIndex, ftIndexMorph, fulltextMorphLemma)
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
179 '''
0
dwinter
parents:
diff changeset
180
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
181 logging.debug("documentViewer (index) mode: %s url:%s start:%s pn:%s"%(mode,url,start,pn))
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
182
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
183 if not hasattr(self, 'template'):
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
184 # this won't work
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
185 logging.error("template folder missing!")
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
186 return "ERROR: template folder missing!"
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
187
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
188 if not getattr(self, 'digilibBaseUrl', None):
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
189 self.digilibBaseUrl = self.findDigilibUrl() or "http://nausikaa.mpiwg-berlin.mpg.de/digitallibrary"
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
190
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
191 docinfo = self.getDocinfo(mode=mode,url=url)
97
2b8fd19432fb Last update
abukhman
parents: 96
diff changeset
192
2b8fd19432fb Last update
abukhman
parents: 96
diff changeset
193
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
194 if tocMode != "thumbs":
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
195 # get table of contents
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
196 docinfo = self.getToc(mode=tocMode, docinfo=docinfo)
97
2b8fd19432fb Last update
abukhman
parents: 96
diff changeset
197
2b8fd19432fb Last update
abukhman
parents: 96
diff changeset
198 pageinfo = self.getPageinfo(start=start,current=pn,docinfo=docinfo,viewMode=viewMode,tocMode=tocMode)
2b8fd19432fb Last update
abukhman
parents: 96
diff changeset
199
51
c5d3aabbf61b textviewer now integrated, new modus auto introduced as standard for viewing
dwinter
parents: 50
diff changeset
200 if viewMode=="auto": # automodus gewaehlt
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
201 if docinfo.get("textURL",''): #texturl gesetzt und textViewer konfiguriert
51
c5d3aabbf61b textviewer now integrated, new modus auto introduced as standard for viewing
dwinter
parents: 50
diff changeset
202 viewMode="text"
c5d3aabbf61b textviewer now integrated, new modus auto introduced as standard for viewing
dwinter
parents: 50
diff changeset
203 else:
c5d3aabbf61b textviewer now integrated, new modus auto introduced as standard for viewing
dwinter
parents: 50
diff changeset
204 viewMode="images"
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
205
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
206 pt = getattr(self.template, 'viewer_main')
75
9673218e155b minorCVS: ----------------------------------------------------------------------
dwinter
parents: 74
diff changeset
207 return pt(docinfo=docinfo,pageinfo=pageinfo,viewMode=viewMode,mk=self.generateMarks(mk))
0
dwinter
parents:
diff changeset
208
74
dwinter
parents: 73
diff changeset
209 def generateMarks(self,mk):
dwinter
parents: 73
diff changeset
210 ret=""
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
211 if mk is None:
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
212 return ""
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
213 if type(mk) is not ListType:
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
214 mk=[mk]
74
dwinter
parents: 73
diff changeset
215 for m in mk:
75
9673218e155b minorCVS: ----------------------------------------------------------------------
dwinter
parents: 74
diff changeset
216 ret+="mk=%s"%m
74
dwinter
parents: 73
diff changeset
217 return ret
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
218
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
219
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
220 def findDigilibUrl(self):
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
221 """try to get the digilib URL from zogilib"""
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
222 url = self.template.zogilib.getDLBaseUrl()
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
223 return url
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
224
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
225 def getStyle(self, idx, selected, style=""):
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
226 """returns a string with the given style and append 'sel' if path == selected."""
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
227 #logger("documentViewer (getstyle)", logging.INFO, "idx: %s selected: %s style: %s"%(idx,selected,style))
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
228 if idx == selected:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
229 return style + 'sel'
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
230 else:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
231 return style
74
dwinter
parents: 73
diff changeset
232
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
233 def getLink(self,param=None,val=None):
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
234 """link to documentviewer with parameter param set to val"""
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
235 params=self.REQUEST.form.copy()
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
236 if param is not None:
31
c6451e8d5d23 more small fixes - now version 0.2.2
casties
parents: 29
diff changeset
237 if val is None:
c6451e8d5d23 more small fixes - now version 0.2.2
casties
parents: 29
diff changeset
238 if params.has_key(param):
c6451e8d5d23 more small fixes - now version 0.2.2
casties
parents: 29
diff changeset
239 del params[param]
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
240 else:
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
241 params[param] = str(val)
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
242
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
243 if params.get("mode", None) == "filepath": #wenn beim erst Aufruf filepath gesetzt wurde aendere das nun zu imagepath
78
70ab234a18dc bugs in filepath mode fixes
dwinter
parents: 75
diff changeset
244 params["mode"] = "imagepath"
70ab234a18dc bugs in filepath mode fixes
dwinter
parents: 75
diff changeset
245 params["url"] = getParentDir(params["url"])
31
c6451e8d5d23 more small fixes - now version 0.2.2
casties
parents: 29
diff changeset
246
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
247 # quote values and assemble into query string
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
248 ps = "&".join(["%s=%s"%(k,urllib.quote(v)) for (k, v) in params.items()])
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
249 url=self.REQUEST['URL1']+"?"+ps
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
250 return url
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
251
68
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
252 def getLinkAmp(self,param=None,val=None):
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
253 """link to documentviewer with parameter param set to val"""
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
254 params=self.REQUEST.form.copy()
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
255 if param is not None:
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
256 if val is None:
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
257 if params.has_key(param):
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
258 del params[param]
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
259 else:
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
260 params[param] = str(val)
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
261
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
262 # quote values and assemble into query string
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
263 logging.info("XYXXXXX: %s"%repr(params.items()))
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
264 ps = "&".join(["%s=%s"%(k,urllib.quote(v)) for (k, v) in params.items()])
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
265 url=self.REQUEST['URL1']+"?"+ps
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
266 return url
81
fae97f071724 fixed problem with info.xml when url without index.meta
casties
parents: 79
diff changeset
267
57
7cdb0fc34a92 added getInfo_xml method
casties
parents: 55
diff changeset
268 def getInfo_xml(self,url,mode):
7cdb0fc34a92 added getInfo_xml method
casties
parents: 55
diff changeset
269 """returns info about the document as XML"""
7cdb0fc34a92 added getInfo_xml method
casties
parents: 55
diff changeset
270
7cdb0fc34a92 added getInfo_xml method
casties
parents: 55
diff changeset
271 if not self.digilibBaseUrl:
7cdb0fc34a92 added getInfo_xml method
casties
parents: 55
diff changeset
272 self.digilibBaseUrl = self.findDigilibUrl() or "http://nausikaa.mpiwg-berlin.mpg.de/digitallibrary"
7cdb0fc34a92 added getInfo_xml method
casties
parents: 55
diff changeset
273
7cdb0fc34a92 added getInfo_xml method
casties
parents: 55
diff changeset
274 docinfo = self.getDocinfo(mode=mode,url=url)
7cdb0fc34a92 added getInfo_xml method
casties
parents: 55
diff changeset
275 pt = getattr(self.template, 'info_xml')
7cdb0fc34a92 added getInfo_xml method
casties
parents: 55
diff changeset
276 return pt(docinfo=docinfo)
7cdb0fc34a92 added getInfo_xml method
casties
parents: 55
diff changeset
277
0
dwinter
parents:
diff changeset
278
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
279 def isAccessible(self, docinfo):
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
280 """returns if access to the resource is granted"""
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
281 access = docinfo.get('accessType', None)
52
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
282 logger("documentViewer (accessOK)", logging.INFO, "access type %s"%access)
45
0391fe75aef3 fixed handling of documents with missing access tag
casties
parents: 43
diff changeset
283 if access is not None and access == 'free':
52
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
284 logger("documentViewer (accessOK)", logging.INFO, "access is free")
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
285 return True
45
0391fe75aef3 fixed handling of documents with missing access tag
casties
parents: 43
diff changeset
286 elif access is None or access in self.authgroups:
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
287 # only local access -- only logged in users
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
288 user = getSecurityManager().getUser()
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
289 if user is not None:
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
290 #print "user: ", user
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
291 return (user.getUserName() != "Anonymous User")
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
292 else:
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
293 return False
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
294
52
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
295 logger("documentViewer (accessOK)", logging.INFO, "unknown access type %s"%access)
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
296 return False
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
297
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
298
73
dwinter
parents: 71
diff changeset
299 def getDirinfoFromDigilib(self,path,docinfo=None,cut=0):
29
e1bed068b351 small fixes
casties
parents: 28
diff changeset
300 """gibt param von dlInfo aus"""
40
749ee5389892 try to ignore superfluous /mpiwg/online in urls
casties
parents: 39
diff changeset
301 num_retries = 3
31
c6451e8d5d23 more small fixes - now version 0.2.2
casties
parents: 29
diff changeset
302 if docinfo is None:
c6451e8d5d23 more small fixes - now version 0.2.2
casties
parents: 29
diff changeset
303 docinfo = {}
73
dwinter
parents: 71
diff changeset
304
dwinter
parents: 71
diff changeset
305 for x in range(cut):
78
70ab234a18dc bugs in filepath mode fixes
dwinter
parents: 75
diff changeset
306
73
dwinter
parents: 71
diff changeset
307 path=getParentDir(path)
78
70ab234a18dc bugs in filepath mode fixes
dwinter
parents: 75
diff changeset
308
40
749ee5389892 try to ignore superfluous /mpiwg/online in urls
casties
parents: 39
diff changeset
309 infoUrl=self.digilibBaseUrl+"/dirInfo-xml.jsp?mo=dir&fn="+path
29
e1bed068b351 small fixes
casties
parents: 28
diff changeset
310
52
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
311 logger("documentViewer (getparamfromdigilib)", logging.INFO, "dirInfo from %s"%(infoUrl))
29
e1bed068b351 small fixes
casties
parents: 28
diff changeset
312
40
749ee5389892 try to ignore superfluous /mpiwg/online in urls
casties
parents: 39
diff changeset
313 for cnt in range(num_retries):
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
314 try:
40
749ee5389892 try to ignore superfluous /mpiwg/online in urls
casties
parents: 39
diff changeset
315 # dom = NonvalidatingReader.parseUri(imageUrl)
749ee5389892 try to ignore superfluous /mpiwg/online in urls
casties
parents: 39
diff changeset
316 txt=urllib.urlopen(infoUrl).read()
749ee5389892 try to ignore superfluous /mpiwg/online in urls
casties
parents: 39
diff changeset
317 dom = Parse(txt)
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
318 break
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
319 except:
52
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
320 logger("documentViewer (getdirinfofromdigilib)", logging.ERROR, "error reading %s (try %d)"%(infoUrl,cnt))
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
321 else:
40
749ee5389892 try to ignore superfluous /mpiwg/online in urls
casties
parents: 39
diff changeset
322 raise IOError("Unable to get dir-info from %s"%(infoUrl))
29
e1bed068b351 small fixes
casties
parents: 28
diff changeset
323
37
ead830ce45d6 better error messages
casties
parents: 35
diff changeset
324 sizes=dom.xpath("//dir/size")
52
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
325 logger("documentViewer (getparamfromdigilib)", logging.INFO, "dirInfo:size"%sizes)
29
e1bed068b351 small fixes
casties
parents: 28
diff changeset
326
37
ead830ce45d6 better error messages
casties
parents: 35
diff changeset
327 if sizes:
ead830ce45d6 better error messages
casties
parents: 35
diff changeset
328 docinfo['numPages'] = int(getTextFromNode(sizes[0]))
31
c6451e8d5d23 more small fixes - now version 0.2.2
casties
parents: 29
diff changeset
329 else:
c6451e8d5d23 more small fixes - now version 0.2.2
casties
parents: 29
diff changeset
330 docinfo['numPages'] = 0
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
331
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
332 # TODO: produce and keep list of image names and numbers
31
c6451e8d5d23 more small fixes - now version 0.2.2
casties
parents: 29
diff changeset
333
c6451e8d5d23 more small fixes - now version 0.2.2
casties
parents: 29
diff changeset
334 return docinfo
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
335
29
e1bed068b351 small fixes
casties
parents: 28
diff changeset
336
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
337 def getIndexMeta(self, url):
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
338 """returns dom of index.meta document at url"""
39
1dd90aabd366 added retry when reading index meta from texter applet
casties
parents: 38
diff changeset
339 num_retries = 3
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
340 dom = None
39
1dd90aabd366 added retry when reading index meta from texter applet
casties
parents: 38
diff changeset
341 metaUrl = None
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
342 if url.startswith("http://"):
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
343 # real URL
39
1dd90aabd366 added retry when reading index meta from texter applet
casties
parents: 38
diff changeset
344 metaUrl = url
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
345 else:
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
346 # online path
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
347 server=self.digilibBaseUrl+"/servlet/Texter?fn="
40
749ee5389892 try to ignore superfluous /mpiwg/online in urls
casties
parents: 39
diff changeset
348 metaUrl=server+url.replace("/mpiwg/online","")
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
349 if not metaUrl.endswith("index.meta"):
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
350 metaUrl += "/index.meta"
75
9673218e155b minorCVS: ----------------------------------------------------------------------
dwinter
parents: 74
diff changeset
351 logging.debug("METAURL: %s"%metaUrl)
40
749ee5389892 try to ignore superfluous /mpiwg/online in urls
casties
parents: 39
diff changeset
352 for cnt in range(num_retries):
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
353 try:
39
1dd90aabd366 added retry when reading index meta from texter applet
casties
parents: 38
diff changeset
354 # patch dirk encoding fehler treten dann nicht mehr auf
38
025d3b6cba51 fixes by dirk
casties
parents: 37
diff changeset
355 # dom = NonvalidatingReader.parseUri(metaUrl)
39
1dd90aabd366 added retry when reading index meta from texter applet
casties
parents: 38
diff changeset
356 txt=urllib.urlopen(metaUrl).read()
1dd90aabd366 added retry when reading index meta from texter applet
casties
parents: 38
diff changeset
357 dom = Parse(txt)
40
749ee5389892 try to ignore superfluous /mpiwg/online in urls
casties
parents: 39
diff changeset
358 break
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
359 except:
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
360 logger("ERROR documentViewer (getIndexMeta)", logging.INFO,"%s (%s)"%sys.exc_info()[0:2])
39
1dd90aabd366 added retry when reading index meta from texter applet
casties
parents: 38
diff changeset
361
1dd90aabd366 added retry when reading index meta from texter applet
casties
parents: 38
diff changeset
362 if dom is None:
1dd90aabd366 added retry when reading index meta from texter applet
casties
parents: 38
diff changeset
363 raise IOError("Unable to read index meta from %s"%(url))
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
364
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
365 return dom
50
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
366
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
367 def getPresentationInfoXML(self, url):
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
368 """returns dom of info.xml document at url"""
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
369 num_retries = 3
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
370 dom = None
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
371 metaUrl = None
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
372 if url.startswith("http://"):
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
373 # real URL
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
374 metaUrl = url
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
375 else:
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
376 # online path
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
377 server=self.digilibBaseUrl+"/servlet/Texter?fn="
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
378 metaUrl=server+url.replace("/mpiwg/online","")
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
379
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
380 for cnt in range(num_retries):
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
381 try:
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
382 # patch dirk encoding fehler treten dann nicht mehr auf
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
383 # dom = NonvalidatingReader.parseUri(metaUrl)
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
384 txt=urllib.urlopen(metaUrl).read()
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
385 dom = Parse(txt)
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
386 break
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
387 except:
52
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
388 logger("ERROR documentViewer (getPresentationInfoXML)", logging.INFO,"%s (%s)"%sys.exc_info()[0:2])
50
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
389
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
390 if dom is None:
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
391 raise IOError("Unable to read infoXMLfrom %s"%(url))
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
392
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
393 return dom
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
394
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
395
70
0049d64aa464 filepath introduced
dwinter
parents: 68
diff changeset
396 def getAuthinfoFromIndexMeta(self,path,docinfo=None,dom=None,cut=0):
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
397 """gets authorization info from the index.meta file at path or given by dom"""
52
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
398 logger("documentViewer (getauthinfofromindexmeta)", logging.INFO,"path: %s"%(path))
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
399
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
400 access = None
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
401
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
402 if docinfo is None:
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
403 docinfo = {}
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
404
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
405 if dom is None:
78
70ab234a18dc bugs in filepath mode fixes
dwinter
parents: 75
diff changeset
406 for x in range(cut):
70
0049d64aa464 filepath introduced
dwinter
parents: 68
diff changeset
407 path=getParentDir(path)
0049d64aa464 filepath introduced
dwinter
parents: 68
diff changeset
408 dom = self.getIndexMeta(path)
46
31059e3d9338 has now also a text mode viewMode=text
dwinter
parents: 45
diff changeset
409
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
410 acctype = dom.xpath("//access-conditions/access/@type")
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
411 if acctype and (len(acctype)>0):
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
412 access=acctype[0].value
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
413 if access in ['group', 'institution']:
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
414 access = getTextFromNode(dom.xpath("//access-conditions/access/name")[0]).lower()
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
415
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
416 docinfo['accessType'] = access
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
417 return docinfo
29
e1bed068b351 small fixes
casties
parents: 28
diff changeset
418
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
419
70
0049d64aa464 filepath introduced
dwinter
parents: 68
diff changeset
420 def getBibinfoFromIndexMeta(self,path,docinfo=None,dom=None,cut=0):
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
421 """gets bibliographical info from the index.meta file at path or given by dom"""
59
996b61d71351 added all fields from bib tag to docinfo
casties
parents: 57
diff changeset
422 logging.debug("documentViewer (getbibinfofromindexmeta) path: %s"%(path))
20
9884703dae70 new modi
dwinter
parents: 0
diff changeset
423
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
424 if docinfo is None:
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
425 docinfo = {}
78
70ab234a18dc bugs in filepath mode fixes
dwinter
parents: 75
diff changeset
426
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
427 if dom is None:
78
70ab234a18dc bugs in filepath mode fixes
dwinter
parents: 75
diff changeset
428 for x in range(cut):
70
0049d64aa464 filepath introduced
dwinter
parents: 68
diff changeset
429 path=getParentDir(path)
0049d64aa464 filepath introduced
dwinter
parents: 68
diff changeset
430 dom = self.getIndexMeta(path)
79
df6952ac93e9 bug in getDocInforFromImagePath, relative lage der index.meta zu path war falsch.
dwinter
parents: 78
diff changeset
431
df6952ac93e9 bug in getDocInforFromImagePath, relative lage der index.meta zu path war falsch.
dwinter
parents: 78
diff changeset
432 logging.debug("documentViewer (getbibinfofromindexmeta cutted) path: %s"%(path))
59
996b61d71351 added all fields from bib tag to docinfo
casties
parents: 57
diff changeset
433 # put in all raw bib fields as dict "bib"
996b61d71351 added all fields from bib tag to docinfo
casties
parents: 57
diff changeset
434 bib = dom.xpath("//bib/*")
996b61d71351 added all fields from bib tag to docinfo
casties
parents: 57
diff changeset
435 if bib and len(bib)>0:
996b61d71351 added all fields from bib tag to docinfo
casties
parents: 57
diff changeset
436 bibinfo = {}
996b61d71351 added all fields from bib tag to docinfo
casties
parents: 57
diff changeset
437 for e in bib:
996b61d71351 added all fields from bib tag to docinfo
casties
parents: 57
diff changeset
438 bibinfo[e.localName] = getTextFromNode(e)
996b61d71351 added all fields from bib tag to docinfo
casties
parents: 57
diff changeset
439 docinfo['bib'] = bibinfo
996b61d71351 added all fields from bib tag to docinfo
casties
parents: 57
diff changeset
440
996b61d71351 added all fields from bib tag to docinfo
casties
parents: 57
diff changeset
441 # extract some fields (author, title, year) according to their mapping
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
442 metaData=self.metadata.main.meta.bib
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
443 bibtype=dom.xpath("//bib/@type")
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
444 if bibtype and (len(bibtype)>0):
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
445 bibtype=bibtype[0].value
20
9884703dae70 new modi
dwinter
parents: 0
diff changeset
446 else:
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
447 bibtype="generic"
59
996b61d71351 added all fields from bib tag to docinfo
casties
parents: 57
diff changeset
448
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
449 bibtype=bibtype.replace("-"," ") # wrong typesiin index meta "-" instead of " " (not wrong! ROC)
59
996b61d71351 added all fields from bib tag to docinfo
casties
parents: 57
diff changeset
450 docinfo['bib_type'] = bibtype
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
451 bibmap=metaData.generateMappingForType(bibtype)
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
452 # if there is no mapping bibmap is empty (mapping sometimes has empty fields)
31
c6451e8d5d23 more small fixes - now version 0.2.2
casties
parents: 29
diff changeset
453 if len(bibmap) > 0 and len(bibmap['author'][0]) > 0:
63
4a17b755bfc7 added more try/excepts to bib-meta reading code
casties
parents: 62
diff changeset
454 try:
4a17b755bfc7 added more try/excepts to bib-meta reading code
casties
parents: 62
diff changeset
455 docinfo['author']=getTextFromNode(dom.xpath("//bib/%s"%bibmap['author'][0])[0])
4a17b755bfc7 added more try/excepts to bib-meta reading code
casties
parents: 62
diff changeset
456 except: pass
4a17b755bfc7 added more try/excepts to bib-meta reading code
casties
parents: 62
diff changeset
457 try:
4a17b755bfc7 added more try/excepts to bib-meta reading code
casties
parents: 62
diff changeset
458 docinfo['title']=getTextFromNode(dom.xpath("//bib/%s"%bibmap['title'][0])[0])
4a17b755bfc7 added more try/excepts to bib-meta reading code
casties
parents: 62
diff changeset
459 except: pass
4a17b755bfc7 added more try/excepts to bib-meta reading code
casties
parents: 62
diff changeset
460 try:
4a17b755bfc7 added more try/excepts to bib-meta reading code
casties
parents: 62
diff changeset
461 docinfo['year']=getTextFromNode(dom.xpath("//bib/%s"%bibmap['year'][0])[0])
4a17b755bfc7 added more try/excepts to bib-meta reading code
casties
parents: 62
diff changeset
462 except: pass
59
996b61d71351 added all fields from bib tag to docinfo
casties
parents: 57
diff changeset
463 logging.debug("documentViewer (getbibinfofromindexmeta) using mapping for %s"%bibtype)
52
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
464 try:
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
465 docinfo['lang']=getTextFromNode(dom.xpath("//bib/lang")[0])
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
466 except:
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
467 docinfo['lang']=''
59
996b61d71351 added all fields from bib tag to docinfo
casties
parents: 57
diff changeset
468
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
469 return docinfo
83
ec12a2440daa My last update Bukhman Andrey
abukhman
parents: 82
diff changeset
470
ec12a2440daa My last update Bukhman Andrey
abukhman
parents: 82
diff changeset
471
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
472 def getDocinfoFromTextTool(self, url, dom=None, docinfo=None):
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
473 """parse texttool tag in index meta"""
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
474 logger("documentViewer (getdocinfofromtexttool)", logging.INFO, "url: %s" % (url))
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
475 if docinfo is None:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
476 docinfo = {}
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
477 if docinfo.get('lang', None) is None:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
478 docinfo['lang'] = '' # default keine Sprache gesetzt
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
479 if dom is None:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
480 dom = self.getIndexMeta(url)
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
481
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
482 archivePath = None
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
483 archiveName = None
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
484
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
485 archiveNames = dom.xpath("//resource/name")
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
486 if archiveNames and (len(archiveNames) > 0):
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
487 archiveName = getTextFromNode(archiveNames[0])
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
488 else:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
489 logger("documentViewer (getdocinfofromtexttool)", logging.WARNING, "resource/name missing in: %s" % (url))
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
490
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
491 archivePaths = dom.xpath("//resource/archive-path")
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
492 if archivePaths and (len(archivePaths) > 0):
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
493 archivePath = getTextFromNode(archivePaths[0])
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
494 # clean up archive path
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
495 if archivePath[0] != '/':
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
496 archivePath = '/' + archivePath
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
497 if archiveName and (not archivePath.endswith(archiveName)):
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
498 archivePath += "/" + archiveName
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
499 else:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
500 # try to get archive-path from url
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
501 logger("documentViewer (getdocinfofromtexttool)", logging.WARNING, "resource/archive-path missing in: %s" % (url))
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
502 if (not url.startswith('http')):
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
503 archivePath = url.replace('index.meta', '')
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
504
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
505 if archivePath is None:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
506 # we balk without archive-path
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
507 raise IOError("Missing archive-path (for text-tool) in %s" % (url))
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
508
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
509 imageDirs = dom.xpath("//texttool/image")
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
510 if imageDirs and (len(imageDirs) > 0):
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
511 imageDir = getTextFromNode(imageDirs[0])
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
512
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
513 else:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
514 # we balk with no image tag / not necessary anymore because textmode is now standard
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
515 #raise IOError("No text-tool info in %s"%(url))
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
516 imageDir = ""
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
517 #xquery="//pb"
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
518 docinfo['imagePath'] = "" # keine Bilder
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
519 docinfo['imageURL'] = ""
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
520
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
521 if imageDir and archivePath:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
522 #print "image: ", imageDir, " archivepath: ", archivePath
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
523 imageDir = os.path.join(archivePath, imageDir)
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
524 imageDir = imageDir.replace("/mpiwg/online", '')
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
525 docinfo = self.getDirinfoFromDigilib(imageDir, docinfo=docinfo)
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
526 docinfo['imagePath'] = imageDir
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
527
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
528 docinfo['imageURL'] = self.digilibBaseUrl + "/servlet/Scaler?fn=" + imageDir
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
529
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
530 viewerUrls = dom.xpath("//texttool/digiliburlprefix")
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
531 if viewerUrls and (len(viewerUrls) > 0):
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
532 viewerUrl = getTextFromNode(viewerUrls[0])
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
533 docinfo['viewerURL'] = viewerUrl
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
534
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
535 textUrls = dom.xpath("//texttool/text")
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
536 if textUrls and (len(textUrls) > 0):
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
537 textUrl = getTextFromNode(textUrls[0])
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
538 if urlparse.urlparse(textUrl)[0] == "": #keine url
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
539 textUrl = os.path.join(archivePath, textUrl)
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
540 # fix URLs starting with /mpiwg/online
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
541 if textUrl.startswith("/mpiwg/online"):
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
542 textUrl = textUrl.replace("/mpiwg/online", '', 1)
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
543
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
544 docinfo['textURL'] = textUrl
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
545
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
546 textUrls = dom.xpath("//texttool/text-url-path")
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
547 if textUrls and (len(textUrls) > 0):
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
548 textUrl = getTextFromNode(textUrls[0])
102
27513c893ba9 trying to fix text-only documents
casties
parents: 101
diff changeset
549 docinfo['textURLPath'] = textUrl
27513c893ba9 trying to fix text-only documents
casties
parents: 101
diff changeset
550 if not docinfo['imagePath']:
27513c893ba9 trying to fix text-only documents
casties
parents: 101
diff changeset
551 # text-only, no page images
27513c893ba9 trying to fix text-only documents
casties
parents: 101
diff changeset
552 docinfo = self.getNumPages(docinfo) #im moment einfach auf eins setzen, navigation ueber die thumbs geht natuerlich nicht
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
553
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
554 presentationUrls = dom.xpath("//texttool/presentation")
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
555 docinfo = self.getBibinfoFromIndexMeta(url, docinfo=docinfo, dom=dom) # get info von bib tag
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
556
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
557 if presentationUrls and (len(presentationUrls) > 0): # ueberschreibe diese durch presentation informationen
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
558 # presentation url ergiebt sich ersetzen von index.meta in der url der fuer die Metadaten
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
559 # durch den relativen Pfad auf die presentation infos
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
560 presentationPath = getTextFromNode(presentationUrls[0])
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
561 if url.endswith("index.meta"):
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
562 presentationUrl = url.replace('index.meta', presentationPath)
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
563 else:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
564 presentationUrl = url + "/" + presentationPath
102
27513c893ba9 trying to fix text-only documents
casties
parents: 101
diff changeset
565
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
566 docinfo = self.getBibinfoFromTextToolPresentation(presentationUrl, docinfo=docinfo, dom=dom)
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
567
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
568 docinfo = self.getAuthinfoFromIndexMeta(url, docinfo=docinfo, dom=dom) # get access info
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
569
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
570 return docinfo
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
571
50
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
572
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
573 def getBibinfoFromTextToolPresentation(self,url,docinfo=None,dom=None):
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
574 """gets the bibliographical information from the preseantion entry in texttools
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
575 """
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
576 dom=self.getPresentationInfoXML(url)
62
8a16ea8db858 fixed bug in getInt
casties
parents: 61
diff changeset
577 try:
8a16ea8db858 fixed bug in getInt
casties
parents: 61
diff changeset
578 docinfo['author']=getTextFromNode(dom.xpath("//author")[0])
8a16ea8db858 fixed bug in getInt
casties
parents: 61
diff changeset
579 except:
8a16ea8db858 fixed bug in getInt
casties
parents: 61
diff changeset
580 pass
8a16ea8db858 fixed bug in getInt
casties
parents: 61
diff changeset
581 try:
8a16ea8db858 fixed bug in getInt
casties
parents: 61
diff changeset
582 docinfo['title']=getTextFromNode(dom.xpath("//title")[0])
8a16ea8db858 fixed bug in getInt
casties
parents: 61
diff changeset
583 except:
8a16ea8db858 fixed bug in getInt
casties
parents: 61
diff changeset
584 pass
8a16ea8db858 fixed bug in getInt
casties
parents: 61
diff changeset
585 try:
8a16ea8db858 fixed bug in getInt
casties
parents: 61
diff changeset
586 docinfo['year']=getTextFromNode(dom.xpath("//date")[0])
8a16ea8db858 fixed bug in getInt
casties
parents: 61
diff changeset
587 except:
8a16ea8db858 fixed bug in getInt
casties
parents: 61
diff changeset
588 pass
50
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
589 return docinfo
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
590
70
0049d64aa464 filepath introduced
dwinter
parents: 68
diff changeset
591 def getDocinfoFromImagePath(self,path,docinfo=None,cut=0):
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
592 """path ist the path to the images it assumes that the index.meta file is one level higher."""
52
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
593 logger("documentViewer (getdocinfofromimagepath)", logging.INFO,"path: %s"%(path))
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
594 if docinfo is None:
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
595 docinfo = {}
29
e1bed068b351 small fixes
casties
parents: 28
diff changeset
596 path=path.replace("/mpiwg/online","")
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
597 docinfo['imagePath'] = path
73
dwinter
parents: 71
diff changeset
598 docinfo=self.getDirinfoFromDigilib(path,docinfo=docinfo,cut=cut)
78
70ab234a18dc bugs in filepath mode fixes
dwinter
parents: 75
diff changeset
599
79
df6952ac93e9 bug in getDocInforFromImagePath, relative lage der index.meta zu path war falsch.
dwinter
parents: 78
diff changeset
600 pathorig=path
78
70ab234a18dc bugs in filepath mode fixes
dwinter
parents: 75
diff changeset
601 for x in range(cut):
70ab234a18dc bugs in filepath mode fixes
dwinter
parents: 75
diff changeset
602 path=getParentDir(path)
70ab234a18dc bugs in filepath mode fixes
dwinter
parents: 75
diff changeset
603 logging.error("PATH:"+path)
31
c6451e8d5d23 more small fixes - now version 0.2.2
casties
parents: 29
diff changeset
604 imageUrl=self.digilibBaseUrl+"/servlet/Scaler?fn="+path
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
605 docinfo['imageURL'] = imageUrl
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
606
79
df6952ac93e9 bug in getDocInforFromImagePath, relative lage der index.meta zu path war falsch.
dwinter
parents: 78
diff changeset
607 #path ist the path to the images it assumes that the index.meta file is one level higher.
df6952ac93e9 bug in getDocInforFromImagePath, relative lage der index.meta zu path war falsch.
dwinter
parents: 78
diff changeset
608 docinfo = self.getBibinfoFromIndexMeta(pathorig,docinfo=docinfo,cut=cut+1)
df6952ac93e9 bug in getDocInforFromImagePath, relative lage der index.meta zu path war falsch.
dwinter
parents: 78
diff changeset
609 docinfo = self.getAuthinfoFromIndexMeta(pathorig,docinfo=docinfo,cut=cut+1)
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
610 return docinfo
20
9884703dae70 new modi
dwinter
parents: 0
diff changeset
611
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
612
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
613 def getDocinfo(self, mode, url):
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
614 """returns docinfo depending on mode"""
52
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
615 logger("documentViewer (getdocinfo)", logging.INFO,"mode: %s, url: %s"%(mode,url))
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
616 # look for cached docinfo in session
51
c5d3aabbf61b textviewer now integrated, new modus auto introduced as standard for viewing
dwinter
parents: 50
diff changeset
617 if self.REQUEST.SESSION.has_key('docinfo'):
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
618 docinfo = self.REQUEST.SESSION['docinfo']
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
619 # check if its still current
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
620 if docinfo is not None and docinfo.get('mode') == mode and docinfo.get('url') == url:
52
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
621 logger("documentViewer (getdocinfo)", logging.INFO,"docinfo in session: %s"%docinfo)
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
622 return docinfo
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
623 # new docinfo
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
624 docinfo = {'mode': mode, 'url': url}
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
625 if mode=="texttool": #index.meta with texttool information
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
626 docinfo = self.getDocinfoFromTextTool(url, docinfo=docinfo)
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
627 elif mode=="imagepath":
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
628 docinfo = self.getDocinfoFromImagePath(url, docinfo=docinfo)
70
0049d64aa464 filepath introduced
dwinter
parents: 68
diff changeset
629 elif mode=="filepath":
75
9673218e155b minorCVS: ----------------------------------------------------------------------
dwinter
parents: 74
diff changeset
630 docinfo = self.getDocinfoFromImagePath(url, docinfo=docinfo,cut=1)
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
631 else:
52
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
632 logger("documentViewer (getdocinfo)", logging.ERROR,"unknown mode!")
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
633 raise ValueError("Unknown mode %s! Has to be one of 'texttool','imagepath','filepath'."%(mode))
37
ead830ce45d6 better error messages
casties
parents: 35
diff changeset
634
52
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
635 logger("documentViewer (getdocinfo)", logging.INFO,"docinfo: %s"%docinfo)
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
636 self.REQUEST.SESSION['docinfo'] = docinfo
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
637 return docinfo
20
9884703dae70 new modi
dwinter
parents: 0
diff changeset
638
9884703dae70 new modi
dwinter
parents: 0
diff changeset
639
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
640 def getPageinfo(self, current, start=None, rows=None, cols=None, docinfo=None, viewMode=None, tocMode=None):
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
641 """returns pageinfo with the given parameters"""
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
642 pageinfo = {}
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
643 current = getInt(current)
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
644 pageinfo['current'] = current
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
645 rows = int(rows or self.thumbrows)
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
646 pageinfo['rows'] = rows
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
647 cols = int(cols or self.thumbcols)
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
648 pageinfo['cols'] = cols
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
649 grpsize = cols * rows
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
650 pageinfo['groupsize'] = grpsize
61
f3d2f240692c fixed bug in calculation of group numbers
casties
parents: 59
diff changeset
651 start = getInt(start, default=(math.ceil(float(current)/float(grpsize))*grpsize-(grpsize-1)))
f3d2f240692c fixed bug in calculation of group numbers
casties
parents: 59
diff changeset
652 # int(current / grpsize) * grpsize +1))
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
653 pageinfo['start'] = start
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
654 pageinfo['end'] = start + grpsize
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
655 if (docinfo is not None) and ('numPages' in docinfo):
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
656 np = int(docinfo['numPages'])
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
657 pageinfo['end'] = min(pageinfo['end'], np)
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
658 pageinfo['numgroups'] = int(np / grpsize)
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
659 if np % grpsize > 0:
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
660 pageinfo['numgroups'] += 1
99
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
661
112
d48c1d507556 *** empty log message ***
abukhman
parents: 109
diff changeset
662
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
663 pageinfo['viewMode'] = viewMode
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
664 pageinfo['tocMode'] = tocMode
95
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
665 pageinfo['query'] = self.REQUEST.get('query',' ')
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
666 pageinfo['queryType'] = self.REQUEST.get('queryType',' ')
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
667 pageinfo['querySearch'] =self.REQUEST.get('querySearch', 'fulltext')
99
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
668 pageinfo['textPN'] = self.REQUEST.get('textPN','1')
106
9f11913bc132 *** empty log message ***
abukhman
parents: 105
diff changeset
669 pageinfo['highlightQuery'] = self.REQUEST.get('highlightQuery','')
95
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
670 pageinfo['tocPageSize'] = self.REQUEST.get('tocPageSize', '30')
105
6bffb612cd6a *** empty log message ***
abukhman
parents: 104
diff changeset
671 pageinfo['queryPageSize'] =self.REQUEST.get('queryPageSize', '10')
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
672 pageinfo['tocPN'] = self.REQUEST.get('tocPN', '1')
99
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
673 toc = int (pageinfo['tocPN'])
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
674 pageinfo['textPages'] =int (toc)
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
675
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
676 if 'tocSize_%s'%tocMode in docinfo:
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
677 tocSize = int(docinfo['tocSize_%s'%tocMode])
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
678 tocPageSize = int(pageinfo['tocPageSize'])
97
2b8fd19432fb Last update
abukhman
parents: 96
diff changeset
679 # cached toc
99
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
680
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
681 if tocSize%tocPageSize>0:
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
682 tocPages=tocSize/tocPageSize+1
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
683 else:
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
684 tocPages=tocSize/tocPageSize
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
685 pageinfo['tocPN'] = min (tocPages,toc)
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
686
95
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
687 pageinfo['searchPN'] =self.REQUEST.get('searchPN','1')
112
d48c1d507556 *** empty log message ***
abukhman
parents: 109
diff changeset
688 pageinfo['sn'] =self.REQUEST.get('sn','')
78
70ab234a18dc bugs in filepath mode fixes
dwinter
parents: 75
diff changeset
689
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
690 return pageinfo
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
691
95
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
692 def getSearch(self, pn=1, pageinfo=None, docinfo=None, query=None, queryType=None):
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
693 """get search list"""
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
694 docpath = docinfo['textURLPath']
101
a839579233c3 Update for all Books(not for only Benedetti)
abukhman
parents: 100
diff changeset
695 url = docinfo['url']
a839579233c3 Update for all Books(not for only Benedetti)
abukhman
parents: 100
diff changeset
696 logging.debug("documentViewer (gettoc) docpath: %s"%(docpath))
a839579233c3 Update for all Books(not for only Benedetti)
abukhman
parents: 100
diff changeset
697 logging.debug("documentViewer (gettoc) url: %s"%(url))
95
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
698 pagesize = pageinfo['queryPageSize']
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
699 pn = pageinfo['searchPN']
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
700 sn = pageinfo['sn']
106
9f11913bc132 *** empty log message ***
abukhman
parents: 105
diff changeset
701 highlightQuery = pageinfo['highlightQuery']
95
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
702 query =pageinfo['query']
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
703 queryType =pageinfo['queryType']
96
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
704 viewMode= pageinfo['viewMode']
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
705 tocMode = pageinfo['tocMode']
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
706 tocPN = pageinfo['tocPN']
100
137459e3b378 Last update
abukhman
parents: 99
diff changeset
707 selfurl = self.absolute_url()
107
53c395d3175f *** empty log message ***
abukhman
parents: 106
diff changeset
708 page=self.template.fulltextclient.eval("/mpdl/interface/doc-query.xql","document=%s&mode=%s&queryType=%s&query=%s&queryResultPageSize=%s&queryResultPN=%s&sn=%s&viewMode=%s&highlightQuery=%s"%(docpath, 'text', queryType, query, pagesize, pn, sn, viewMode,highlightQuery) ,outputUnicode=False)
101
a839579233c3 Update for all Books(not for only Benedetti)
abukhman
parents: 100
diff changeset
709 pagexml = page.replace('?document=%s'%str(docpath),'?url=%s'%url)
95
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
710 pagedom = Parse(pagexml)
100
137459e3b378 Last update
abukhman
parents: 99
diff changeset
711 if (queryType=="fulltext")or(queryType=="xpath")or(queryType=="xquery")or(queryType=="fulltextMorphLemma"):
137459e3b378 Last update
abukhman
parents: 99
diff changeset
712 pagedivs = pagedom.xpath("//div[@class='queryResultPage']")
137459e3b378 Last update
abukhman
parents: 99
diff changeset
713 if len(pagedivs)>0:
137459e3b378 Last update
abukhman
parents: 99
diff changeset
714 pagenode=pagedivs[0]
137459e3b378 Last update
abukhman
parents: 99
diff changeset
715 links=pagenode.xpath("//a")
137459e3b378 Last update
abukhman
parents: 99
diff changeset
716 for l in links:
137459e3b378 Last update
abukhman
parents: 99
diff changeset
717 hrefNode = l.getAttributeNodeNS(None, u"href")
137459e3b378 Last update
abukhman
parents: 99
diff changeset
718 if hrefNode:
137459e3b378 Last update
abukhman
parents: 99
diff changeset
719 href = hrefNode.nodeValue
137459e3b378 Last update
abukhman
parents: 99
diff changeset
720 if href.startswith('page-fragment.xql'):
112
d48c1d507556 *** empty log message ***
abukhman
parents: 109
diff changeset
721 selfurl = self.absolute_url()
100
137459e3b378 Last update
abukhman
parents: 99
diff changeset
722 pagexml=href.replace('mode=text','mode=texttool&viewMode=%s&queryType=%s&query=%s&queryResultPageSize=%s&queryResultPN=%s&tocMode=%s&searchPN=%s&tocPN=%s'%(viewMode,queryType,query,pagesize,pn,tocMode,pn,tocPN))
112
d48c1d507556 *** empty log message ***
abukhman
parents: 109
diff changeset
723 hrefNode.nodeValue = pagexml.replace('page-fragment.xql','%s'%selfurl)
100
137459e3b378 Last update
abukhman
parents: 99
diff changeset
724 return serializeNode(pagenode)
97
2b8fd19432fb Last update
abukhman
parents: 96
diff changeset
725
100
137459e3b378 Last update
abukhman
parents: 99
diff changeset
726 if (queryType=="fulltextMorph"):
137459e3b378 Last update
abukhman
parents: 99
diff changeset
727 pagedivs = pagedom.xpath("//div[@class='queryResult']")
137459e3b378 Last update
abukhman
parents: 99
diff changeset
728 if len(pagedivs)>0:
137459e3b378 Last update
abukhman
parents: 99
diff changeset
729 pagenode=pagedivs[0]
137459e3b378 Last update
abukhman
parents: 99
diff changeset
730 links=pagenode.xpath("//a")
137459e3b378 Last update
abukhman
parents: 99
diff changeset
731 for l in links:
137459e3b378 Last update
abukhman
parents: 99
diff changeset
732 hrefNode = l.getAttributeNodeNS(None, u"href")
137459e3b378 Last update
abukhman
parents: 99
diff changeset
733 if hrefNode:
137459e3b378 Last update
abukhman
parents: 99
diff changeset
734 href = hrefNode.nodeValue
137459e3b378 Last update
abukhman
parents: 99
diff changeset
735 if href.startswith('page-fragment.xql'):
137459e3b378 Last update
abukhman
parents: 99
diff changeset
736 selfurl = self.absolute_url()
137459e3b378 Last update
abukhman
parents: 99
diff changeset
737 pagexml=href.replace('mode=text','mode=texttool&viewMode=%s&queryType=%s&query=%s&queryResultPageSize=%s&queryResultPN=%s&tocMode=%s&searchPN=%s&tocPN=%s'%(viewMode,queryType,query,pagesize,pn,tocMode,pn,tocPN))
137459e3b378 Last update
abukhman
parents: 99
diff changeset
738 hrefNode.nodeValue = pagexml.replace('page-fragment.xql','%s'%selfurl)
137459e3b378 Last update
abukhman
parents: 99
diff changeset
739 if href.startswith('../lt/lemma.xql'):
117
d9705375d4d7 *** empty log message ***
abukhman
parents: 116
diff changeset
740
d9705375d4d7 *** empty log message ***
abukhman
parents: 116
diff changeset
741 hrefNode.nodeValue = href.replace('../lt/lemma.xql','%s/template/head_main_lemma'%selfurl)
100
137459e3b378 Last update
abukhman
parents: 99
diff changeset
742 l.setAttributeNS(None, 'target', '_blank')
137459e3b378 Last update
abukhman
parents: 99
diff changeset
743 l.setAttributeNS(None, 'onClick',"popupWin = window.open(this.href, 'contacts', 'location,width=500,height=600,top=180, left=400, scrollbars=1'); return false;")
117
d9705375d4d7 *** empty log message ***
abukhman
parents: 116
diff changeset
744 l.setAttributeNS(None, 'onDblclick', 'popupWin.focus();')
d9705375d4d7 *** empty log message ***
abukhman
parents: 116
diff changeset
745 pagedivs = pagedom.xpath("//div[@class='queryResultMorphExpansion']")
100
137459e3b378 Last update
abukhman
parents: 99
diff changeset
746 return serializeNode(pagenode)
97
2b8fd19432fb Last update
abukhman
parents: 96
diff changeset
747
99
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
748 if (queryType=="ftIndex")or(queryType=="ftIndexMorph"):
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
749 pagedivs= pagedom.xpath("//div[@class='queryResultPage']")
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
750 if len(pagedivs)>0:
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
751 pagenode=pagedivs[0]
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
752 links=pagenode.xpath("//a")
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
753 for l in links:
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
754 hrefNode = l.getAttributeNodeNS(None, u"href")
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
755 if hrefNode:
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
756 href = hrefNode.nodeValue
100
137459e3b378 Last update
abukhman
parents: 99
diff changeset
757 hrefNode.nodeValue=href.replace('mode=text','mode=texttool&viewMode=%s&tocMode=%s&tocPN=%s&pn=%s'%(viewMode,tocMode,tocPN,pn))
137459e3b378 Last update
abukhman
parents: 99
diff changeset
758
99
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
759 if href.startswith('../lt/lex.xql'):
106
9f11913bc132 *** empty log message ***
abukhman
parents: 105
diff changeset
760 hrefNode.nodeValue = href.replace('../lt/lex.xql','%s/template/head_main_voc'%selfurl)
99
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
761 l.setAttributeNS(None, 'target', '_blank')
100
137459e3b378 Last update
abukhman
parents: 99
diff changeset
762 l.setAttributeNS(None, 'onClick',"popupWin = window.open(this.href, 'contacts', 'location,width=500,height=600,top=180, left=400, scrollbars=1'); return false;")
99
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
763 l.setAttributeNS(None, 'onDblclick', 'popupWin.focus();')
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
764 if href.startswith('../lt/lemma.xql'):
106
9f11913bc132 *** empty log message ***
abukhman
parents: 105
diff changeset
765 hrefNode.nodeValue = href.replace('../lt/lemma.xql','%s/template/head_main_lemma'%selfurl)
99
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
766 l.setAttributeNS(None, 'target', '_blank')
100
137459e3b378 Last update
abukhman
parents: 99
diff changeset
767 l.setAttributeNS(None, 'onClick',"popupWin = window.open(this.href, 'contacts', 'location,width=500,height=600,top=180, left=400, scrollbars=1'); return false;")
99
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
768 l.setAttributeNS(None, 'onDblclick', 'popupWin.focus();')
100
137459e3b378 Last update
abukhman
parents: 99
diff changeset
769 return serializeNode(pagenode)
101
a839579233c3 Update for all Books(not for only Benedetti)
abukhman
parents: 100
diff changeset
770 return "no text here"
97
2b8fd19432fb Last update
abukhman
parents: 96
diff changeset
771
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
772 def getNumPages(self,docinfo=None):
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
773 """get list of pages from fulltext and put in docinfo"""
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
774 xquery = '//pb'
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
775 text = self.template.fulltextclient.eval("/mpdl/interface/xquery.xql", "document=%s&xquery=%s"%(docinfo['textURLPath'],xquery))
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
776 # TODO: better processing of the page list. do we need the info somewhere else also?
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
777 docinfo['numPages'] = text.count("<pb ")
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
778 return docinfo
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
779
120
f1fc821f88a9 *** empty log message ***
abukhman
parents: 117
diff changeset
780 def getTextPage(self, mode="text", pn=1, docinfo=None, pageinfo=None, highlightQuery=None,sn=None, viewMode=None, tocMode=None, tocPN=None):
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
781 """returns single page from fulltext"""
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
782 docpath = docinfo['textURLPath']
112
d48c1d507556 *** empty log message ***
abukhman
parents: 109
diff changeset
783 path = docinfo['textURLPath']
d48c1d507556 *** empty log message ***
abukhman
parents: 109
diff changeset
784 url = docinfo['url']
d48c1d507556 *** empty log message ***
abukhman
parents: 109
diff changeset
785 viewMode= pageinfo['viewMode']
d48c1d507556 *** empty log message ***
abukhman
parents: 109
diff changeset
786 tocMode = pageinfo['tocMode']
d48c1d507556 *** empty log message ***
abukhman
parents: 109
diff changeset
787 tocPN = pageinfo['tocPN']
d48c1d507556 *** empty log message ***
abukhman
parents: 109
diff changeset
788 selfurl = self.absolute_url()
d48c1d507556 *** empty log message ***
abukhman
parents: 109
diff changeset
789
d48c1d507556 *** empty log message ***
abukhman
parents: 109
diff changeset
790 #pn = pageinfo['searchPN']
d48c1d507556 *** empty log message ***
abukhman
parents: 109
diff changeset
791
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
792 if mode == "text_dict":
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
793 textmode = "textPollux"
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
794 else:
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
795 textmode = mode
112
d48c1d507556 *** empty log message ***
abukhman
parents: 109
diff changeset
796
d48c1d507556 *** empty log message ***
abukhman
parents: 109
diff changeset
797 textParam = "document=%s&mode=%s&pn=%s"%(docpath,textmode,pn)
d48c1d507556 *** empty log message ***
abukhman
parents: 109
diff changeset
798 if highlightQuery is not None:
d48c1d507556 *** empty log message ***
abukhman
parents: 109
diff changeset
799 textParam +="&highlightQuery=%s&sn=%s"%(highlightQuery,sn)
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
800
112
d48c1d507556 *** empty log message ***
abukhman
parents: 109
diff changeset
801 pagexml=self.template.fulltextclient.eval("/mpdl/interface/page-fragment.xql", textParam, outputUnicode=False)
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
802 pagedom = Parse(pagexml)
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
803 # plain text mode
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
804 if mode == "text":
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
805 # first div contains text
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
806 pagedivs = pagedom.xpath("/div")
95
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
807 #queryResultPage
112
d48c1d507556 *** empty log message ***
abukhman
parents: 109
diff changeset
808 if len(pagedivs) > 0:
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
809 pagenode = pagedivs[0]
103
daedc22e4e76 last update
abukhman
parents: 102
diff changeset
810 links = pagenode.xpath("//a")
daedc22e4e76 last update
abukhman
parents: 102
diff changeset
811 for l in links:
daedc22e4e76 last update
abukhman
parents: 102
diff changeset
812 hrefNode = l.getAttributeNodeNS(None, u"href")
112
d48c1d507556 *** empty log message ***
abukhman
parents: 109
diff changeset
813
103
daedc22e4e76 last update
abukhman
parents: 102
diff changeset
814 if hrefNode:
daedc22e4e76 last update
abukhman
parents: 102
diff changeset
815 href= hrefNode.nodeValue
112
d48c1d507556 *** empty log message ***
abukhman
parents: 109
diff changeset
816 if href.startswith('#note-'):
d48c1d507556 *** empty log message ***
abukhman
parents: 109
diff changeset
817 hrefNode.nodeValue = href.replace('#note-',"?url=%s&viewMode=%s&tocMode=%s&tocPN=%s&pn=%s#note-"%(url,viewMode,tocMode,tocPN,pn))
d48c1d507556 *** empty log message ***
abukhman
parents: 109
diff changeset
818
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
819 return serializeNode(pagenode)
99
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
820 if mode == "xml":
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
821 # first div contains text
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
822 pagedivs = pagedom.xpath("/div")
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
823 if len(pagedivs) > 0:
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
824 pagenode = pagedivs[0]
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
825 return serializeNode(pagenode)
124
10d10e0db919 *** empty log message ***
abukhman
parents: 120
diff changeset
826 if mode == "pureXml":
10d10e0db919 *** empty log message ***
abukhman
parents: 120
diff changeset
827 # first div contains text
10d10e0db919 *** empty log message ***
abukhman
parents: 120
diff changeset
828 pagedivs = pagedom.xpath("/div")
10d10e0db919 *** empty log message ***
abukhman
parents: 120
diff changeset
829 if len(pagedivs) > 0:
10d10e0db919 *** empty log message ***
abukhman
parents: 120
diff changeset
830 pagenode = pagedivs[0]
10d10e0db919 *** empty log message ***
abukhman
parents: 120
diff changeset
831 return serializeNode(pagenode)
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
832 # text-with-links mode
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
833 if mode == "text_dict":
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
834 # first div contains text
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
835 pagedivs = pagedom.xpath("/div")
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
836 if len(pagedivs) > 0:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
837 pagenode = pagedivs[0]
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
838 # check all a-tags
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
839 links = pagenode.xpath("//a")
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
840 for l in links:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
841 hrefNode = l.getAttributeNodeNS(None, u"href")
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
842 if hrefNode:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
843 # is link with href
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
844 href = hrefNode.nodeValue
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
845 if href.startswith('lt/lex.xql'):
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
846 # is pollux link
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
847 selfurl = self.absolute_url()
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
848 # change href
96
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
849 hrefNode.nodeValue = href.replace('lt/lex.xql','%s/template/head_main_voc'%selfurl)
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
850 # add target
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
851 l.setAttributeNS(None, 'target', '_blank')
99
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
852 l.setAttributeNS(None, 'onClick',"popupWin = window.open(this.href, 'contacts', 'location,width=500,height=600,top=180, left=700, scrollbars=1'); return false;")
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
853 l.setAttributeNS(None, 'onDblclick', 'popupWin.focus();')
96
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
854
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
855 if href.startswith('lt/lemma.xql'):
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
856 selfurl = self.absolute_url()
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
857 hrefNode.nodeValue = href.replace('lt/lemma.xql','%s/template/head_main_lemma'%selfurl)
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
858 l.setAttributeNS(None, 'target', '_blank')
99
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
859 l.setAttributeNS(None, 'onClick',"popupWin = window.open(this.href, 'contacts', 'location,width=500,height=600,top=180, left=700, scrollbars=1'); return false;")
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
860 l.setAttributeNS(None, 'onDblclick', 'popupWin.focus();')
112
d48c1d507556 *** empty log message ***
abukhman
parents: 109
diff changeset
861
d48c1d507556 *** empty log message ***
abukhman
parents: 109
diff changeset
862 if href.startswith('#note-'):
d48c1d507556 *** empty log message ***
abukhman
parents: 109
diff changeset
863 hrefNode.nodeValue = href.replace('#note-',"?url=%s&viewMode=%s&tocMode=%s&tocPN=%s&pn=%s#note-"%(url,viewMode,tocMode,tocPN,pn))
d48c1d507556 *** empty log message ***
abukhman
parents: 109
diff changeset
864
d48c1d507556 *** empty log message ***
abukhman
parents: 109
diff changeset
865
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
866 return serializeNode(pagenode)
0
dwinter
parents:
diff changeset
867
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
868 return "no text here"
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
869
96
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
870 def getTranslate(self, query=None, language=None):
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
871 """translate into another languages"""
101
a839579233c3 Update for all Books(not for only Benedetti)
abukhman
parents: 100
diff changeset
872 pagexml=self.template.fulltextclient.eval("/mpdl/interface/lt/lex.xql","document=&language="+str(language)+"&query="+url_quote(str(query)))
96
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
873 return pagexml
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
874
97
2b8fd19432fb Last update
abukhman
parents: 96
diff changeset
875 def getLemma(self, lemma=None, language=None):
99
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
876 """simular words lemma """
101
a839579233c3 Update for all Books(not for only Benedetti)
abukhman
parents: 100
diff changeset
877 pagexml=self.template.fulltextclient.eval("/mpdl/interface/lt/lemma.xql","document=&language="+str(language)+"&lemma="+url_quote(str(lemma)))
a839579233c3 Update for all Books(not for only Benedetti)
abukhman
parents: 100
diff changeset
878 #pagexml=self.template.fulltextclient.eval("/mpdl/interface/lt/lemma.xql","lemma=%s&language=%s"%(lemma,language),outputUnicode=False)
96
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
879 return pagexml
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
880
97
2b8fd19432fb Last update
abukhman
parents: 96
diff changeset
881 def getQuery (self, docinfo=None, pageinfo=None, query=None, queryType=None, pn=1):
2b8fd19432fb Last update
abukhman
parents: 96
diff changeset
882 """number of"""
2b8fd19432fb Last update
abukhman
parents: 96
diff changeset
883 docpath = docinfo['textURLPath']
2b8fd19432fb Last update
abukhman
parents: 96
diff changeset
884 pagesize = pageinfo['queryPageSize']
2b8fd19432fb Last update
abukhman
parents: 96
diff changeset
885 pn = pageinfo['searchPN']
2b8fd19432fb Last update
abukhman
parents: 96
diff changeset
886 query =pageinfo['query']
2b8fd19432fb Last update
abukhman
parents: 96
diff changeset
887 queryType =pageinfo['queryType']
2b8fd19432fb Last update
abukhman
parents: 96
diff changeset
888
2b8fd19432fb Last update
abukhman
parents: 96
diff changeset
889 tocSearch = 0
2b8fd19432fb Last update
abukhman
parents: 96
diff changeset
890 tocDiv = None
2b8fd19432fb Last update
abukhman
parents: 96
diff changeset
891 pagexml=self.template.fulltextclient.eval("/mpdl/interface/doc-query.xql","document=%s&mode=%s&queryType=%s&query=%s&queryResultPageSize=%s&queryResultPN=%s"%(docpath, 'text', queryType, query, pagesize, pn) ,outputUnicode=False)
2b8fd19432fb Last update
abukhman
parents: 96
diff changeset
892
2b8fd19432fb Last update
abukhman
parents: 96
diff changeset
893 pagedom = Parse(pagexml)
2b8fd19432fb Last update
abukhman
parents: 96
diff changeset
894 numdivs = pagedom.xpath("//div[@class='queryResultHits']")
2b8fd19432fb Last update
abukhman
parents: 96
diff changeset
895 tocSearch = int(getTextFromNode(numdivs[0]))
105
6bffb612cd6a *** empty log message ***
abukhman
parents: 104
diff changeset
896 tc=int((tocSearch/10)+1)
97
2b8fd19432fb Last update
abukhman
parents: 96
diff changeset
897 logging.debug("documentViewer (gettoc) tc: %s"%(tc))
2b8fd19432fb Last update
abukhman
parents: 96
diff changeset
898 return tc
2b8fd19432fb Last update
abukhman
parents: 96
diff changeset
899
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
900 def getToc(self, mode="text", docinfo=None):
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
901 """loads table of contents and stores in docinfo"""
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
902 logging.debug("documentViewer (gettoc) mode: %s"%(mode))
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
903 if 'tocSize_%s'%mode in docinfo:
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
904 # cached toc
97
2b8fd19432fb Last update
abukhman
parents: 96
diff changeset
905 return docinfo
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
906 docpath = docinfo['textURLPath']
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
907 # we need to set a result set size
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
908 pagesize = 1000
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
909 pn = 1
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
910 if mode == "text":
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
911 queryType = "toc"
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
912 else:
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
913 queryType = mode
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
914 # number of entries in toc
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
915 tocSize = 0
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
916 tocDiv = None
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
917 pagexml=self.template.fulltextclient.eval("/mpdl/interface/doc-query.xql", "document=%s&queryType=%s&queryResultPageSize=%s&queryResultPN=%s"%(docpath,queryType,pagesize,pn), outputUnicode=False)
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
918 # post-processing downloaded xml
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
919 pagedom = Parse(pagexml)
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
920 # get number of entries
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
921 numdivs = pagedom.xpath("//div[@class='queryResultHits']")
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
922 if len(numdivs) > 0:
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
923 tocSize = int(getTextFromNode(numdivs[0]))
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
924 # div contains text
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
925 #pagedivs = pagedom.xpath("//div[@class='queryResultPage']")
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
926 #if len(pagedivs) > 0:
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
927 # tocDiv = pagedivs[0]
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
928
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
929 docinfo['tocSize_%s'%mode] = tocSize
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
930 #docinfo['tocDiv_%s'%mode] = tocDiv
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
931 return docinfo
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
932
95
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
933 def getTocPage(self, mode="text", pn=1, pageinfo=None, docinfo=None):
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
934 """returns single page from the table of contents"""
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
935 # TODO: this should use the cached TOC
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
936 if mode == "text":
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
937 queryType = "toc"
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
938 else:
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
939 queryType = mode
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
940 docpath = docinfo['textURLPath']
101
a839579233c3 Update for all Books(not for only Benedetti)
abukhman
parents: 100
diff changeset
941 path = docinfo['textURLPath']
a839579233c3 Update for all Books(not for only Benedetti)
abukhman
parents: 100
diff changeset
942 #logging.debug("documentViewer (gettoc) pathNomer: %s"%(pathNomer))
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
943 pagesize = pageinfo['tocPageSize']
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
944 pn = pageinfo['tocPN']
101
a839579233c3 Update for all Books(not for only Benedetti)
abukhman
parents: 100
diff changeset
945 url = docinfo['url']
96
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
946 selfurl = self.absolute_url()
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
947 viewMode= pageinfo['viewMode']
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
948 tocMode = pageinfo['tocMode']
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
949 tocPN = pageinfo['tocPN']
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
950
95
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
951 pagexml=self.template.fulltextclient.eval("/mpdl/interface/doc-query.xql", "document=%s&queryType=%s&queryResultPageSize=%s&queryResultPN=%s"%(docpath,queryType, pagesize, pn), outputUnicode=False)
101
a839579233c3 Update for all Books(not for only Benedetti)
abukhman
parents: 100
diff changeset
952 page = pagexml.replace('page-fragment.xql?document=%s'%str(path),'%s?url=%s&viewMode=%s&tocMode=%s&tocPN=%s'%(selfurl,url, viewMode, tocMode, tocPN))
96
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
953 text = page.replace('mode=image','mode=texttool')
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
954 return text
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
955 # post-processing downloaded xml
96
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
956 #pagedom = Parse(text)
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
957 # div contains text
96
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
958 #pagedivs = pagedom.xpath("//div[@class='queryResultPage']")
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
959 #if len(pagedivs) > 0:
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
960 # pagenode = pagedivs[0]
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
961 # return serializeNode(pagenode)
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
962 #else:
a679c8c7148d getTranslate, getLemma
abukhman
parents: 95
diff changeset
963 # return "No TOC!"
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
964
95
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
965 def changeDocumentViewer(self,title="",digilibBaseUrl=None,thumbrows=2,thumbcols=5,authgroups='mpiwg',RESPONSE=None):
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
966 """init document viewer"""
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
967 self.title=title
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
968 self.digilibBaseUrl = digilibBaseUrl
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
969 self.thumbrows = thumbrows
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
970 self.thumbcols = thumbcols
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
971 self.authgroups = [s.strip().lower() for s in authgroups.split(',')]
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
972 if RESPONSE is not None:
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
973 RESPONSE.redirect('manage_main')
0
dwinter
parents:
diff changeset
974
dwinter
parents:
diff changeset
975
dwinter
parents:
diff changeset
976
dwinter
parents:
diff changeset
977 def manage_AddDocumentViewerForm(self):
dwinter
parents:
diff changeset
978 """add the viewer form"""
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
979 pt=PageTemplateFile('zpt/addDocumentViewer', globals()).__of__(self)
0
dwinter
parents:
diff changeset
980 return pt()
dwinter
parents:
diff changeset
981
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
982 def manage_AddDocumentViewer(self,id,imageScalerUrl="",textServerName="",title="",RESPONSE=None):
0
dwinter
parents:
diff changeset
983 """add the viewer"""
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
984 newObj=documentViewer(id,imageScalerUrl=imageScalerUrl,title=title,textServerName=textServerName)
0
dwinter
parents:
diff changeset
985 self._setObject(id,newObj)
dwinter
parents:
diff changeset
986
dwinter
parents:
diff changeset
987 if RESPONSE is not None:
dwinter
parents:
diff changeset
988 RESPONSE.redirect('manage_main')
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
989
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
990
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
991 ##
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
992 ## DocumentViewerTemplate class
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
993 ##
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
994 class DocumentViewerTemplate(ZopePageTemplate):
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
995 """Template for document viewer"""
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
996 meta_type="DocumentViewer Template"
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
997
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
998
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
999 def manage_addDocumentViewerTemplateForm(self):
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
1000 """Form for adding"""
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
1001 pt=PageTemplateFile('zpt/addDocumentViewerTemplate', globals()).__of__(self)
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
1002 return pt()
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
1003
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
1004 def manage_addDocumentViewerTemplate(self, id='viewer_main', title=None, text=None,
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
1005 REQUEST=None, submit=None):
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
1006 "Add a Page Template with optional file content."
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
1007
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
1008 self._setObject(id, DocumentViewerTemplate(id))
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
1009 ob = getattr(self, id)
53
f4e0af8c281d NEW - # 44: ECHO - vollst?ndige bibliographische Angabe
dwinter
parents: 52
diff changeset
1010 txt=file(os.path.join(package_home(globals()),'zpt/viewer_main.zpt'),'r').read()
f4e0af8c281d NEW - # 44: ECHO - vollst?ndige bibliographische Angabe
dwinter
parents: 52
diff changeset
1011 logging.info("txt %s:"%txt)
f4e0af8c281d NEW - # 44: ECHO - vollst?ndige bibliographische Angabe
dwinter
parents: 52
diff changeset
1012 ob.pt_edit(txt,"text/html")
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
1013 if title:
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
1014 ob.pt_setTitle(title)
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
1015 try:
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
1016 u = self.DestinationURL()
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
1017 except AttributeError:
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
1018 u = REQUEST['URL1']
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
1019
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
1020 u = "%s/%s" % (u, urllib.quote(id))
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
1021 REQUEST.RESPONSE.redirect(u+'/manage_main')
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
1022 return ''
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
1023
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
1024
41
0c8ee8fcfd76 some more logging
casties
parents: 40
diff changeset
1025