Mercurial > hg > documentViewer
annotate documentViewer.py @ 432:8d8f2cbd6213
*** empty log message ***
| author | abukhman |
|---|---|
| date | Fri, 18 Feb 2011 12:21:46 +0100 |
| parents | d6a2125a4b09 |
| children | 44ccb7bd0938 |
| rev | line source |
|---|---|
| 46 | 1 |
| 0 | 2 from OFS.Folder import Folder |
| 3 from Products.PageTemplates.ZopePageTemplate import ZopePageTemplate | |
| 52 | 4 from Products.PageTemplates.PageTemplateFile import PageTemplateFile |
| 0 | 5 from AccessControl import ClassSecurityInfo |
| 32 | 6 from AccessControl import getSecurityManager |
| 0 | 7 from Globals import package_home |
| 235 | 8 from Products.zogiLib.zogiLib import browserCheck |
| 0 | 9 |
|
130
5c779d7b5f71
more modular version with separate object MpdlXmlTextServer
casties
parents:
128
diff
changeset
|
10 from Ft.Xml import EMPTY_NAMESPACE, Parse |
| 134 | 11 import Ft.Xml.Domlette |
| 0 | 12 import os.path |
| 31 | 13 import sys |
| 0 | 14 import urllib |
|
130
5c779d7b5f71
more modular version with separate object MpdlXmlTextServer
casties
parents:
128
diff
changeset
|
15 import urllib2 |
|
50
6c0f20cecc60
added evaluation of the presentation/info.xml in texttools
dwinter
parents:
49
diff
changeset
|
16 import logging |
| 61 | 17 import math |
| 46 | 18 import urlparse |
|
130
5c779d7b5f71
more modular version with separate object MpdlXmlTextServer
casties
parents:
128
diff
changeset
|
19 import cStringIO |
| 174 | 20 import re |
| 389 | 21 import string |
| 231 | 22 |
def logger(txt, method, txt2):
    """Log txt followed by txt2 at INFO level on the root logger.

    method is accepted for compatibility with existing callers but is not used.
    """
    message = txt + txt2
    logging.info(message)
| 26 | |
| 27 | |
def getInt(number, default=0):
    """Return number converted to int, or int(default) if that fails.

    number  -- value to convert (anything int() accepts)
    default -- fallback value, itself passed through int() (0 if omitted)
    """
    try:
        return int(number)
    except Exception:
        # Exception instead of a bare except: every conversion problem still
        # yields the default, but KeyboardInterrupt and SystemExit are no
        # longer swallowed (Python >= 2.5)
        return int(default)
| 25 | 34 |
def getTextFromNode(nodename):
    """Return the joined data of all direct text-node children of a DOM node.

    Returns "" if nodename is None or has no text children; text inside
    child elements is not included.
    """
    if nodename is None:
        return ""
    pieces = [child.data
              for child in nodename.childNodes
              if child.nodeType == child.TEXT_NODE]
    return "".join(pieces)
| 45 | |
|
84
a6e4f9b6729a
first version with new full-text infrastructure and slightly changed templates
casties
parents:
83
diff
changeset
|
def serializeNode(node, encoding='utf-8'):
    """Serialize node with Ft.Xml.Domlette.Print and return the XML as a string.

    node     -- the node to print
    encoding -- output encoding handed to Print (default 'utf-8')
    """
    out = cStringIO.StringIO()
    try:
        Ft.Xml.Domlette.Print(node, stream=out, encoding=encoding)
        return out.getvalue()
    finally:
        out.close()
|
a6e4f9b6729a
first version with new full-text infrastructure and slightly changed templates
casties
parents:
83
diff
changeset
|
53 |
def browserCheck(self):
    """Inspect the User-Agent header of self.REQUEST and describe the browser.

    Returns a dict with the keys
      'ua'                 -- the User-Agent string ("" if the header is missing)
      'isIE', 'isN4'       -- browser family flags
      'isMac', 'isWin'     -- platform flags
      'isIEWin', 'isIEMac' -- combinations of the flags above
      'versIE', 'versFirefox', 'versSafariChrome', 'versOpera'
                           -- version strings, "" when not detected
      'staticHTML'         -- always False
    """
    # a request without User-Agent header must not crash the detection
    ua = self.REQUEST.get_header("HTTP_USER_AGENT") or ""
    isIE = ua.find('MSIE') > -1

    bt = {}
    bt['ua'] = ua
    bt['isIE'] = isIE
    # Netscape 4 is only considered when the browser is not IE
    bt['isN4'] = (not isIE) and (ua.find('Mozilla/4.') > -1)
    bt['versFirefox'] = ""
    bt['versIE'] = ""
    bt['versSafariChrome'] = ""
    bt['versOpera'] = ""

    # rest of the string starting at the first '(' resp. the first ')'.
    # When the character is missing find() returns -1 and only the last
    # character remains, which never matches any of the patterns below.
    nav = ua[ua.find('('):]
    nav1 = ua[ua.find(')'):]

    # Each detection stands on its own: a token missing for one browser
    # (IndexError) must not prevent the detection of another one.

    # Safari or Chrome: "...) <engine> (KHTML, like Gecko) <name>/<version> Safari/<build>"
    try:
        nav2 = nav1[nav1.find('('):]
        nav3 = nav2[nav2.find(')'):]
        tokens = nav3.split(" ")
        if tokens[2].find("Safari") > -1:
            bt['versSafariChrome'] = tokens[1].split("/")[1]
    except IndexError:
        pass

    # IE: "(compatible; MSIE <version>; ...)"
    try:
        ie = nav.split("; ")[1]
        if ie.find("MSIE") > -1:
            bt['versIE'] = ie.split(" ")[1]
    except IndexError:
        pass

    # Firefox: "...) Gecko/<date> Firefox/<version>"
    try:
        candidate = nav1.split(" ")[2]
        if candidate.find("Firefox") > -1:
            version = candidate.split("/")[1]
            logging.debug("FIREFOX: %s"%(version))
            # only major.minor is reported
            bt['versFirefox'] = version[0:3]
    except IndexError:
        pass

    # Opera: "Opera/<x> (...) Presto/<y> Version/<version>"
    try:
        if ua.find("Opera") > -1:
            afterParen = nav[nav.find(')'):]
            bt['versOpera'] = afterParen.split("/")[2]
    except IndexError:
        pass

    bt['isMac'] = ua.find('Macintosh') > -1
    bt['isWin'] = ua.find('Windows') > -1
    bt['isIEWin'] = bt['isIE'] and bt['isWin']
    bt['isIEMac'] = bt['isIE'] and bt['isMac']
    bt['staticHTML'] = False

    return bt
| 234 | 114 |
| 115 | |
def getParentDir(path):
    """Return path without its last '/'-separated component.

    A path without any '/' yields the empty string.
    """
    segments = path.split('/')
    # split() always yields at least one element, so pop() is safe
    segments.pop()
    return '/'.join(segments)
| 119 | |
| 120 | |
|
130
5c779d7b5f71
more modular version with separate object MpdlXmlTextServer
casties
parents:
128
diff
changeset
|
def getHttpData(url, data=None, num_tries=3, timeout=10):
    """Fetch url with HTTP GET and return the response body.

    url       -- base URL of the request
    data      -- optional query: a string is appended verbatim after '?',
                 a dict, list or tuple is urlencoded first
    num_tries -- maximum number of attempts; only an URLError leads to
                 another attempt, an HTTPError ends the loop at once
    timeout   -- timeout in seconds for each attempt

    Raises IOError (with the last error message) if no response was obtained.
    """
    # we do GET (by appending data to url)
    if isinstance(data, basestring):
        # if data is string then append
        url = "%s?%s"%(url,data)
    elif isinstance(data, (dict, list, tuple)):
        # urlencode
        url = "%s?%s"%(url,urllib.urlencode(data))

    response = None
    errmsg = None
    for cnt in range(num_tries):
        try:
            logging.debug("getHttpData(#%s %ss) url=%s"%(cnt+1,timeout,url))
            if sys.version_info < (2, 6):
                # urlopen has no timeout parameter before Python 2.6, so the
                # process-wide socket default is set instead -- ugly :-(
                import socket
                socket.setdefaulttimeout(float(timeout))
                response = urllib2.urlopen(url)
            else:
                response = urllib2.urlopen(url,timeout=float(timeout))
            # got a response -- no further attempts needed
            break
        except urllib2.HTTPError:
            # HTTPError is a subclass of URLError and has to be handled first.
            # sys.exc_info() is used to fetch the exception because it works
            # the same on every Python version.
            e = sys.exc_info()[1]
            logging.error("getHttpData: HTTP error(%s): %s"%(e.code,e))
            errmsg = str(e)
            # the server answered with an error status: stop trying
            break
        except urllib2.URLError:
            e = sys.exc_info()[1]
            logging.error("getHttpData: URLLIB error(%s): %s"%(e.reason,e))
            errmsg = str(e)
            # connection problem: fall through and try again

    if response is not None:
        try:
            return response.read()
        finally:
            # release the connection even if reading the body fails
            response.close()

    raise IOError("ERROR fetching HTTP data from %s: %s"%(url,errmsg))
|
5c779d7b5f71
more modular version with separate object MpdlXmlTextServer
casties
parents:
128
diff
changeset
|
163 |
| 0 | 164 |
| 165 | |
| 22 | 166 ## |
| 167 ## documentViewer class | |
| 168 ## | |
| 169 class documentViewer(Folder): | |
| 0 | 170 """document viewer""" |
| 171 meta_type="Document viewer" | |
| 172 | |
| 173 security=ClassSecurityInfo() | |
| 22 | 174 manage_options=Folder.manage_options+( |
| 0 | 175 {'label':'main config','action':'changeDocumentViewerForm'}, |
| 176 ) | |
| 177 | |
| 22 | 178 # templates and forms |
| 179 viewer_main = PageTemplateFile('zpt/viewer_main', globals()) | |
|
90
6a4a72033d58
new version with new full-text infrastructure and some more changed templates
casties
parents:
84
diff
changeset
|
180 toc_thumbs = PageTemplateFile('zpt/toc_thumbs', globals()) |
|
6a4a72033d58
new version with new full-text infrastructure and some more changed templates
casties
parents:
84
diff
changeset
|
181 toc_text = PageTemplateFile('zpt/toc_text', globals()) |
|
6a4a72033d58
new version with new full-text infrastructure and some more changed templates
casties
parents:
84
diff
changeset
|
182 toc_figures = PageTemplateFile('zpt/toc_figures', globals()) |
|
84
a6e4f9b6729a
first version with new full-text infrastructure and slightly changed templates
casties
parents:
83
diff
changeset
|
183 page_main_images = PageTemplateFile('zpt/page_main_images', globals()) |
| 412 | 184 page_main_double = PageTemplateFile('zpt/page_main_double', globals()) |
|
84
a6e4f9b6729a
first version with new full-text infrastructure and slightly changed templates
casties
parents:
83
diff
changeset
|
185 page_main_text = PageTemplateFile('zpt/page_main_text', globals()) |
|
90
6a4a72033d58
new version with new full-text infrastructure and some more changed templates
casties
parents:
84
diff
changeset
|
186 page_main_text_dict = PageTemplateFile('zpt/page_main_text_dict', globals()) |
| 140 | 187 page_main_gis =PageTemplateFile ('zpt/page_main_gis', globals()) |
| 99 | 188 page_main_xml = PageTemplateFile('zpt/page_main_xml', globals()) |
| 404 | 189 page_main_pureXml = PageTemplateFile('zpt/page_main_pureXml', globals()) |
| 22 | 190 head_main = PageTemplateFile('zpt/head_main', globals()) |
| 191 docuviewer_css = PageTemplateFile('css/docuviewer.css', globals()) | |
| 57 | 192 info_xml = PageTemplateFile('zpt/info_xml', globals()) |
|
130
5c779d7b5f71
more modular version with separate object MpdlXmlTextServer
casties
parents:
128
diff
changeset
|
193 |
|
5c779d7b5f71
more modular version with separate object MpdlXmlTextServer
casties
parents:
128
diff
changeset
|
194 |
| 68 | 195 thumbs_main_rss = PageTemplateFile('zpt/thumbs_main_rss', globals()) |
| 22 | 196 security.declareProtected('View management screens','changeDocumentViewerForm') |
| 197 changeDocumentViewerForm = PageTemplateFile('zpt/changeDocumentViewer', globals()) | |
| 198 | |
| 0 | 199 |
def __init__(self,id,imageScalerUrl=None,textServerName=None,title="",digilibBaseUrl=None,thumbcols=2,thumbrows=5,authgroups="mpiwg"):
    """Set up the document viewer and its 'template' sub-folder.

    id             -- id of this object
    imageScalerUrl -- passed to zogiLib as dlServerURL
    textServerName -- passed to MpdlXmlTextServer as serverName
    title          -- title of this object
    digilibBaseUrl -- base URL of digilib; None lets the view methods
                      determine it on first use
    thumbcols      -- stored as self.thumbcols
    thumbrows      -- stored as self.thumbrows
    authgroups     -- comma separated list of authorized groups

    Failure to create the text server or the zogiLib object is logged and
    does not abort the construction.
    """
    self.id=id
    self.title=title
    self.thumbcols = thumbcols
    self.thumbrows = thumbrows
    # keep the configured URL; the parameter used to be dropped, leaving
    # the attribute undefined for methods that read self.digilibBaseUrl
    self.digilibBaseUrl = digilibBaseUrl
    # authgroups is list of authorized groups (delimited by ,)
    self.authgroups = [s.strip().lower() for s in authgroups.split(',')]

    # create template folder so we can always use template.something
    templateFolder = Folder('template')
    self._setObject('template',templateFolder) # old style (not Zope-2.12 item assignment)

    try:
        import MpdlXmlTextServer
        textServer = MpdlXmlTextServer.MpdlXmlTextServer(id='fulltextclient',serverName=textServerName)
        templateFolder._setObject('fulltextclient',textServer)
    except Exception:
        # sys.exc_info() fetches the exception the same way on every Python version
        e = sys.exc_info()[1]
        logging.error("Unable to create MpdlXmlTextServer for fulltextclient: "+str(e))

    try:
        from Products.zogiLib.zogiLib import zogiLib
        zogilib = zogiLib(id="zogilib", title="zogilib for docuviewer", dlServerURL=imageScalerUrl, layout="book")
        templateFolder._setObject('zogilib',zogilib)
    except Exception:
        e = sys.exc_info()[1]
        logging.error("Unable to create zogiLib for zogilib: "+str(e))
|
a6e4f9b6729a
first version with new full-text infrastructure and slightly changed templates
casties
parents:
83
diff
changeset
|
227 |
|
130
5c779d7b5f71
more modular version with separate object MpdlXmlTextServer
casties
parents:
128
diff
changeset
|
228 |
|
5c779d7b5f71
more modular version with separate object MpdlXmlTextServer
casties
parents:
128
diff
changeset
|
229 # proxy text server methods to fulltextclient |
|
5c779d7b5f71
more modular version with separate object MpdlXmlTextServer
casties
parents:
128
diff
changeset
|
def getTextPage(self, **args):
    """Forward all keyword arguments to getTextPage of template.fulltextclient and return its result."""
    textServer = self.template.fulltextclient
    return textServer.getTextPage(**args)
| 430 | 233 |
|
130
5c779d7b5f71
more modular version with separate object MpdlXmlTextServer
casties
parents:
128
diff
changeset
|
def getQuery(self, **args):
    """Forward all keyword arguments to getQuery of template.fulltextclient and return its result."""
    textServer = self.template.fulltextclient
    return textServer.getQuery(**args)
| 419 | 237 |
|
130
5c779d7b5f71
more modular version with separate object MpdlXmlTextServer
casties
parents:
128
diff
changeset
|
def getSearch(self, **args):
    """Forward all keyword arguments to getSearch of template.fulltextclient and return its result."""
    textServer = self.template.fulltextclient
    return textServer.getSearch(**args)
| 256 | 241 |
def getGisPlaces(self, **args):
    """Forward all keyword arguments to getGisPlaces of template.fulltextclient and return its result."""
    textServer = self.template.fulltextclient
    return textServer.getGisPlaces(**args)
| 307 | 245 |
def getAllGisPlaces(self, **args):
    """Forward all keyword arguments to getAllGisPlaces of template.fulltextclient and return its result."""
    textServer = self.template.fulltextclient
    return textServer.getAllGisPlaces(**args)
| 419 | 249 |
|
130
5c779d7b5f71
more modular version with separate object MpdlXmlTextServer
casties
parents:
128
diff
changeset
|
def getTranslate(self, **args):
    """Forward all keyword arguments to getTranslate of template.fulltextclient and return its result."""
    textServer = self.template.fulltextclient
    return textServer.getTranslate(**args)
|
5c779d7b5f71
more modular version with separate object MpdlXmlTextServer
casties
parents:
128
diff
changeset
|
253 |
|
5c779d7b5f71
more modular version with separate object MpdlXmlTextServer
casties
parents:
128
diff
changeset
|
def getLemma(self, **args):
    """Forward all keyword arguments to getLemma of template.fulltextclient and return its result."""
    textServer = self.template.fulltextclient
    return textServer.getLemma(**args)
|
5c779d7b5f71
more modular version with separate object MpdlXmlTextServer
casties
parents:
128
diff
changeset
|
257 |
|
5c779d7b5f71
more modular version with separate object MpdlXmlTextServer
casties
parents:
128
diff
changeset
|
def getToc(self, **args):
    """Forward all keyword arguments to getToc of template.fulltextclient and return its result."""
    textServer = self.template.fulltextclient
    return textServer.getToc(**args)
|
5c779d7b5f71
more modular version with separate object MpdlXmlTextServer
casties
parents:
128
diff
changeset
|
261 |
|
5c779d7b5f71
more modular version with separate object MpdlXmlTextServer
casties
parents:
128
diff
changeset
|
def getTocPage(self, **args):
    """Forward all keyword arguments to getTocPage of template.fulltextclient and return its result."""
    textServer = self.template.fulltextclient
    return textServer.getTocPage(**args)
|
5c779d7b5f71
more modular version with separate object MpdlXmlTextServer
casties
parents:
128
diff
changeset
|
265 |
|
5c779d7b5f71
more modular version with separate object MpdlXmlTextServer
casties
parents:
128
diff
changeset
|
266 |
| 68 | 267 security.declareProtected('View','thumbs_rss') |
def thumbs_rss(self,mode,url,viewMode="auto",start=None,pn=1):
    """Render the document through the 'thumbs_main_rss' template.

    mode     -- defines how to access the document behind url
    url      -- url which contains display information
    viewMode -- "text", "images" or "auto" (default); "auto" becomes "text"
                if docinfo has a 'textURL' key or a true 'textURLPath',
                otherwise "images"
    start    -- handed to getPageinfo as start
    pn       -- handed to getPageinfo as current
    """
    logging.debug("HHHHHHHHHHHHHH:load the rss")
    logger("documentViewer (index)", logging.INFO, "mode: %s url:%s start:%s pn:%s"%(mode,url,start,pn))

    if not hasattr(self, 'template'):
        # create template folder if it doesn't exist
        self.manage_addFolder('template')

    # getattr (as in index_html): an instance on which digilibBaseUrl was
    # never assigned must get the default instead of raising AttributeError
    if not getattr(self, 'digilibBaseUrl', None):
        self.digilibBaseUrl = self.findDigilibUrl() or "http://nausikaa.mpiwg-berlin.mpg.de/digitallibrary"

    docinfo = self.getDocinfo(mode=mode,url=url)
    pageinfo = self.getPageinfo(start=start,current=pn, docinfo=docinfo)
    pt = getattr(self.template, 'thumbs_main_rss')

    if viewMode=="auto": # automatic mode selected
        if docinfo.has_key("textURL") or docinfo.get('textURLPath',None): # text url is set and text viewer is configured
            viewMode="text"
        else:
            viewMode="images"

    return pt(docinfo=docinfo,pageinfo=pageinfo,viewMode=viewMode)
| 299 | |
| 22 | 300 security.declareProtected('View','index_html') |
def index_html(self,url,mode="texttool",viewMode="auto",tocMode="thumbs",start=None,pn=1,mk=None):
    """Render the document through the 'viewer_main' template.

    url      -- url which contains display information
    mode     -- defines how to access the document behind url
    viewMode -- kind of display; "auto" (default) becomes "text_dict" if
                docinfo has a 'textURL' key or a true 'textURLPath',
                otherwise "images"
    tocMode  -- type of 'table of contents' for navigation (thumbs, text,
                figures, none); anything but "thumbs" loads the toc via getToc
    start    -- handed to getPageinfo as start
    pn       -- handed to getPageinfo as current
    mk       -- mark(s), handed to the template after generateMarks()

    Returns the rendered template, or an error string if the template
    folder is missing.
    """
    logging.debug("documentViewer (index) mode: %s url:%s start:%s pn:%s"%(mode,url,start,pn))

    # without the template folder nothing can be rendered
    if not hasattr(self, 'template'):
        logging.error("template folder missing!")
        return "ERROR: template folder missing!"

    if not getattr(self, 'digilibBaseUrl', None):
        fallbackUrl = "http://digilib.mpiwg-berlin.mpg.de/digitallibrary"
        self.digilibBaseUrl = self.findDigilibUrl() or fallbackUrl

    docinfo = self.getDocinfo(mode=mode,url=url)
    if tocMode != "thumbs":
        # get table of contents
        docinfo = self.getToc(mode=tocMode, docinfo=docinfo)

    if viewMode == "auto":
        # automatic mode: show text if a text url is set, else images
        textAvailable = docinfo.has_key('textURL') or docinfo.get('textURLPath',None)
        viewMode = "images"
        if textAvailable:
            viewMode = "text_dict"

    pageinfo = self.getPageinfo(start=start,current=pn, docinfo=docinfo,viewMode=viewMode,tocMode=tocMode)

    if docinfo.get('textURLPath',None):
        pageinfo['textPage'] = self.getTextPage(docinfo=docinfo, pageinfo=pageinfo)

    mainTemplate = self.template.viewer_main
    return mainTemplate(docinfo=docinfo,pageinfo=pageinfo,viewMode=viewMode,mk=self.generateMarks(mk))
| 0 | 342 |
def generateMarks(self,mk):
    """Return the marks as a string of 'mk=<value>' items.

    mk may be None (gives ""), a list of values or a single value; the
    items are joined without any separator.
    """
    if mk is None:
        return ""
    if isinstance(mk, list):
        marks = mk
    else:
        marks = [mk]
    return "".join(["mk=%s" % m for m in marks])
| 389 | 352 |
| 353 | |
def getBrowser(self):
    """Return the browser description computed by browserCheck() and log it at debug level."""
    browserInfo = browserCheck(self)
    logging.debug("BROWSER VERSION: %s" % browserInfo)
    return browserInfo
| 387 | 359 |
|
84
a6e4f9b6729a
first version with new full-text infrastructure and slightly changed templates
casties
parents:
83
diff
changeset
|
def findDigilibUrl(self):
    """Try to get the digilib base URL from the zogilib object in the template folder.

    Returns the result of zogilib.getDLBaseUrl(), or None if there is no
    template folder or no zogilib object in it, so that callers can fall
    back to a default with `findDigilibUrl() or default`.
    """
    templateFolder = getattr(self, 'template', None)
    zogilib = getattr(templateFolder, 'zogilib', None)
    if zogilib is None:
        # creating zogilib may have failed when the viewer was set up
        return None
    return zogilib.getDLBaseUrl()
| 126 | 364 |
def getDocumentViewerURL(self):
    """Return the result of absolute_url() of this instance."""
    viewerUrl = self.absolute_url()
    return viewerUrl
|
84
a6e4f9b6729a
first version with new full-text infrastructure and slightly changed templates
casties
parents:
83
diff
changeset
|
368 |
|
a6e4f9b6729a
first version with new full-text infrastructure and slightly changed templates
casties
parents:
83
diff
changeset
|
def getStyle(self, idx, selected, style=""):
    """Return style, with 'sel' appended when idx equals selected."""
    if idx == selected:
        return style + 'sel'
    return style
| 74 | 376 |
def getLink(self, param=None, val=None, params=None, baseUrl=None, paramSep='&'):
    """Return an URL to the documentviewer built from the current request parameters.

    param    -- name of a single parameter to change
    val      -- new value for param (stored as str); None removes param
    params   -- dict of further parameters to change; a value of None
                removes that parameter
    baseUrl  -- URL in front of the query string (default: REQUEST['URL1'])
    paramSep -- separator between the parameters

    Values are quoted with quote_plus (leaving '/' unescaped). A list or
    tuple value produces one 'key=value' pair per element, and non-string
    values are converted with str() before quoting.
    """
    # copy existing request params
    urlParams=self.REQUEST.form.copy()
    # change single param
    if param is not None:
        if val is None:
            urlParams.pop(param, None)
        else:
            urlParams[param] = str(val)

    # change more params
    if params is not None:
        for (k, v) in params.items():
            if v is None:
                # val=None removes param
                urlParams.pop(k, None)
            else:
                urlParams[k] = v

    # FIXME: does this belong here?
    if urlParams.get("mode", None) == "filepath":
        # if filepath was set on the first call, change it to imagepath now
        urlParams["mode"] = "imagepath"
        urlParams["url"] = getParentDir(urlParams["url"])

    # quote values and assemble into query string (not escaping '/')
    pairs = []
    for (k, v) in urlParams.items():
        # multi-valued request parameters arrive as lists
        if isinstance(v, (list, tuple)):
            values = v
        else:
            values = [v]
        for item in values:
            if not isinstance(item, basestring):
                # quote_plus only accepts strings
                item = str(item)
            pairs.append("%s=%s"%(k,urllib.quote_plus(item,'/')))
    ps = paramSep.join(pairs)

    if baseUrl is None:
        baseUrl = self.REQUEST['URL1']

    return "%s?%s"%(baseUrl, ps)
| 414 | |
| 413 | 415 |
def getLinkAmp(self, param=None, val=None, params=None, baseUrl=None):
    """Return a link like getLink() but with '&amp;' between parameters.

    Takes the same param/val/params/baseUrl arguments as getLink(); the
    HTML-escaped separator makes the result safe to embed in markup.
    """
    # the escaped separator is what distinguishes this method from getLink()
    return self.getLink(param, val, params, baseUrl, '&amp;')
|
81
fae97f071724
fixed problem with info.xml when url without index.meta
casties
parents:
79
diff
changeset
|
419 |
def getInfo_xml(self,url,mode):
    """Return info about the document at url (read in the given mode) as XML.

    Sets self.digilibBaseUrl first if it is empty, then renders the
    'info_xml' template with the docinfo from getDocinfo().
    """
    if not self.digilibBaseUrl:
        # fall back to the default digilib server if none can be found
        found = self.findDigilibUrl()
        self.digilibBaseUrl = found or "http://nausikaa.mpiwg-berlin.mpg.de/digitallibrary"

    info = self.getDocinfo(mode=mode, url=url)
    render = self.template.info_xml
    return render(docinfo=info)
| 429 | |
def getOptionToggle(self, newState=None, optionName='text_options_open', initialState=True):
    """Return the current on/off state of a session-stored option.

    The option is kept in REQUEST.SESSION under optionName as a dict with
    the keys 'state' and 'lastState'. On first use the state is
    initialState; afterwards the state flips each time newState differs
    from the value passed on the previous call.
    """
    session = self.REQUEST.SESSION
    if session.has_key(optionName):
        option = session.get(optionName)
        if option['lastState'] != newState:
            # the requested state changed since the last call -- toggle
            option['state'] = not option['state']
            option['lastState'] = newState
    else:
        # not in session yet -- start with the initial state
        option = {'lastState': newState, 'state': initialState}

    session[optionName] = option
    return option['state']
| 0 | 444 |
def isAccessible(self, docinfo):
    """Return True if access to the resource described by docinfo is granted.

    Reads docinfo['accessType']:
    'free'                         -- always accessible
    missing or in self.authgroups  -- accessible to logged-in users only
    anything else                  -- logged as an error and denied
    """
    access = docinfo.get('accessType', None)
    logging.debug("documentViewer (accessOK) access type %s"%access)

    if access == 'free':
        logging.debug("documentViewer (accessOK) access is free")
        return True

    if access is not None and access not in self.authgroups:
        logging.error("documentViewer (accessOK) unknown access type %s"%access)
        return False

    # only local access -- only logged in users
    user = getSecurityManager().getUser()
    logging.debug("documentViewer (accessOK) user=%s ip=%s"%(user,self.REQUEST.getClientAddr()))
    if user is None:
        return False
    return (user.getUserName() != "Anonymous User")
| 35 | 464 |
| 32 | 465 |
def getDirinfoFromDigilib(self,path,docinfo=None,cut=0):
    """Add the number of pages in a digilib directory to docinfo.

    path    -- digilib directory path
    docinfo -- dict to update (a new dict is created if None)
    cut     -- number of trailing path levels to strip (via getParentDir)
               before querying

    Queries dirInfo-xml.jsp below self.digilibBaseUrl and stores the
    reported size as docinfo['numPages'] (0 if no size is reported).
    Returns docinfo. Raises IOError if the dir-info cannot be read.
    """
    if docinfo is None:
        docinfo = {}

    for x in range(cut):
        path = getParentDir(path)

    infoUrl = self.digilibBaseUrl+"/dirInfo-xml.jsp?mo=dir&fn="+path
    logging.debug("documentViewer (getparamfromdigilib) dirInfo from %s"%(infoUrl))

    txt = getHttpData(infoUrl)
    if txt is None:
        raise IOError("Unable to get dir-info from %s"%(infoUrl))

    dom = Parse(txt)
    sizes = dom.xpath("//dir/size")
    # the message previously had no placeholder, so sizes was never logged
    logging.debug("documentViewer (getparamfromdigilib) dirInfo:size %s", sizes)

    if sizes:
        docinfo['numPages'] = int(getTextFromNode(sizes[0]))
    else:
        docinfo['numPages'] = 0

    # TODO: produce and keep list of image names and numbers

    return docinfo
| 32 | 495 |
def getIndexMetaPath(self,url):
    """Return only the path part of url, rooted at /mpiwg/online.

    The url must contain 'experimental/' or 'permanent/'; everything from
    the last such segment on is appended to '/mpiwg/online/'. Returns ""
    if neither segment occurs.
    """
    found = re.match(r".*(experimental|permanent)/(.*)", url)
    if found is None:
        return ""
    area = found.group(1)
    rest = found.group(2)
    logging.debug("(getDomFromIndexMeta): URLXAXA: %s"%rest)
    return "/mpiwg/online/" + area + "/" + rest
| 504 | |
| 225 | 505 |
| 506 | |
def getIndexMetaUrl(self,url):
    """Return the URL of the index.meta document for url.

    A url starting with "http://" is returned unchanged. Anything else is
    treated as an online path: "/mpiwg/online" is removed, the path is
    passed to the Texter servlet below self.digilibBaseUrl, and
    "/index.meta" is appended unless the path already ends with index.meta.
    """
    if url.startswith("http://"):
        # real URL -- use as is
        return url

    # online path
    # NOTE(review): the suffix check is assumed to apply to online paths only -- confirm
    metaUrl = self.digilibBaseUrl + "/servlet/Texter?fn=" + url.replace("/mpiwg/online","")
    if not metaUrl.endswith("index.meta"):
        metaUrl += "/index.meta"
    return metaUrl
| 522 | |
def getDomFromIndexMeta(self, url):
    """Fetch the index.meta document for url and return it parsed as a DOM.

    The location is resolved with getIndexMetaUrl(). Raises IOError if
    no data could be read.
    """
    metaUrl = self.getIndexMetaUrl(url)
    logging.debug("(getDomFromIndexMeta): METAURL: %s"%metaUrl)

    txt = getHttpData(metaUrl)
    if txt is not None:
        return Parse(txt)

    raise IOError("Unable to read index meta from %s"%(url))
|
50
6c0f20cecc60
added evaluation of the presentation/info.xml in texttools
dwinter
parents:
49
diff
changeset
|
535 |
|
6c0f20cecc60
added evaluation of the presentation/info.xml in texttools
dwinter
parents:
49
diff
changeset
|
def getPresentationInfoXML(self, url):
    """Fetch the info.xml document at url and return it parsed as a DOM.

    A url starting with "http://" is fetched directly; anything else is
    treated as an online path and read through the Texter servlet below
    self.digilibBaseUrl, with "/mpiwg/online" removed. Raises IOError if
    no data could be read.
    """
    if url.startswith("http://"):
        # real URL
        metaUrl = url
    else:
        # online path
        metaUrl = self.digilibBaseUrl + "/servlet/Texter?fn=" + url.replace("/mpiwg/online","")

    txt = getHttpData(metaUrl)
    if txt is not None:
        return Parse(txt)

    raise IOError("Unable to read infoXMLfrom %s"%(url))
| 35 | 554 |
| 555 | |
def getAuthinfoFromIndexMeta(self,path,docinfo=None,dom=None,cut=0):
    """Read the access type from an index.meta file into docinfo.

    path    -- path of the index.meta; only used when dom is None
    docinfo -- dict to update (a new dict is created if None)
    dom     -- already parsed index.meta; loaded from path if None
    cut     -- number of trailing path levels to strip (via getParentDir)
               before loading

    Sets docinfo['accessType'] to the type attribute of
    access-conditions/access, or None if there is none. For the types
    'group' and 'institution' the lower-cased access name is stored
    instead; if that name element is missing the bare type is kept.
    Returns docinfo.
    """
    logging.debug("documentViewer (getauthinfofromindexmeta) path: %s"%(path))

    if docinfo is None:
        docinfo = {}

    if dom is None:
        for x in range(cut):
            path = getParentDir(path)
        dom = self.getDomFromIndexMeta(path)

    access = None
    acctype = dom.xpath("//access-conditions/access/@type")
    if acctype:
        access = acctype[0].value
        if access in ['group', 'institution']:
            names = dom.xpath("//access-conditions/access/name")
            if names:
                access = getTextFromNode(names[0]).lower()
            else:
                # a missing name used to raise IndexError; keep the bare type
                logging.warning("documentViewer (getauthinfofromindexmeta) access name missing for type %s in: %s"%(access, path))

    docinfo['accessType'] = access
    return docinfo
| 29 | 578 |
| 32 | 579 |
def getBibinfoFromIndexMeta(self,path,docinfo=None,dom=None,cut=0):
    """Read bibliographical info from an index.meta file into docinfo.

    path    -- path of the index.meta; only used for loading when dom is None
    docinfo -- dict to update (a new dict is created if None)
    dom     -- already parsed index.meta; loaded from path if None
    cut     -- number of trailing path levels to strip (via getParentDir)
               before loading

    Sets docinfo['indexMetaPath'], docinfo['bib'] (all raw bib fields, when
    present) and docinfo['bib_type']. If the metadata mapping for the bib
    type has an author entry, author/title/year are read through the
    mapping and a fixed set of further fields is read directly, each
    defaulting to ''. Returns docinfo.
    """
    logging.debug("documentViewer (getbibinfofromindexmeta) path: %s"%(path))

    if docinfo is None:
        docinfo = {}

    if dom is None:
        for x in range(cut):
            path = getParentDir(path)
        dom = self.getDomFromIndexMeta(path)

    docinfo['indexMetaPath'] = self.getIndexMetaPath(path)

    logging.debug("documentViewer (getbibinfofromindexmeta cutted) path: %s"%(path))
    # put in all raw bib fields as dict "bib"
    bib = dom.xpath("//bib/*")
    if bib:
        bibinfo = {}
        for e in bib:
            bibinfo[e.localName] = getTextFromNode(e)
        docinfo['bib'] = bibinfo

    # extract some fields (author, title, year) according to their mapping
    metaData = self.metadata.main.meta.bib
    bibtype = dom.xpath("//bib/@type")
    if bibtype:
        bibtype = bibtype[0].value
    else:
        bibtype = "generic"

    # index.meta types may use "-" where the mapping uses " "
    bibtype = bibtype.replace("-"," ")
    docinfo['bib_type'] = bibtype
    bibmap = metaData.generateMappingForType(bibtype)
    logging.debug("documentViewer (getbibinfofromindexmeta) bibmap:"+repr(bibmap))
    logging.debug("documentViewer (getbibinfofromindexmeta) bibtype:"+repr(bibtype))

    # if there is no mapping bibmap is empty (mapping sometimes has empty fields)
    # NOTE(review): all field lookups below are assumed to sit under this guard -- confirm
    if len(bibmap) > 0 and len(bibmap['author'][0]) > 0:
        # mapped fields: left untouched when the lookup fails
        for field in ('author', 'title', 'year'):
            try:
                docinfo[field] = getTextFromNode(dom.xpath("//bib/%s"%bibmap[field][0])[0])
            except Exception:
                pass
        logging.debug("documentViewer (getbibinfofromindexmeta) using mapping for %s"%bibtype)

        # unmapped fields: default to '' when the lookup fails
        for field in ('lang', 'city', 'number_of_pages', 'series_volume',
                      'number_of_volumes', 'translator', 'edition',
                      'series_author', 'publisher', 'series_title',
                      'isbn_issn'):
            try:
                docinfo[field] = getTextFromNode(dom.xpath("//bib/%s"%field)[0])
            except Exception:
                docinfo[field] = ''

    return docinfo
| 83 | 673 |
| 218 | 674 |
def getNameFromIndexMeta(self,path,docinfo=None,dom=None,cut=0):
    """Read the resource name from an index.meta file into docinfo.

    path    -- path of the index.meta; only used when dom is None
    docinfo -- dict to update (a new dict is created if None)
    dom     -- already parsed index.meta; loaded from path if None
    cut     -- number of trailing path levels to strip (via getParentDir)
               before loading

    Sets docinfo['name'] to the text of /resource/name, or to '' when the
    element is missing. Returns docinfo.
    """
    if docinfo is None:
        docinfo = {}

    if dom is None:
        for x in range(cut):
            path = getParentDir(path)
        dom = self.getDomFromIndexMeta(path)

    names = dom.xpath("/resource/name")
    if names:
        docinfo['name'] = getTextFromNode(names[0])
    else:
        # a missing name used to raise IndexError here
        docinfo['name'] = ''
    logging.debug("documentViewer docinfo[name] %s"%docinfo['name'])
    return docinfo
| 83 | 688 |
|
84
a6e4f9b6729a
first version with new full-text infrastructure and slightly changed templates
casties
parents:
83
diff
changeset
|
def getDocinfoFromTextTool(self, url, dom=None, docinfo=None):
    """Parse the texttool section of an index.meta file into docinfo.

    url     -- URL or online path of the index.meta
    dom     -- already parsed index.meta; loaded from url if None
    docinfo -- dict to update (a new dict is created if None)

    Fills in imagePath/imageURL (plus numPages via getDirinfoFromDigilib
    when an image directory is given), viewerURL, textURL and textURLPath
    where the corresponding texttool elements exist, then adds the bib,
    name, optional presentation and access info. Returns docinfo.
    Raises IOError if no archive path can be determined.
    """
    logging.debug("documentViewer (getdocinfofromtexttool) url: %s" % (url))
    if docinfo is None:
        docinfo = {}
    if docinfo.get('lang', None) is None:
        docinfo['lang'] = '' # default: no language set
    if dom is None:
        dom = self.getDomFromIndexMeta(url)

    archivePath = None
    archiveName = None

    archiveNames = dom.xpath("//resource/name")
    if archiveNames:
        archiveName = getTextFromNode(archiveNames[0])
    else:
        logging.warning("documentViewer (getdocinfofromtexttool) resource/name missing in: %s" % (url))

    archivePaths = dom.xpath("//resource/archive-path")
    if archivePaths:
        archivePath = getTextFromNode(archivePaths[0])

    if archivePath:
        # clean up archive path
        if not archivePath.startswith('/'):
            archivePath = '/' + archivePath
        if archiveName and (not archivePath.endswith(archiveName)):
            archivePath += "/" + archiveName
    else:
        # an empty archive-path element is treated like a missing one
        # (indexing its first character used to raise IndexError)
        archivePath = None
        # try to get archive-path from url
        logging.warning("documentViewer (getdocinfofromtexttool) resource/archive-path missing in: %s" % (url))
        if (not url.startswith('http')):
            archivePath = url.replace('index.meta', '')

    if archivePath is None:
        # we balk without archive-path
        raise IOError("Missing archive-path (for text-tool) in %s" % (url))

    imageDirs = dom.xpath("//texttool/image")
    if imageDirs:
        imageDir = getTextFromNode(imageDirs[0])
    else:
        # no image tag is not an error any more because text mode is now standard
        imageDir = ""
        docinfo['imagePath'] = "" # no images
        docinfo['imageURL'] = ""

    if imageDir and archivePath:
        imageDir = os.path.join(archivePath, imageDir)
        imageDir = imageDir.replace("/mpiwg/online", '')
        docinfo = self.getDirinfoFromDigilib(imageDir, docinfo=docinfo)
        docinfo['imagePath'] = imageDir
        docinfo['imageURL'] = self.digilibBaseUrl + "/servlet/Scaler?fn=" + imageDir

    viewerUrls = dom.xpath("//texttool/digiliburlprefix")
    if viewerUrls:
        docinfo['viewerURL'] = getTextFromNode(viewerUrls[0])

    # old style text URL
    textUrls = dom.xpath("//texttool/text")
    if textUrls:
        textUrl = getTextFromNode(textUrls[0])
        if urlparse.urlparse(textUrl)[0] == "":
            # no scheme, so not a URL -- resolve against the archive path
            textUrl = os.path.join(archivePath, textUrl)
        # fix URLs starting with /mpiwg/online
        if textUrl.startswith("/mpiwg/online"):
            textUrl = textUrl.replace("/mpiwg/online", '', 1)
        docinfo['textURL'] = textUrl

    # new style text-url-path
    textUrls = dom.xpath("//texttool/text-url-path")
    if textUrls:
        docinfo['textURLPath'] = getTextFromNode(textUrls[0])

    presentationUrls = dom.xpath("//texttool/presentation")
    docinfo = self.getBibinfoFromIndexMeta(url, docinfo=docinfo, dom=dom) # get info from bib tag
    docinfo = self.getNameFromIndexMeta(url, docinfo=docinfo, dom=dom)

    if presentationUrls:
        # presentation info overrides the bib info read above; its URL is
        # the index.meta URL with index.meta replaced by the relative path
        # of the presentation info
        presentationPath = getTextFromNode(presentationUrls[0])
        if url.endswith("index.meta"):
            presentationUrl = url.replace('index.meta', presentationPath)
        else:
            presentationUrl = url + "/" + presentationPath

        docinfo = self.getBibinfoFromTextToolPresentation(presentationUrl, docinfo=docinfo, dom=dom)

    docinfo = self.getAuthinfoFromIndexMeta(url, docinfo=docinfo, dom=dom) # get access info

    return docinfo
| 22 | 793 |
|
50
6c0f20cecc60
added evaluation of the presentation/info.xml in texttools
dwinter
parents:
49
diff
changeset
|
794 |
|
6c0f20cecc60
added evaluation of the presentation/info.xml in texttools
dwinter
parents:
49
diff
changeset
|
def getBibinfoFromTextToolPresentation(self,url,docinfo=None,dom=None):
    """Get the bibliographical information from the presentation entry in texttools.

    Fetches the presentation info XML for url through
    self.getPresentationInfoXML and copies the text of the first
    //author, //title and //date node into docinfo['author'],
    docinfo['title'] and docinfo['year'].  A field that can not be read
    is left untouched.

    url     -- URL of the presentation info file
    docinfo -- dict to update; a new dict is created when None
    dom     -- kept for signature compatibility only; the value passed in
               is ignored and the presentation XML is always fetched from url

    Returns the updated docinfo dict.
    """
    if docinfo is None:
        # with docinfo=None every assignment below used to fail silently
        # and None was handed back to the caller
        docinfo = {}
    dom = self.getPresentationInfoXML(url)
    fields = (('author', "//author"),
              ('title', "//title"),
              ('year', "//date"))
    for key, xpath in fields:
        try:
            docinfo[key] = getTextFromNode(dom.xpath(xpath)[0])
        except Exception:
            # best effort: a missing node (or missing presentation XML)
            # must not abort the viewer, but leave a trace in the log
            logging.debug("documentViewer (getbibinfofromtexttoolpresentation) no %s in %s"%(key, url))
    return docinfo
|
6c0f20cecc60
added evaluation of the presentation/info.xml in texttools
dwinter
parents:
49
diff
changeset
|
812 |
def getDocinfoFromImagePath(self,path,docinfo=None,cut=0):
    """Build docinfo for a path pointing to the images.

    The index.meta file is assumed to be one level above the image
    directory.  cut is the number of directory levels removed from the
    path before the scaler URL is built.
    """
    logging.debug("documentViewer (getdocinfofromimagepath) path: %s"%(path))
    if docinfo is None:
        docinfo = {}
    imagePath = path.replace("/mpiwg/online","")
    docinfo['imagePath'] = imagePath
    docinfo = self.getDirinfoFromDigilib(imagePath,docinfo=docinfo,cut=cut)

    # climb up cut levels; the unshortened path is still needed below
    scalerPath = imagePath
    for _ in range(cut):
        scalerPath = getParentDir(scalerPath)
    logging.debug("documentViewer (getdocinfofromimagepath) PATH:"+scalerPath)
    docinfo['imageURL'] = self.digilibBaseUrl+"/servlet/Scaler?fn="+scalerPath

    # index.meta is looked up one level higher than the images
    metaCut = cut + 1
    docinfo = self.getBibinfoFromIndexMeta(imagePath,docinfo=docinfo,cut=metaCut)
    docinfo = self.getAuthinfoFromIndexMeta(imagePath,docinfo=docinfo,cut=metaCut)
    return docinfo
| 20 | 833 |
| 22 | 834 |
def getDocinfo(self, mode, url):
    """Return the docinfo for the given mode and url.

    A docinfo stored in the session is reused when its mode and url match;
    otherwise a new one is built, stored in the session and returned.
    Raises ValueError for an unknown mode.
    """
    logging.debug("documentViewer (getdocinfo) mode: %s, url: %s"%(mode,url))
    session = self.REQUEST.SESSION
    # try the docinfo cached in the session first
    if session.has_key('docinfo'):
        cached = session['docinfo']
        # only usable if it was built for the same mode and url
        if cached is not None and cached.get('mode') == mode and cached.get('url') == url:
            logging.debug("documentViewer (getdocinfo) docinfo in session: %s"%cached)
            return cached

    # nothing usable cached: build a fresh docinfo
    docinfo = {'mode': mode, 'url': url}
    if mode == "texttool":
        # index.meta with texttool information
        docinfo = self.getDocinfoFromTextTool(url, docinfo=docinfo)
    elif mode == "imagepath":
        docinfo = self.getDocinfoFromImagePath(url, docinfo=docinfo)
    elif mode == "filepath":
        docinfo = self.getDocinfoFromImagePath(url, docinfo=docinfo,cut=1)
    else:
        logging.error("documentViewer (getdocinfo) unknown mode: %s!"%mode)
        raise ValueError("Unknown mode %s! Has to be one of 'texttool','imagepath','filepath'."%(mode))

    # FIXME: fake texturlpath
    if 'textURLPath' not in docinfo:
        docinfo['textURLPath'] = None

    logging.debug("documentViewer (getdocinfo) docinfo: %s"%docinfo)
    session['docinfo'] = docinfo
    return docinfo
| 128 | 865 |
def getPageinfo(self, current, start=None, rows=None, cols=None, docinfo=None, viewMode=None, tocMode=None):
    """Return the pageinfo dict for the given parameters.

    current    -- current page number (converted with getInt)
    start      -- first page of the thumbnail group; when it can not be
                  converted to an int it is derived from current
    rows, cols -- thumbnail grid size, defaulting to self.thumbrows and
                  self.thumbcols
    docinfo    -- optional docinfo dict; 'numPages' and
                  'tocSize_<tocMode>' are read from it when present
    viewMode, tocMode -- stored unchanged in the result

    All remaining entries are read from self.REQUEST with defaults.
    """
    pageinfo = {}
    current = getInt(current)
    pageinfo['current'] = current
    rows = int(rows or self.thumbrows)
    pageinfo['rows'] = rows
    cols = int(cols or self.thumbcols)
    pageinfo['cols'] = cols
    grpsize = cols * rows
    pageinfo['groupsize'] = grpsize
    # fallback for start: first page of the thumbnail group that contains current
    start = getInt(start, default=(math.ceil(float(current)/float(grpsize))*grpsize-(grpsize-1)))
    pageinfo['start'] = start
    pageinfo['end'] = start + grpsize
    if (docinfo is not None) and ('numPages' in docinfo):
        numPages = int(docinfo['numPages'])
        pageinfo['end'] = min(pageinfo['end'], numPages)
        # number of thumbnail groups, rounded up
        numgroups, rest = divmod(numPages, grpsize)
        if rest > 0:
            numgroups += 1
        pageinfo['numgroups'] = numgroups

    pageinfo['viewMode'] = viewMode
    pageinfo['tocMode'] = tocMode
    # request parameters copied into pageinfo together with their defaults
    requestDefaults = (
        ('characterNormalization', 'reg'),
        ('optionToggle', ''),
        ('query', ''),
        ('queryType', ''),
        ('querySearch', 'fulltext'),
        ('textPN', '1'),
        ('highlightQuery', ''),
        ('tocPageSize', '30'),
        ('queryPageSize', '10'),
        ('tocPN', '1'),
    )
    for key, default in requestDefaults:
        pageinfo[key] = self.REQUEST.get(key, default)

    toc = int(pageinfo['tocPN'])
    pageinfo['textPages'] = int(toc)

    tocKey = 'tocSize_%s'%tocMode
    # docinfo is optional: the membership test used to raise TypeError for None
    if docinfo is not None and tocKey in docinfo:
        # cached toc: limit tocPN to the last toc page
        tocSize = int(docinfo[tocKey])
        tocPageSize = int(pageinfo['tocPageSize'])
        tocPages, rest = divmod(tocSize, tocPageSize)
        if rest > 0:
            tocPages += 1
        pageinfo['tocPN'] = min(tocPages, toc)
    pageinfo['searchPN'] = self.REQUEST.get('searchPN','1')
    pageinfo['sn'] = self.REQUEST.get('sn','')
    return pageinfo
| 918 | |
def changeDocumentViewer(self,title="",digilibBaseUrl=None,thumbrows=2,thumbcols=5,authgroups='mpiwg',RESPONSE=None):
    """Store the document viewer settings.

    authgroups is a comma separated string; it is stored as a list of
    stripped, lower-cased group names.  When RESPONSE is given the
    browser is redirected to manage_main.
    """
    self.title = title
    self.digilibBaseUrl = digilibBaseUrl
    self.thumbrows = thumbrows
    self.thumbcols = thumbcols
    groups = []
    for name in authgroups.split(','):
        groups.append(name.strip().lower())
    self.authgroups = groups
    if RESPONSE is None:
        return
    RESPONSE.redirect('manage_main')
| 0 | 928 |
def manage_AddDocumentViewerForm(self):
    """Render the form for adding a document viewer."""
    template = PageTemplateFile('zpt/addDocumentViewer', globals())
    # bind the template to this container before rendering it
    return template.__of__(self)()
| 933 | |
|
84
a6e4f9b6729a
first version with new full-text infrastructure and slightly changed templates
casties
parents:
83
diff
changeset
|
def manage_AddDocumentViewer(self,id,imageScalerUrl="",textServerName="",title="",RESPONSE=None):
    """Create a documentViewer with the given id and add it to this container.

    When RESPONSE is given the browser is redirected to manage_main.
    """
    viewer = documentViewer(id,
                            imageScalerUrl=imageScalerUrl,
                            title=title,
                            textServerName=textServerName)
    self._setObject(id, viewer)
    if RESPONSE is None:
        return
    RESPONSE.redirect('manage_main')
| 22 | 941 |
| 942 ## DocumentViewerTemplate class | |
class DocumentViewerTemplate(ZopePageTemplate):
    """Page template class for the document viewer."""
    # name under which this class is registered as a Zope meta type
    meta_type = "DocumentViewer Template"
| 946 | |
| 947 | |
def manage_addDocumentViewerTemplateForm(self):
    """Render the form for adding a DocumentViewerTemplate."""
    template = PageTemplateFile('zpt/addDocumentViewerTemplate', globals())
    # bind the template to this container before rendering it
    return template.__of__(self)()
| 952 | |
def manage_addDocumentViewerTemplate(self, id='viewer_main', title=None, text=None,
                           REQUEST=None, submit=None):
    """Add a DocumentViewerTemplate filled with the default viewer template.

    id      -- id of the new template object
    title   -- optional title to set on the template
    text    -- accepted but not used; the content always comes from
               zpt/viewer_main.zpt in the package directory
    REQUEST -- when given, the browser is redirected to the manage_main
               page of the new object; when None no redirect happens
    submit  -- accepted but not used

    Returns an empty string.
    """
    self._setObject(id, DocumentViewerTemplate(id))
    ob = getattr(self, id)
    templatePath = os.path.join(package_home(globals()),'zpt/viewer_main.zpt')
    # close the file explicitly instead of leaving it to the garbage collector
    templateFile = open(templatePath,'r')
    try:
        txt = templateFile.read()
    finally:
        templateFile.close()
    logging.info("txt %s:"%txt)
    ob.pt_edit(txt,"text/html")
    if title:
        ob.pt_setTitle(title)
    if REQUEST is None:
        # called from code without a request: nothing to redirect
        return ''
    try:
        u = self.DestinationURL()
    except AttributeError:
        u = REQUEST['URL1']

    u = "%s/%s" % (u, urllib.quote(id))
    REQUEST.RESPONSE.redirect(u+'/manage_main')
    return ''
| 972 | |
| 973 | |
| 41 | 974 |
