annotate documentViewer.py @ 410:13dd83f46f6f

*** empty log message ***
author abukhman
date Mon, 06 Dec 2010 11:39:43 +0100
parents f7d73ea4b38b
children 759ed7577eef
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
46
31059e3d9338 has now also a text mode viewMode=text
dwinter
parents: 45
diff changeset
1
0
dwinter
parents:
diff changeset
2 from OFS.Folder import Folder
dwinter
parents:
diff changeset
3 from Products.PageTemplates.ZopePageTemplate import ZopePageTemplate
52
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
4 from Products.PageTemplates.PageTemplateFile import PageTemplateFile
0
dwinter
parents:
diff changeset
5 from AccessControl import ClassSecurityInfo
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
6 from AccessControl import getSecurityManager
0
dwinter
parents:
diff changeset
7 from Globals import package_home
235
f4ece44559e5 *** empty log message ***
abukhman
parents: 234
diff changeset
8 from Products.zogiLib.zogiLib import browserCheck
0
dwinter
parents:
diff changeset
9
130
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
10 from Ft.Xml import EMPTY_NAMESPACE, Parse
134
6a33aa624ba4 fixed more oopsies
casties
parents: 133
diff changeset
11 import Ft.Xml.Domlette
0
dwinter
parents:
diff changeset
12 import os.path
31
c6451e8d5d23 more small fixes - now version 0.2.2
casties
parents: 29
diff changeset
13 import sys
0
dwinter
parents:
diff changeset
14 import urllib
130
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
15 import urllib2
50
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
16 import logging
61
f3d2f240692c fixed bug in calculation of group numbers
casties
parents: 59
diff changeset
17 import math
46
31059e3d9338 has now also a text mode viewMode=text
dwinter
parents: 45
diff changeset
18 import urlparse
130
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
19 import cStringIO
174
5780092e4989 *** empty log message ***
dwinter
parents: 173
diff changeset
20 import re
389
114d40b358ab *** empty log message ***
abukhman
parents: 387
diff changeset
21 import string
231
a88ece9a5e74 *** empty log message ***
abukhman
parents: 230
diff changeset
22
52
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
23 def logger(txt,method,txt2):
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
24 """logging"""
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
25 logging.info(txt+ txt2)
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
26
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
27
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
28 def getInt(number, default=0):
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
29 """returns always an int (0 in case of problems)"""
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
30 try:
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
31 return int(number)
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
32 except:
62
8a16ea8db858 fixed bug in getInt
casties
parents: 61
diff changeset
33 return int(default)
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
34
0
dwinter
parents:
diff changeset
35 def getTextFromNode(nodename):
46
31059e3d9338 has now also a text mode viewMode=text
dwinter
parents: 45
diff changeset
36 """get the cdata content of a node"""
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
37 if nodename is None:
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
38 return ""
0
dwinter
parents:
diff changeset
39 nodelist=nodename.childNodes
dwinter
parents:
diff changeset
40 rc = ""
dwinter
parents:
diff changeset
41 for node in nodelist:
dwinter
parents:
diff changeset
42 if node.nodeType == node.TEXT_NODE:
dwinter
parents:
diff changeset
43 rc = rc + node.data
dwinter
parents:
diff changeset
44 return rc
dwinter
parents:
diff changeset
45
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
46 def serializeNode(node, encoding='utf-8'):
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
47 """returns a string containing node as XML"""
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
48 buf = cStringIO.StringIO()
136
a2114cd4673c fixed broken imports (silly me)
casties
parents: 135
diff changeset
49 Ft.Xml.Domlette.Print(node, stream=buf, encoding=encoding)
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
50 s = buf.getvalue()
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
51 buf.close()
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
52 return s
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
53
387
580db757e0eb *** empty log message ***
abukhman
parents: 386
diff changeset
54 def browserCheck(self):
580db757e0eb *** empty log message ***
abukhman
parents: 386
diff changeset
55 """check the browsers request to find out the browser type"""
580db757e0eb *** empty log message ***
abukhman
parents: 386
diff changeset
56 bt = {}
580db757e0eb *** empty log message ***
abukhman
parents: 386
diff changeset
57 ua = self.REQUEST.get_header("HTTP_USER_AGENT")
580db757e0eb *** empty log message ***
abukhman
parents: 386
diff changeset
58 bt['ua'] = ua
580db757e0eb *** empty log message ***
abukhman
parents: 386
diff changeset
59 bt['isIE'] = False
580db757e0eb *** empty log message ***
abukhman
parents: 386
diff changeset
60 bt['isN4'] = False
580db757e0eb *** empty log message ***
abukhman
parents: 386
diff changeset
61 if string.find(ua, 'MSIE') > -1:
580db757e0eb *** empty log message ***
abukhman
parents: 386
diff changeset
62 bt['isIE'] = True
580db757e0eb *** empty log message ***
abukhman
parents: 386
diff changeset
63 else:
580db757e0eb *** empty log message ***
abukhman
parents: 386
diff changeset
64 bt['isN4'] = (string.find(ua, 'Mozilla/4.') > -1)
580db757e0eb *** empty log message ***
abukhman
parents: 386
diff changeset
65
580db757e0eb *** empty log message ***
abukhman
parents: 386
diff changeset
66 try:
580db757e0eb *** empty log message ***
abukhman
parents: 386
diff changeset
67 nav = ua[string.find(ua, '('):]
580db757e0eb *** empty log message ***
abukhman
parents: 386
diff changeset
68 ie = string.split(nav, "; ")[1]
580db757e0eb *** empty log message ***
abukhman
parents: 386
diff changeset
69 if string.find(ie, "MSIE") > -1:
580db757e0eb *** empty log message ***
abukhman
parents: 386
diff changeset
70 bt['versIE'] = string.split(ie, " ")[1]
580db757e0eb *** empty log message ***
abukhman
parents: 386
diff changeset
71 except: pass
580db757e0eb *** empty log message ***
abukhman
parents: 386
diff changeset
72
580db757e0eb *** empty log message ***
abukhman
parents: 386
diff changeset
73 bt['isMac'] = string.find(ua, 'Macintosh') > -1
580db757e0eb *** empty log message ***
abukhman
parents: 386
diff changeset
74 bt['isWin'] = string.find(ua, 'Windows') > -1
580db757e0eb *** empty log message ***
abukhman
parents: 386
diff changeset
75 bt['isIEWin'] = bt['isIE'] and bt['isWin']
580db757e0eb *** empty log message ***
abukhman
parents: 386
diff changeset
76 bt['isIEMac'] = bt['isIE'] and bt['isMac']
580db757e0eb *** empty log message ***
abukhman
parents: 386
diff changeset
77 bt['staticHTML'] = False
580db757e0eb *** empty log message ***
abukhman
parents: 386
diff changeset
78
580db757e0eb *** empty log message ***
abukhman
parents: 386
diff changeset
79 return bt
234
0813585df9f4 *** empty log message ***
abukhman
parents: 231
diff changeset
80
0813585df9f4 *** empty log message ***
abukhman
parents: 231
diff changeset
81
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
82 def getParentDir(path):
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
83 """returns pathname shortened by one"""
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
84 return '/'.join(path.split('/')[0:-1])
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
85
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
86
130
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
87 def getHttpData(url, data=None, num_tries=3, timeout=10):
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
88 """returns result from url+data HTTP request"""
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
89 # we do GET (by appending data to url)
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
90 if isinstance(data, str) or isinstance(data, unicode):
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
91 # if data is string then append
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
92 url = "%s?%s"%(url,data)
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
93 elif isinstance(data, dict) or isinstance(data, list) or isinstance(data, tuple):
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
94 # urlencode
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
95 url = "%s?%s"%(url,urllib.urlencode(data))
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
96
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
97 response = None
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
98 errmsg = None
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
99 for cnt in range(num_tries):
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
100 try:
167
7e2b97941a66 characterNormalization
abukhman
parents: 166
diff changeset
101 logging.debug("getHttpData(#%s %ss) url=%s"%(cnt+1,timeout,url))
130
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
102 if sys.version_info < (2, 6):
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
103 # set timeout on socket -- ugly :-(
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
104 import socket
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
105 socket.setdefaulttimeout(float(timeout))
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
106 response = urllib2.urlopen(url)
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
107 else:
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
108 response = urllib2.urlopen(url,timeout=float(timeout))
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
109 # check result?
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
110 break
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
111 except urllib2.HTTPError, e:
167
7e2b97941a66 characterNormalization
abukhman
parents: 166
diff changeset
112 logging.error("getHttpData: HTTP error(%s): %s"%(e.code,e))
130
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
113 errmsg = str(e)
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
114 # stop trying
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
115 break
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
116 except urllib2.URLError, e:
167
7e2b97941a66 characterNormalization
abukhman
parents: 166
diff changeset
117 logging.error("getHttpData: URLLIB error(%s): %s"%(e.reason,e))
130
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
118 errmsg = str(e)
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
119 # stop trying
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
120 #break
0
dwinter
parents:
diff changeset
121
130
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
122 if response is not None:
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
123 data = response.read()
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
124 response.close()
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
125 return data
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
126
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
127 raise IOError("ERROR fetching HTTP data from %s: %s"%(url,errmsg))
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
128 #return None
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
129
0
dwinter
parents:
diff changeset
130
dwinter
parents:
diff changeset
131
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
132 ##
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
133 ## documentViewer class
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
134 ##
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
135 class documentViewer(Folder):
0
dwinter
parents:
diff changeset
136 """document viewer"""
dwinter
parents:
diff changeset
137 meta_type="Document viewer"
dwinter
parents:
diff changeset
138
dwinter
parents:
diff changeset
139 security=ClassSecurityInfo()
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
140 manage_options=Folder.manage_options+(
0
dwinter
parents:
diff changeset
141 {'label':'main config','action':'changeDocumentViewerForm'},
dwinter
parents:
diff changeset
142 )
dwinter
parents:
diff changeset
143
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
144 # templates and forms
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
145 viewer_main = PageTemplateFile('zpt/viewer_main', globals())
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
146 toc_thumbs = PageTemplateFile('zpt/toc_thumbs', globals())
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
147 toc_text = PageTemplateFile('zpt/toc_text', globals())
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
148 toc_figures = PageTemplateFile('zpt/toc_figures', globals())
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
149 page_main_images = PageTemplateFile('zpt/page_main_images', globals())
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
150 page_main_text = PageTemplateFile('zpt/page_main_text', globals())
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
151 page_main_text_dict = PageTemplateFile('zpt/page_main_text_dict', globals())
140
6345583d809a Gis mode
abukhman
parents: 137
diff changeset
152 page_main_gis =PageTemplateFile ('zpt/page_main_gis', globals())
99
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
153 page_main_xml = PageTemplateFile('zpt/page_main_xml', globals())
404
29a87dc92750 *** empty log message ***
abukhman
parents: 398
diff changeset
154 page_main_pureXml = PageTemplateFile('zpt/page_main_pureXml', globals())
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
155 head_main = PageTemplateFile('zpt/head_main', globals())
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
156 docuviewer_css = PageTemplateFile('css/docuviewer.css', globals())
57
7cdb0fc34a92 added getInfo_xml method
casties
parents: 55
diff changeset
157 info_xml = PageTemplateFile('zpt/info_xml', globals())
130
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
158
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
159
68
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
160 thumbs_main_rss = PageTemplateFile('zpt/thumbs_main_rss', globals())
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
161 security.declareProtected('View management screens','changeDocumentViewerForm')
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
162 changeDocumentViewerForm = PageTemplateFile('zpt/changeDocumentViewer', globals())
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
163
0
dwinter
parents:
diff changeset
164
95
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
165 def __init__(self,id,imageScalerUrl=None,textServerName=None,title="",digilibBaseUrl=None,thumbcols=2,thumbrows=5,authgroups="mpiwg"):
0
dwinter
parents:
diff changeset
166 """init document viewer"""
dwinter
parents:
diff changeset
167 self.id=id
dwinter
parents:
diff changeset
168 self.title=title
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
169 self.thumbcols = thumbcols
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
170 self.thumbrows = thumbrows
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
171 # authgroups is list of authorized groups (delimited by ,)
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
172 self.authgroups = [s.strip().lower() for s in authgroups.split(',')]
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
173 # create template folder so we can always use template.something
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
174
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
175 templateFolder = Folder('template')
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
176 #self['template'] = templateFolder # Zope-2.12 style
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
177 self._setObject('template',templateFolder) # old style
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
178 try:
130
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
179 import MpdlXmlTextServer
132
39167e96e582 fixed creation of text server on __init__
casties
parents: 130
diff changeset
180 textServer = MpdlXmlTextServer.MpdlXmlTextServer(id='fulltextclient',serverName=textServerName)
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
181 #templateFolder['fulltextclient'] = xmlRpcClient
130
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
182 templateFolder._setObject('fulltextclient',textServer)
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
183 except Exception, e:
130
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
184 logging.error("Unable to create MpdlXmlTextServer for fulltextclient: "+str(e))
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
185 try:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
186 from Products.zogiLib.zogiLib import zogiLib
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
187 zogilib = zogiLib(id="zogilib", title="zogilib for docuviewer", dlServerURL=imageScalerUrl, layout="book")
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
188 #templateFolder['zogilib'] = zogilib
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
189 templateFolder._setObject('zogilib',zogilib)
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
190 except Exception, e:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
191 logging.error("Unable to create zogiLib for zogilib: "+str(e))
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
192
130
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
193
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
194 # proxy text server methods to fulltextclient
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
195 def getTextPage(self, **args):
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
196 """get page"""
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
197 return self.template.fulltextclient.getTextPage(**args)
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
198
130
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
199 def getQuery(self, **args):
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
200 """get query"""
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
201 return self.template.fulltextclient.getQuery(**args)
386
48d27e100d19 *** empty log message ***
abukhman
parents: 384
diff changeset
202
396
28a03e25a0e8 *** empty log message ***
abukhman
parents: 394
diff changeset
203 def getQueryResultHits(self, **args):
28a03e25a0e8 *** empty log message ***
abukhman
parents: 394
diff changeset
204 """get query"""
28a03e25a0e8 *** empty log message ***
abukhman
parents: 394
diff changeset
205 return self.template.fulltextclient.getQueryResultHits(**args)
28a03e25a0e8 *** empty log message ***
abukhman
parents: 394
diff changeset
206
28a03e25a0e8 *** empty log message ***
abukhman
parents: 394
diff changeset
207 def getQueryResultHitsText(self, **args):
28a03e25a0e8 *** empty log message ***
abukhman
parents: 394
diff changeset
208 """get query"""
28a03e25a0e8 *** empty log message ***
abukhman
parents: 394
diff changeset
209 return self.template.fulltextclient.getQueryResultHitsText(**args)
28a03e25a0e8 *** empty log message ***
abukhman
parents: 394
diff changeset
210
28a03e25a0e8 *** empty log message ***
abukhman
parents: 394
diff changeset
211 def getQueryResultHitsFigures(self, **args):
28a03e25a0e8 *** empty log message ***
abukhman
parents: 394
diff changeset
212 """get query"""
28a03e25a0e8 *** empty log message ***
abukhman
parents: 394
diff changeset
213 return self.template.fulltextclient.getQueryResultHitsFigures(**args)
28a03e25a0e8 *** empty log message ***
abukhman
parents: 394
diff changeset
214
386
48d27e100d19 *** empty log message ***
abukhman
parents: 384
diff changeset
215 def getPDF(self, **args):
48d27e100d19 *** empty log message ***
abukhman
parents: 384
diff changeset
216 """get query"""
48d27e100d19 *** empty log message ***
abukhman
parents: 384
diff changeset
217 return self.template.fulltextclient.getPDF(**args)
130
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
218
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
219 def getSearch(self, **args):
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
220 """get search"""
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
221 return self.template.fulltextclient.getSearch(**args)
256
ad1458aff8a6 *** empty log message ***
abukhman
parents: 235
diff changeset
222
ad1458aff8a6 *** empty log message ***
abukhman
parents: 235
diff changeset
223 def getGisPlaces(self, **args):
307
ec5e920a61e6 *** empty log message ***
abukhman
parents: 256
diff changeset
224 """get gis places"""
256
ad1458aff8a6 *** empty log message ***
abukhman
parents: 235
diff changeset
225 return self.template.fulltextclient.getGisPlaces(**args)
307
ec5e920a61e6 *** empty log message ***
abukhman
parents: 256
diff changeset
226
ec5e920a61e6 *** empty log message ***
abukhman
parents: 256
diff changeset
227 def getAllGisPlaces(self, **args):
310
80ae2324562b *** empty log message ***
abukhman
parents: 307
diff changeset
228 """get all gis places """
80ae2324562b *** empty log message ***
abukhman
parents: 307
diff changeset
229 return self.template.fulltextclient.getAllGisPlaces(**args)
80ae2324562b *** empty log message ***
abukhman
parents: 307
diff changeset
230
80ae2324562b *** empty log message ***
abukhman
parents: 307
diff changeset
231 def getOrigPages(self, **args):
80ae2324562b *** empty log message ***
abukhman
parents: 307
diff changeset
232 """get original page number """
80ae2324562b *** empty log message ***
abukhman
parents: 307
diff changeset
233 return self.template.fulltextclient.getOrigPages(**args)
80ae2324562b *** empty log message ***
abukhman
parents: 307
diff changeset
234
410
13dd83f46f6f *** empty log message ***
abukhman
parents: 409
diff changeset
235 def getAllPlaces(self, **args):
13dd83f46f6f *** empty log message ***
abukhman
parents: 409
diff changeset
236 """get original page number """
13dd83f46f6f *** empty log message ***
abukhman
parents: 409
diff changeset
237 return self.template.fulltextclient.getAllPlaces(**args)
13dd83f46f6f *** empty log message ***
abukhman
parents: 409
diff changeset
238
133
40730cfbcb8e fixed problem with getnumpages and **args
casties
parents: 132
diff changeset
239 def getNumPages(self, docinfo):
130
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
240 """get numpages"""
133
40730cfbcb8e fixed problem with getnumpages and **args
casties
parents: 132
diff changeset
241 return self.template.fulltextclient.getNumPages(docinfo)
191
cffaec9bc5ad *** empty log message ***
abukhman
parents: 174
diff changeset
242
cffaec9bc5ad *** empty log message ***
abukhman
parents: 174
diff changeset
243 def getNumTextPages(self, docinfo):
cffaec9bc5ad *** empty log message ***
abukhman
parents: 174
diff changeset
244 """get numpages text"""
cffaec9bc5ad *** empty log message ***
abukhman
parents: 174
diff changeset
245 return self.template.fulltextclient.getNumTextPages(docinfo)
cffaec9bc5ad *** empty log message ***
abukhman
parents: 174
diff changeset
246
130
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
247 def getTranslate(self, **args):
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
248 """get translate"""
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
249 return self.template.fulltextclient.getTranslate(**args)
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
250
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
251 def getLemma(self, **args):
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
252 """get lemma"""
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
253 return self.template.fulltextclient.getLemma(**args)
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
254
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
255 def getToc(self, **args):
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
256 """get toc"""
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
257 return self.template.fulltextclient.getToc(**args)
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
258
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
259 def getTocPage(self, **args):
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
260 """get tocpage"""
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
261 return self.template.fulltextclient.getTocPage(**args)
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
262
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
263
68
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
264 security.declareProtected('View','thumbs_rss')
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
265 def thumbs_rss(self,mode,url,viewMode="auto",start=None,pn=1):
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
266 '''
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
267 view it
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
268 @param mode: defines how to access the document behind url
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
269 @param url: url which contains display information
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
270 @param viewMode: if images display images, if text display text, default is images (text,images or auto)
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
271
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
272 '''
167
7e2b97941a66 characterNormalization
abukhman
parents: 166
diff changeset
273 logging.debug("HHHHHHHHHHHHHH:load the rss")
7e2b97941a66 characterNormalization
abukhman
parents: 166
diff changeset
274 logger("documentViewer (index)", logging.INFO, "mode: %s url:%s start:%s pn:%s"%(mode,url,start,pn))
68
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
275
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
276 if not hasattr(self, 'template'):
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
277 # create template folder if it doesn't exist
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
278 self.manage_addFolder('template')
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
279
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
280 if not self.digilibBaseUrl:
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
281 self.digilibBaseUrl = self.findDigilibUrl() or "http://nausikaa.mpiwg-berlin.mpg.de/digitallibrary"
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
282
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
283 docinfo = self.getDocinfo(mode=mode,url=url)
338
0576f524e2ee *** empty log message ***
abukhman
parents: 337
diff changeset
284 #pageinfo = self.getPageinfo(start=start,current=pn,docinfo=docinfo)
345
c39c252a3186 *** empty log message ***
abukhman
parents: 343
diff changeset
285 pageinfo = self.getPageinfo(start=start,current=pn, docinfo=docinfo)
331
6cde7f02786e *** empty log message ***
abukhman
parents: 330
diff changeset
286 ''' ZDES '''
68
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
287 pt = getattr(self.template, 'thumbs_main_rss')
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
288
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
289 if viewMode=="auto": # automodus gewaehlt
409
f7d73ea4b38b quick fix for broken texturlpath
casties
parents: 405
diff changeset
290 if docinfo.has_key("textURL") or docinfo.get('textURLPath',None): #texturl gesetzt und textViewer konfiguriert
68
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
291 viewMode="text"
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
292 else:
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
293 viewMode="images"
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
294
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
295 return pt(docinfo=docinfo,pageinfo=pageinfo,viewMode=viewMode)
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
296
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
297 security.declareProtected('View','index_html')
405
b8fb4c750d74 fix for characternormalization default
casties
parents: 404
diff changeset
298 def index_html(self,url,mode="texttool",viewMode="auto",tocMode="thumbs",start=None,pn=1,mk=None):
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
299 '''
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
300 view it
57
7cdb0fc34a92 added getInfo_xml method
casties
parents: 55
diff changeset
301 @param mode: defines how to access the document behind url
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
302 @param url: url which contains display information
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
303 @param viewMode: if images display images, if text display text, default is auto (text,images or auto)
99
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
304 @param tocMode: type of 'table of contents' for navigation (thumbs, text, figures, none)
141
39c7d6164da8 characterNormalization (reg,norm, none)
abukhman
parents: 140
diff changeset
305 @param characterNormalization type of text display (reg, norm, none)
100
137459e3b378 Last update
abukhman
parents: 99
diff changeset
306 @param querySearch: type of different search modes (fulltext, fulltextMorph, xpath, xquery, ftIndex, ftIndexMorph, fulltextMorphLemma)
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
307 '''
0
dwinter
parents:
diff changeset
308
345
c39c252a3186 *** empty log message ***
abukhman
parents: 343
diff changeset
309 logging.debug("documentViewer (index) mode: %s url:%s start:%s pn:%s"%(mode,url,start,pn))
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
310
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
311 if not hasattr(self, 'template'):
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
312 # this won't work
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
313 logging.error("template folder missing!")
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
314 return "ERROR: template folder missing!"
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
315
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
316 if not getattr(self, 'digilibBaseUrl', None):
132
39167e96e582 fixed creation of text server on __init__
casties
parents: 130
diff changeset
317 self.digilibBaseUrl = self.findDigilibUrl() or "http://digilib.mpiwg-berlin.mpg.de/digitallibrary"
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
318
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
319 docinfo = self.getDocinfo(mode=mode,url=url)
97
2b8fd19432fb Last update
abukhman
parents: 96
diff changeset
320
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
321 if tocMode != "thumbs":
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
322 # get table of contents
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
323 docinfo = self.getToc(mode=tocMode, docinfo=docinfo)
97
2b8fd19432fb Last update
abukhman
parents: 96
diff changeset
324
51
c5d3aabbf61b textviewer now integrated, new modus auto introduced as standard for viewing
dwinter
parents: 50
diff changeset
325 if viewMode=="auto": # automodus gewaehlt
409
f7d73ea4b38b quick fix for broken texturlpath
casties
parents: 405
diff changeset
326 if docinfo.has_key('textURL') or docinfo.get('textURLPath',None): #texturl gesetzt und textViewer konfiguriert
127
49f381f896d0 try to make text_dict default for texts
casties
parents: 126
diff changeset
327 viewMode="text_dict"
51
c5d3aabbf61b textviewer now integrated, new modus auto introduced as standard for viewing
dwinter
parents: 50
diff changeset
328 else:
c5d3aabbf61b textviewer now integrated, new modus auto introduced as standard for viewing
dwinter
parents: 50
diff changeset
329 viewMode="images"
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
330
345
c39c252a3186 *** empty log message ***
abukhman
parents: 343
diff changeset
331 pageinfo = self.getPageinfo(start=start,current=pn, docinfo=docinfo,viewMode=viewMode,tocMode=tocMode)
127
49f381f896d0 try to make text_dict default for texts
casties
parents: 126
diff changeset
332
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
333 pt = getattr(self.template, 'viewer_main')
75
9673218e155b minorCVS: ----------------------------------------------------------------------
dwinter
parents: 74
diff changeset
334 return pt(docinfo=docinfo,pageinfo=pageinfo,viewMode=viewMode,mk=self.generateMarks(mk))
0
dwinter
parents:
diff changeset
335
74
dwinter
parents: 73
diff changeset
336 def generateMarks(self,mk):
dwinter
parents: 73
diff changeset
337 ret=""
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
338 if mk is None:
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
339 return ""
134
6a33aa624ba4 fixed more oopsies
casties
parents: 133
diff changeset
340 if not isinstance(mk, list):
132
39167e96e582 fixed creation of text server on __init__
casties
parents: 130
diff changeset
341 mk=[mk]
74
dwinter
parents: 73
diff changeset
342 for m in mk:
75
9673218e155b minorCVS: ----------------------------------------------------------------------
dwinter
parents: 74
diff changeset
343 ret+="mk=%s"%m
74
dwinter
parents: 73
diff changeset
344 return ret
389
114d40b358ab *** empty log message ***
abukhman
parents: 387
diff changeset
345
114d40b358ab *** empty log message ***
abukhman
parents: 387
diff changeset
346
387
580db757e0eb *** empty log message ***
abukhman
parents: 386
diff changeset
347 def getBrowser(self):
580db757e0eb *** empty log message ***
abukhman
parents: 386
diff changeset
348 """getBrowser the version of browser """
389
114d40b358ab *** empty log message ***
abukhman
parents: 387
diff changeset
349 names=""
114d40b358ab *** empty log message ***
abukhman
parents: 387
diff changeset
350 names = browserCheck(self)
114d40b358ab *** empty log message ***
abukhman
parents: 387
diff changeset
351 #logging.debug("XXXXXXXXXXXXXXXX: %s"%names)
114d40b358ab *** empty log message ***
abukhman
parents: 387
diff changeset
352 return names
387
580db757e0eb *** empty log message ***
abukhman
parents: 386
diff changeset
353
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
354 def findDigilibUrl(self):
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
355 """try to get the digilib URL from zogilib"""
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
356 url = self.template.zogilib.getDLBaseUrl()
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
357 return url
126
c6dcf12e3807 added method to get url of viewer instance
casties
parents: 124
diff changeset
358
c6dcf12e3807 added method to get url of viewer instance
casties
parents: 124
diff changeset
359 def getDocumentViewerURL(self):
c6dcf12e3807 added method to get url of viewer instance
casties
parents: 124
diff changeset
360 """returns the URL of this instance"""
c6dcf12e3807 added method to get url of viewer instance
casties
parents: 124
diff changeset
361 return self.absolute_url()
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
362
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
363 def getStyle(self, idx, selected, style=""):
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
364 """returns a string with the given style and append 'sel' if path == selected."""
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
365 #logger("documentViewer (getstyle)", logging.INFO, "idx: %s selected: %s style: %s"%(idx,selected,style))
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
366 if idx == selected:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
367 return style + 'sel'
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
368 else:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
369 return style
74
dwinter
parents: 73
diff changeset
370
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
371 def getLink(self,param=None,val=None):
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
372 """link to documentviewer with parameter param set to val"""
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
373 params=self.REQUEST.form.copy()
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
374 if param is not None:
31
c6451e8d5d23 more small fixes - now version 0.2.2
casties
parents: 29
diff changeset
375 if val is None:
c6451e8d5d23 more small fixes - now version 0.2.2
casties
parents: 29
diff changeset
376 if params.has_key(param):
c6451e8d5d23 more small fixes - now version 0.2.2
casties
parents: 29
diff changeset
377 del params[param]
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
378 else:
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
379 params[param] = str(val)
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
380
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
381 if params.get("mode", None) == "filepath": #wenn beim erst Aufruf filepath gesetzt wurde aendere das nun zu imagepath
78
70ab234a18dc bugs in filepath mode fixes
dwinter
parents: 75
diff changeset
382 params["mode"] = "imagepath"
70ab234a18dc bugs in filepath mode fixes
dwinter
parents: 75
diff changeset
383 params["url"] = getParentDir(params["url"])
31
c6451e8d5d23 more small fixes - now version 0.2.2
casties
parents: 29
diff changeset
384
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
385 # quote values and assemble into query string
135
123248b3bb34 fixed more oopsies
casties
parents: 134
diff changeset
386 #ps = "&".join(["%s=%s"%(k,urllib.quote(v)) for (k, v) in params.items()])
123248b3bb34 fixed more oopsies
casties
parents: 134
diff changeset
387 ps = urllib.urlencode(params)
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
388 url=self.REQUEST['URL1']+"?"+ps
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
389 return url
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
390
68
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
391 def getLinkAmp(self,param=None,val=None):
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
392 """link to documentviewer with parameter param set to val"""
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
393 params=self.REQUEST.form.copy()
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
394 if param is not None:
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
395 if val is None:
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
396 if params.has_key(param):
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
397 del params[param]
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
398 else:
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
399 params[param] = str(val)
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
400
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
401 # quote values and assemble into query string
167
7e2b97941a66 characterNormalization
abukhman
parents: 166
diff changeset
402 logging.debug("XYXXXXX: %s"%repr(params.items()))
68
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
403 ps = "&amp;".join(["%s=%s"%(k,urllib.quote(v)) for (k, v) in params.items()])
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
404 url=self.REQUEST['URL1']+"?"+ps
b8457fc33446 piclens rss/support
dwinter
parents: 65
diff changeset
405 return url
81
fae97f071724 fixed problem with info.xml when url without index.meta
casties
parents: 79
diff changeset
406
57
7cdb0fc34a92 added getInfo_xml method
casties
parents: 55
diff changeset
407 def getInfo_xml(self,url,mode):
7cdb0fc34a92 added getInfo_xml method
casties
parents: 55
diff changeset
408 """returns info about the document as XML"""
7cdb0fc34a92 added getInfo_xml method
casties
parents: 55
diff changeset
409
7cdb0fc34a92 added getInfo_xml method
casties
parents: 55
diff changeset
410 if not self.digilibBaseUrl:
7cdb0fc34a92 added getInfo_xml method
casties
parents: 55
diff changeset
411 self.digilibBaseUrl = self.findDigilibUrl() or "http://nausikaa.mpiwg-berlin.mpg.de/digitallibrary"
7cdb0fc34a92 added getInfo_xml method
casties
parents: 55
diff changeset
412
7cdb0fc34a92 added getInfo_xml method
casties
parents: 55
diff changeset
413 docinfo = self.getDocinfo(mode=mode,url=url)
7cdb0fc34a92 added getInfo_xml method
casties
parents: 55
diff changeset
414 pt = getattr(self.template, 'info_xml')
7cdb0fc34a92 added getInfo_xml method
casties
parents: 55
diff changeset
415 return pt(docinfo=docinfo)
7cdb0fc34a92 added getInfo_xml method
casties
parents: 55
diff changeset
416
394
ce9fa69f81c3 new toggle option method
casties
parents: 392
diff changeset
417 def getOptionToggle(self, newState=None, optionName='text_options_open', initialState=True):
ce9fa69f81c3 new toggle option method
casties
parents: 392
diff changeset
418 """returns new option state"""
397
5b078a6d8909 new toggle option method
casties
parents: 396
diff changeset
419 if not self.REQUEST.SESSION.has_key(optionName):
394
ce9fa69f81c3 new toggle option method
casties
parents: 392
diff changeset
420 # not in session -- initial
ce9fa69f81c3 new toggle option method
casties
parents: 392
diff changeset
421 opt = {'lastState': newState, 'state': initialState}
ce9fa69f81c3 new toggle option method
casties
parents: 392
diff changeset
422 else:
397
5b078a6d8909 new toggle option method
casties
parents: 396
diff changeset
423 opt = self.REQUEST.SESSION.get(optionName)
394
ce9fa69f81c3 new toggle option method
casties
parents: 392
diff changeset
424 if opt['lastState'] != newState:
ce9fa69f81c3 new toggle option method
casties
parents: 392
diff changeset
425 # state in session has changed -- toggle
ce9fa69f81c3 new toggle option method
casties
parents: 392
diff changeset
426 opt['state'] = not opt['state']
ce9fa69f81c3 new toggle option method
casties
parents: 392
diff changeset
427 opt['lastState'] = newState
ce9fa69f81c3 new toggle option method
casties
parents: 392
diff changeset
428
ce9fa69f81c3 new toggle option method
casties
parents: 392
diff changeset
429 self.REQUEST.SESSION[optionName] = opt
ce9fa69f81c3 new toggle option method
casties
parents: 392
diff changeset
430 return opt['state']
0
dwinter
parents:
diff changeset
431
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
432 def isAccessible(self, docinfo):
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
433 """returns if access to the resource is granted"""
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
434 access = docinfo.get('accessType', None)
167
7e2b97941a66 characterNormalization
abukhman
parents: 166
diff changeset
435 logging.debug("documentViewer (accessOK) access type %s"%access)
45
0391fe75aef3 fixed handling of documents with missing access tag
casties
parents: 43
diff changeset
436 if access is not None and access == 'free':
167
7e2b97941a66 characterNormalization
abukhman
parents: 166
diff changeset
437 logging.debug("documentViewer (accessOK) access is free")
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
438 return True
45
0391fe75aef3 fixed handling of documents with missing access tag
casties
parents: 43
diff changeset
439 elif access is None or access in self.authgroups:
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
440 # only local access -- only logged in users
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
441 user = getSecurityManager().getUser()
167
7e2b97941a66 characterNormalization
abukhman
parents: 166
diff changeset
442 logging.debug("documentViewer (accessOK) user=%s ip=%s"%(user,self.REQUEST.getClientAddr()))
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
443 if user is not None:
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
444 #print "user: ", user
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
445 return (user.getUserName() != "Anonymous User")
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
446 else:
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
447 return False
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
448
167
7e2b97941a66 characterNormalization
abukhman
parents: 166
diff changeset
449 logging.error("documentViewer (accessOK) unknown access type %s"%access)
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
450 return False
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
451
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
452
73
dwinter
parents: 71
diff changeset
453 def getDirinfoFromDigilib(self,path,docinfo=None,cut=0):
29
e1bed068b351 small fixes
casties
parents: 28
diff changeset
454 """gibt param von dlInfo aus"""
31
c6451e8d5d23 more small fixes - now version 0.2.2
casties
parents: 29
diff changeset
455 if docinfo is None:
c6451e8d5d23 more small fixes - now version 0.2.2
casties
parents: 29
diff changeset
456 docinfo = {}
73
dwinter
parents: 71
diff changeset
457
dwinter
parents: 71
diff changeset
458 for x in range(cut):
78
70ab234a18dc bugs in filepath mode fixes
dwinter
parents: 75
diff changeset
459
73
dwinter
parents: 71
diff changeset
460 path=getParentDir(path)
78
70ab234a18dc bugs in filepath mode fixes
dwinter
parents: 75
diff changeset
461
40
749ee5389892 try to ignore superfluous /mpiwg/online in urls
casties
parents: 39
diff changeset
462 infoUrl=self.digilibBaseUrl+"/dirInfo-xml.jsp?mo=dir&fn="+path
29
e1bed068b351 small fixes
casties
parents: 28
diff changeset
463
167
7e2b97941a66 characterNormalization
abukhman
parents: 166
diff changeset
464 logging.debug("documentViewer (getparamfromdigilib) dirInfo from %s"%(infoUrl))
29
e1bed068b351 small fixes
casties
parents: 28
diff changeset
465
130
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
466 txt = getHttpData(infoUrl)
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
467 if txt is None:
40
749ee5389892 try to ignore superfluous /mpiwg/online in urls
casties
parents: 39
diff changeset
468 raise IOError("Unable to get dir-info from %s"%(infoUrl))
130
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
469
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
470 dom = Parse(txt)
37
ead830ce45d6 better error messages
casties
parents: 35
diff changeset
471 sizes=dom.xpath("//dir/size")
167
7e2b97941a66 characterNormalization
abukhman
parents: 166
diff changeset
472 logging.debug("documentViewer (getparamfromdigilib) dirInfo:size"%sizes)
29
e1bed068b351 small fixes
casties
parents: 28
diff changeset
473
37
ead830ce45d6 better error messages
casties
parents: 35
diff changeset
474 if sizes:
ead830ce45d6 better error messages
casties
parents: 35
diff changeset
475 docinfo['numPages'] = int(getTextFromNode(sizes[0]))
31
c6451e8d5d23 more small fixes - now version 0.2.2
casties
parents: 29
diff changeset
476 else:
c6451e8d5d23 more small fixes - now version 0.2.2
casties
parents: 29
diff changeset
477 docinfo['numPages'] = 0
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
478
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
479 # TODO: produce and keep list of image names and numbers
31
c6451e8d5d23 more small fixes - now version 0.2.2
casties
parents: 29
diff changeset
480
c6451e8d5d23 more small fixes - now version 0.2.2
casties
parents: 29
diff changeset
481 return docinfo
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
482
174
5780092e4989 *** empty log message ***
dwinter
parents: 173
diff changeset
483 def getIndexMetaPath(self,url):
5780092e4989 *** empty log message ***
dwinter
parents: 173
diff changeset
484 """gib nur den Pfad zurueck"""
5780092e4989 *** empty log message ***
dwinter
parents: 173
diff changeset
485 regexp = re.compile(r".*(experimental|permanent)/(.*)")
5780092e4989 *** empty log message ***
dwinter
parents: 173
diff changeset
486 regpath = regexp.match(url)
5780092e4989 *** empty log message ***
dwinter
parents: 173
diff changeset
487 if (regpath==None):
5780092e4989 *** empty log message ***
dwinter
parents: 173
diff changeset
488 return ""
224
58c5338749c7 *** empty log message ***
abukhman
parents: 223
diff changeset
489 logging.debug("(getDomFromIndexMeta): URLXAXA: %s"%regpath.group(2))
174
5780092e4989 *** empty log message ***
dwinter
parents: 173
diff changeset
490 return ("/mpiwg/online/"+regpath.group(1)+"/"+regpath.group(2))
5780092e4989 *** empty log message ***
dwinter
parents: 173
diff changeset
491
225
57c2f5b6ada5 *** empty log message ***
abukhman
parents: 224
diff changeset
492
57c2f5b6ada5 *** empty log message ***
abukhman
parents: 224
diff changeset
493
174
5780092e4989 *** empty log message ***
dwinter
parents: 173
diff changeset
494 def getIndexMetaUrl(self,url):
5780092e4989 *** empty log message ***
dwinter
parents: 173
diff changeset
495 """returns utr of index.meta document at url"""
5780092e4989 *** empty log message ***
dwinter
parents: 173
diff changeset
496
39
1dd90aabd366 added retry when reading index meta from texter applet
casties
parents: 38
diff changeset
497 metaUrl = None
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
498 if url.startswith("http://"):
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
499 # real URL
39
1dd90aabd366 added retry when reading index meta from texter applet
casties
parents: 38
diff changeset
500 metaUrl = url
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
501 else:
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
502 # online path
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
503 server=self.digilibBaseUrl+"/servlet/Texter?fn="
40
749ee5389892 try to ignore superfluous /mpiwg/online in urls
casties
parents: 39
diff changeset
504 metaUrl=server+url.replace("/mpiwg/online","")
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
505 if not metaUrl.endswith("index.meta"):
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
506 metaUrl += "/index.meta"
174
5780092e4989 *** empty log message ***
dwinter
parents: 173
diff changeset
507
5780092e4989 *** empty log message ***
dwinter
parents: 173
diff changeset
508 return metaUrl
5780092e4989 *** empty log message ***
dwinter
parents: 173
diff changeset
509
5780092e4989 *** empty log message ***
dwinter
parents: 173
diff changeset
510 def getDomFromIndexMeta(self, url):
5780092e4989 *** empty log message ***
dwinter
parents: 173
diff changeset
511 """get dom from index meta"""
5780092e4989 *** empty log message ***
dwinter
parents: 173
diff changeset
512 dom = None
5780092e4989 *** empty log message ***
dwinter
parents: 173
diff changeset
513 metaUrl = self.getIndexMetaUrl(url)
39
1dd90aabd366 added retry when reading index meta from texter applet
casties
parents: 38
diff changeset
514
174
5780092e4989 *** empty log message ***
dwinter
parents: 173
diff changeset
515 logging.debug("(getDomFromIndexMeta): METAURL: %s"%metaUrl)
130
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
516 txt=getHttpData(metaUrl)
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
517 if txt is None:
39
1dd90aabd366 added retry when reading index meta from texter applet
casties
parents: 38
diff changeset
518 raise IOError("Unable to read index meta from %s"%(url))
130
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
519
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
520 dom = Parse(txt)
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
521 return dom
50
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
522
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
523 def getPresentationInfoXML(self, url):
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
524 """returns dom of info.xml document at url"""
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
525 dom = None
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
526 metaUrl = None
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
527 if url.startswith("http://"):
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
528 # real URL
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
529 metaUrl = url
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
530 else:
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
531 # online path
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
532 server=self.digilibBaseUrl+"/servlet/Texter?fn="
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
533 metaUrl=server+url.replace("/mpiwg/online","")
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
534
130
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
535 txt=getHttpData(metaUrl)
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
536 if txt is None:
50
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
537 raise IOError("Unable to read infoXMLfrom %s"%(url))
130
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
538
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
539 dom = Parse(txt)
50
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
540 return dom
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
541
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
542
70
0049d64aa464 filepath introduced
dwinter
parents: 68
diff changeset
543 def getAuthinfoFromIndexMeta(self,path,docinfo=None,dom=None,cut=0):
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
544 """gets authorization info from the index.meta file at path or given by dom"""
167
7e2b97941a66 characterNormalization
abukhman
parents: 166
diff changeset
545 logging.debug("documentViewer (getauthinfofromindexmeta) path: %s"%(path))
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
546
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
547 access = None
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
548
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
549 if docinfo is None:
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
550 docinfo = {}
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
551
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
552 if dom is None:
78
70ab234a18dc bugs in filepath mode fixes
dwinter
parents: 75
diff changeset
553 for x in range(cut):
70
0049d64aa464 filepath introduced
dwinter
parents: 68
diff changeset
554 path=getParentDir(path)
174
5780092e4989 *** empty log message ***
dwinter
parents: 173
diff changeset
555 dom = self.getDomFromIndexMeta(path)
46
31059e3d9338 has now also a text mode viewMode=text
dwinter
parents: 45
diff changeset
556
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
557 acctype = dom.xpath("//access-conditions/access/@type")
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
558 if acctype and (len(acctype)>0):
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
559 access=acctype[0].value
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
560 if access in ['group', 'institution']:
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
561 access = getTextFromNode(dom.xpath("//access-conditions/access/name")[0]).lower()
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
562
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
563 docinfo['accessType'] = access
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
564 return docinfo
29
e1bed068b351 small fixes
casties
parents: 28
diff changeset
565
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
566
70
0049d64aa464 filepath introduced
dwinter
parents: 68
diff changeset
567 def getBibinfoFromIndexMeta(self,path,docinfo=None,dom=None,cut=0):
35
2d9261aea8f3 version 0.2.4
casties
parents: 32
diff changeset
568 """gets bibliographical info from the index.meta file at path or given by dom"""
167
7e2b97941a66 characterNormalization
abukhman
parents: 166
diff changeset
569 logging.debug("documentViewer (getbibinfofromindexmeta) path: %s"%(path))
20
9884703dae70 new modi
dwinter
parents: 0
diff changeset
570
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
571 if docinfo is None:
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
572 docinfo = {}
78
70ab234a18dc bugs in filepath mode fixes
dwinter
parents: 75
diff changeset
573
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
574 if dom is None:
78
70ab234a18dc bugs in filepath mode fixes
dwinter
parents: 75
diff changeset
575 for x in range(cut):
70
0049d64aa464 filepath introduced
dwinter
parents: 68
diff changeset
576 path=getParentDir(path)
174
5780092e4989 *** empty log message ***
dwinter
parents: 173
diff changeset
577 dom = self.getDomFromIndexMeta(path)
5780092e4989 *** empty log message ***
dwinter
parents: 173
diff changeset
578
5780092e4989 *** empty log message ***
dwinter
parents: 173
diff changeset
579 docinfo['indexMetaPath']=self.getIndexMetaPath(path);
79
df6952ac93e9 bug in getDocInforFromImagePath, relative lage der index.meta zu path war falsch.
dwinter
parents: 78
diff changeset
580
167
7e2b97941a66 characterNormalization
abukhman
parents: 166
diff changeset
581 logging.debug("documentViewer (getbibinfofromindexmeta cutted) path: %s"%(path))
59
996b61d71351 added all fields from bib tag to docinfo
casties
parents: 57
diff changeset
582 # put in all raw bib fields as dict "bib"
996b61d71351 added all fields from bib tag to docinfo
casties
parents: 57
diff changeset
583 bib = dom.xpath("//bib/*")
996b61d71351 added all fields from bib tag to docinfo
casties
parents: 57
diff changeset
584 if bib and len(bib)>0:
996b61d71351 added all fields from bib tag to docinfo
casties
parents: 57
diff changeset
585 bibinfo = {}
996b61d71351 added all fields from bib tag to docinfo
casties
parents: 57
diff changeset
586 for e in bib:
996b61d71351 added all fields from bib tag to docinfo
casties
parents: 57
diff changeset
587 bibinfo[e.localName] = getTextFromNode(e)
996b61d71351 added all fields from bib tag to docinfo
casties
parents: 57
diff changeset
588 docinfo['bib'] = bibinfo
996b61d71351 added all fields from bib tag to docinfo
casties
parents: 57
diff changeset
589
996b61d71351 added all fields from bib tag to docinfo
casties
parents: 57
diff changeset
590 # extract some fields (author, title, year) according to their mapping
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
591 metaData=self.metadata.main.meta.bib
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
592 bibtype=dom.xpath("//bib/@type")
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
593 if bibtype and (len(bibtype)>0):
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
594 bibtype=bibtype[0].value
20
9884703dae70 new modi
dwinter
parents: 0
diff changeset
595 else:
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
596 bibtype="generic"
59
996b61d71351 added all fields from bib tag to docinfo
casties
parents: 57
diff changeset
597
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
598 bibtype=bibtype.replace("-"," ") # wrong typesiin index meta "-" instead of " " (not wrong! ROC)
59
996b61d71351 added all fields from bib tag to docinfo
casties
parents: 57
diff changeset
599 docinfo['bib_type'] = bibtype
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
600 bibmap=metaData.generateMappingForType(bibtype)
174
5780092e4989 *** empty log message ***
dwinter
parents: 173
diff changeset
601 logging.debug("documentViewer (getbibinfofromindexmeta) bibmap:"+repr(bibmap))
5780092e4989 *** empty log message ***
dwinter
parents: 173
diff changeset
602 logging.debug("documentViewer (getbibinfofromindexmeta) bibtype:"+repr(bibtype))
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
603 # if there is no mapping bibmap is empty (mapping sometimes has empty fields)
31
c6451e8d5d23 more small fixes - now version 0.2.2
casties
parents: 29
diff changeset
604 if len(bibmap) > 0 and len(bibmap['author'][0]) > 0:
63
4a17b755bfc7 added more try/excepts to bib-meta reading code
casties
parents: 62
diff changeset
605 try:
4a17b755bfc7 added more try/excepts to bib-meta reading code
casties
parents: 62
diff changeset
606 docinfo['author']=getTextFromNode(dom.xpath("//bib/%s"%bibmap['author'][0])[0])
4a17b755bfc7 added more try/excepts to bib-meta reading code
casties
parents: 62
diff changeset
607 except: pass
4a17b755bfc7 added more try/excepts to bib-meta reading code
casties
parents: 62
diff changeset
608 try:
4a17b755bfc7 added more try/excepts to bib-meta reading code
casties
parents: 62
diff changeset
609 docinfo['title']=getTextFromNode(dom.xpath("//bib/%s"%bibmap['title'][0])[0])
4a17b755bfc7 added more try/excepts to bib-meta reading code
casties
parents: 62
diff changeset
610 except: pass
4a17b755bfc7 added more try/excepts to bib-meta reading code
casties
parents: 62
diff changeset
611 try:
4a17b755bfc7 added more try/excepts to bib-meta reading code
casties
parents: 62
diff changeset
612 docinfo['year']=getTextFromNode(dom.xpath("//bib/%s"%bibmap['year'][0])[0])
4a17b755bfc7 added more try/excepts to bib-meta reading code
casties
parents: 62
diff changeset
613 except: pass
167
7e2b97941a66 characterNormalization
abukhman
parents: 166
diff changeset
614 logging.debug("documentViewer (getbibinfofromindexmeta) using mapping for %s"%bibtype)
52
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
615 try:
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
616 docinfo['lang']=getTextFromNode(dom.xpath("//bib/lang")[0])
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
617 except:
92047eaa6272 zLOG exchanged by logging
dwinter
parents: 51
diff changeset
618 docinfo['lang']=''
227
fd9aa1d0941a *** empty log message ***
abukhman
parents: 226
diff changeset
619
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
620 return docinfo
83
ec12a2440daa My last update Bukhman Andrey
abukhman
parents: 82
diff changeset
621
218
66f334ec3256 *** empty log message ***
abukhman
parents: 205
diff changeset
622
66f334ec3256 *** empty log message ***
abukhman
parents: 205
diff changeset
623 def getNameFromIndexMeta(self,path,docinfo=None,dom=None,cut=0):
66f334ec3256 *** empty log message ***
abukhman
parents: 205
diff changeset
624 """gets name info from the index.meta file at path or given by dom"""
66f334ec3256 *** empty log message ***
abukhman
parents: 205
diff changeset
625 if docinfo is None:
66f334ec3256 *** empty log message ***
abukhman
parents: 205
diff changeset
626 docinfo = {}
66f334ec3256 *** empty log message ***
abukhman
parents: 205
diff changeset
627
66f334ec3256 *** empty log message ***
abukhman
parents: 205
diff changeset
628 if dom is None:
66f334ec3256 *** empty log message ***
abukhman
parents: 205
diff changeset
629 for x in range(cut):
66f334ec3256 *** empty log message ***
abukhman
parents: 205
diff changeset
630 path=getParentDir(path)
66f334ec3256 *** empty log message ***
abukhman
parents: 205
diff changeset
631 dom = self.getDomFromIndexMeta(path)
330
c81509acead9 *** empty log message ***
abukhman
parents: 327
diff changeset
632
229
833de3f54e47 *** empty log message ***
abukhman
parents: 228
diff changeset
633 docinfo['name']=getTextFromNode(dom.xpath("/resource/name")[0])
230
87c6aac31003 *** empty log message ***
abukhman
parents: 229
diff changeset
634 logging.debug("documentViewer docinfo[name] %s"%docinfo['name'])
218
66f334ec3256 *** empty log message ***
abukhman
parents: 205
diff changeset
635 return docinfo
83
ec12a2440daa My last update Bukhman Andrey
abukhman
parents: 82
diff changeset
636
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
637 def getDocinfoFromTextTool(self, url, dom=None, docinfo=None):
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
638 """parse texttool tag in index meta"""
167
7e2b97941a66 characterNormalization
abukhman
parents: 166
diff changeset
639 logging.debug("documentViewer (getdocinfofromtexttool) url: %s" % (url))
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
640 if docinfo is None:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
641 docinfo = {}
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
642 if docinfo.get('lang', None) is None:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
643 docinfo['lang'] = '' # default keine Sprache gesetzt
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
644 if dom is None:
174
5780092e4989 *** empty log message ***
dwinter
parents: 173
diff changeset
645 dom = self.getDomFromIndexMeta(url)
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
646
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
647 archivePath = None
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
648 archiveName = None
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
649
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
650 archiveNames = dom.xpath("//resource/name")
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
651 if archiveNames and (len(archiveNames) > 0):
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
652 archiveName = getTextFromNode(archiveNames[0])
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
653 else:
130
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
654 logging.warning("documentViewer (getdocinfofromtexttool) resource/name missing in: %s" % (url))
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
655
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
656 archivePaths = dom.xpath("//resource/archive-path")
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
657 if archivePaths and (len(archivePaths) > 0):
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
658 archivePath = getTextFromNode(archivePaths[0])
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
659 # clean up archive path
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
660 if archivePath[0] != '/':
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
661 archivePath = '/' + archivePath
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
662 if archiveName and (not archivePath.endswith(archiveName)):
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
663 archivePath += "/" + archiveName
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
664 else:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
665 # try to get archive-path from url
167
7e2b97941a66 characterNormalization
abukhman
parents: 166
diff changeset
666 logging.warning("documentViewer (getdocinfofromtexttool) resource/archive-path missing in: %s" % (url))
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
667 if (not url.startswith('http')):
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
668 archivePath = url.replace('index.meta', '')
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
669
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
670 if archivePath is None:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
671 # we balk without archive-path
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
672 raise IOError("Missing archive-path (for text-tool) in %s" % (url))
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
673
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
674 imageDirs = dom.xpath("//texttool/image")
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
675 if imageDirs and (len(imageDirs) > 0):
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
676 imageDir = getTextFromNode(imageDirs[0])
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
677
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
678 else:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
679 # we balk with no image tag / not necessary anymore because textmode is now standard
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
680 #raise IOError("No text-tool info in %s"%(url))
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
681 imageDir = ""
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
682 #xquery="//pb"
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
683 docinfo['imagePath'] = "" # keine Bilder
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
684 docinfo['imageURL'] = ""
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
685
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
686 if imageDir and archivePath:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
687 #print "image: ", imageDir, " archivepath: ", archivePath
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
688 imageDir = os.path.join(archivePath, imageDir)
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
689 imageDir = imageDir.replace("/mpiwg/online", '')
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
690 docinfo = self.getDirinfoFromDigilib(imageDir, docinfo=docinfo)
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
691 docinfo['imagePath'] = imageDir
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
692
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
693 docinfo['imageURL'] = self.digilibBaseUrl + "/servlet/Scaler?fn=" + imageDir
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
694
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
695 viewerUrls = dom.xpath("//texttool/digiliburlprefix")
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
696 if viewerUrls and (len(viewerUrls) > 0):
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
697 viewerUrl = getTextFromNode(viewerUrls[0])
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
698 docinfo['viewerURL'] = viewerUrl
130
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
699
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
700 # old style text URL
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
701 textUrls = dom.xpath("//texttool/text")
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
702 if textUrls and (len(textUrls) > 0):
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
703 textUrl = getTextFromNode(textUrls[0])
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
704 if urlparse.urlparse(textUrl)[0] == "": #keine url
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
705 textUrl = os.path.join(archivePath, textUrl)
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
706 # fix URLs starting with /mpiwg/online
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
707 if textUrl.startswith("/mpiwg/online"):
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
708 textUrl = textUrl.replace("/mpiwg/online", '', 1)
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
709
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
710 docinfo['textURL'] = textUrl
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
711
130
5c779d7b5f71 more modular version with separate object MpdlXmlTextServer
casties
parents: 128
diff changeset
712 # new style text-url-path
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
713 textUrls = dom.xpath("//texttool/text-url-path")
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
714 if textUrls and (len(textUrls) > 0):
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
715 textUrl = getTextFromNode(textUrls[0])
102
27513c893ba9 trying to fix text-only documents
casties
parents: 101
diff changeset
716 docinfo['textURLPath'] = textUrl
27513c893ba9 trying to fix text-only documents
casties
parents: 101
diff changeset
717 if not docinfo['imagePath']:
27513c893ba9 trying to fix text-only documents
casties
parents: 101
diff changeset
718 # text-only, no page images
205
1fc7d73ce7ce *** empty log message ***
abukhman
parents: 204
diff changeset
719 docinfo = self.getNumTextPages(docinfo)
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
720
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
721 presentationUrls = dom.xpath("//texttool/presentation")
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
722 docinfo = self.getBibinfoFromIndexMeta(url, docinfo=docinfo, dom=dom) # get info von bib tag
228
9306c8d0dc4a *** empty log message ***
abukhman
parents: 227
diff changeset
723 docinfo = self.getNameFromIndexMeta(url, docinfo=docinfo, dom=dom)
386
48d27e100d19 *** empty log message ***
abukhman
parents: 384
diff changeset
724
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
725
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
726 if presentationUrls and (len(presentationUrls) > 0): # ueberschreibe diese durch presentation informationen
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
727 # presentation url ergiebt sich ersetzen von index.meta in der url der fuer die Metadaten
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
728 # durch den relativen Pfad auf die presentation infos
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
729 presentationPath = getTextFromNode(presentationUrls[0])
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
730 if url.endswith("index.meta"):
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
731 presentationUrl = url.replace('index.meta', presentationPath)
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
732 else:
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
733 presentationUrl = url + "/" + presentationPath
102
27513c893ba9 trying to fix text-only documents
casties
parents: 101
diff changeset
734
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
735 docinfo = self.getBibinfoFromTextToolPresentation(presentationUrl, docinfo=docinfo, dom=dom)
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
736
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
737 docinfo = self.getAuthinfoFromIndexMeta(url, docinfo=docinfo, dom=dom) # get access info
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
738
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
739 return docinfo
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
740
50
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
741
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
742 def getBibinfoFromTextToolPresentation(self,url,docinfo=None,dom=None):
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
743 """gets the bibliographical information from the preseantion entry in texttools
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
744 """
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
745 dom=self.getPresentationInfoXML(url)
62
8a16ea8db858 fixed bug in getInt
casties
parents: 61
diff changeset
746 try:
8a16ea8db858 fixed bug in getInt
casties
parents: 61
diff changeset
747 docinfo['author']=getTextFromNode(dom.xpath("//author")[0])
8a16ea8db858 fixed bug in getInt
casties
parents: 61
diff changeset
748 except:
8a16ea8db858 fixed bug in getInt
casties
parents: 61
diff changeset
749 pass
8a16ea8db858 fixed bug in getInt
casties
parents: 61
diff changeset
750 try:
8a16ea8db858 fixed bug in getInt
casties
parents: 61
diff changeset
751 docinfo['title']=getTextFromNode(dom.xpath("//title")[0])
8a16ea8db858 fixed bug in getInt
casties
parents: 61
diff changeset
752 except:
8a16ea8db858 fixed bug in getInt
casties
parents: 61
diff changeset
753 pass
8a16ea8db858 fixed bug in getInt
casties
parents: 61
diff changeset
754 try:
8a16ea8db858 fixed bug in getInt
casties
parents: 61
diff changeset
755 docinfo['year']=getTextFromNode(dom.xpath("//date")[0])
8a16ea8db858 fixed bug in getInt
casties
parents: 61
diff changeset
756 except:
8a16ea8db858 fixed bug in getInt
casties
parents: 61
diff changeset
757 pass
50
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
758 return docinfo
6c0f20cecc60 added evaluation of the presentation/info.xml in texttools
dwinter
parents: 49
diff changeset
759
70
0049d64aa464 filepath introduced
dwinter
parents: 68
diff changeset
760 def getDocinfoFromImagePath(self,path,docinfo=None,cut=0):
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
761 """path ist the path to the images it assumes that the index.meta file is one level higher."""
167
7e2b97941a66 characterNormalization
abukhman
parents: 166
diff changeset
762 logging.debug("documentViewer (getdocinfofromimagepath) path: %s"%(path))
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
763 if docinfo is None:
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
764 docinfo = {}
29
e1bed068b351 small fixes
casties
parents: 28
diff changeset
765 path=path.replace("/mpiwg/online","")
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
766 docinfo['imagePath'] = path
73
dwinter
parents: 71
diff changeset
767 docinfo=self.getDirinfoFromDigilib(path,docinfo=docinfo,cut=cut)
78
70ab234a18dc bugs in filepath mode fixes
dwinter
parents: 75
diff changeset
768
79
df6952ac93e9 bug in getDocInforFromImagePath, relative lage der index.meta zu path war falsch.
dwinter
parents: 78
diff changeset
769 pathorig=path
78
70ab234a18dc bugs in filepath mode fixes
dwinter
parents: 75
diff changeset
770 for x in range(cut):
70ab234a18dc bugs in filepath mode fixes
dwinter
parents: 75
diff changeset
771 path=getParentDir(path)
167
7e2b97941a66 characterNormalization
abukhman
parents: 166
diff changeset
772 logging.debug("documentViewer (getdocinfofromimagepath) PATH:"+path)
31
c6451e8d5d23 more small fixes - now version 0.2.2
casties
parents: 29
diff changeset
773 imageUrl=self.digilibBaseUrl+"/servlet/Scaler?fn="+path
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
774 docinfo['imageURL'] = imageUrl
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
775
79
df6952ac93e9 bug in getDocInforFromImagePath, relative lage der index.meta zu path war falsch.
dwinter
parents: 78
diff changeset
776 #path ist the path to the images it assumes that the index.meta file is one level higher.
df6952ac93e9 bug in getDocInforFromImagePath, relative lage der index.meta zu path war falsch.
dwinter
parents: 78
diff changeset
777 docinfo = self.getBibinfoFromIndexMeta(pathorig,docinfo=docinfo,cut=cut+1)
df6952ac93e9 bug in getDocInforFromImagePath, relative lage der index.meta zu path war falsch.
dwinter
parents: 78
diff changeset
778 docinfo = self.getAuthinfoFromIndexMeta(pathorig,docinfo=docinfo,cut=cut+1)
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
779 return docinfo
20
9884703dae70 new modi
dwinter
parents: 0
diff changeset
780
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
781
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
782 def getDocinfo(self, mode, url):
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
783 """returns docinfo depending on mode"""
167
7e2b97941a66 characterNormalization
abukhman
parents: 166
diff changeset
784 logging.debug("documentViewer (getdocinfo) mode: %s, url: %s"%(mode,url))
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
785 # look for cached docinfo in session
51
c5d3aabbf61b textviewer now integrated, new modus auto introduced as standard for viewing
dwinter
parents: 50
diff changeset
786 if self.REQUEST.SESSION.has_key('docinfo'):
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
787 docinfo = self.REQUEST.SESSION['docinfo']
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
788 # check if its still current
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
789 if docinfo is not None and docinfo.get('mode') == mode and docinfo.get('url') == url:
167
7e2b97941a66 characterNormalization
abukhman
parents: 166
diff changeset
790 logging.debug("documentViewer (getdocinfo) docinfo in session: %s"%docinfo)
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
791 return docinfo
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
792 # new docinfo
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
793 docinfo = {'mode': mode, 'url': url}
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
794 if mode=="texttool": #index.meta with texttool information
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
795 docinfo = self.getDocinfoFromTextTool(url, docinfo=docinfo)
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
796 elif mode=="imagepath":
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
797 docinfo = self.getDocinfoFromImagePath(url, docinfo=docinfo)
70
0049d64aa464 filepath introduced
dwinter
parents: 68
diff changeset
798 elif mode=="filepath":
75
9673218e155b minorCVS: ----------------------------------------------------------------------
dwinter
parents: 74
diff changeset
799 docinfo = self.getDocinfoFromImagePath(url, docinfo=docinfo,cut=1)
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
800 else:
167
7e2b97941a66 characterNormalization
abukhman
parents: 166
diff changeset
801 logging.error("documentViewer (getdocinfo) unknown mode: %s!"%mode)
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
802 raise ValueError("Unknown mode %s! Has to be one of 'texttool','imagepath','filepath'."%(mode))
409
f7d73ea4b38b quick fix for broken texturlpath
casties
parents: 405
diff changeset
803
f7d73ea4b38b quick fix for broken texturlpath
casties
parents: 405
diff changeset
804 # FIXME: fake texturlpath
f7d73ea4b38b quick fix for broken texturlpath
casties
parents: 405
diff changeset
805 if not docinfo.has_key('textURLPath'):
f7d73ea4b38b quick fix for broken texturlpath
casties
parents: 405
diff changeset
806 docinfo['textURLPath'] = None
f7d73ea4b38b quick fix for broken texturlpath
casties
parents: 405
diff changeset
807
167
7e2b97941a66 characterNormalization
abukhman
parents: 166
diff changeset
808 logging.debug("documentViewer (getdocinfo) docinfo: %s"%docinfo)
362
1ed87e862806 *** empty log message ***
abukhman
parents: 356
diff changeset
809 #logging.debug("documentViewer (getdocinfo) docinfo: %s"%)
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
810 self.REQUEST.SESSION['docinfo'] = docinfo
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
811 return docinfo
128
4db49915d825 Last lemma
abukhman
parents: 127
diff changeset
812
405
b8fb4c750d74 fix for characternormalization default
casties
parents: 404
diff changeset
813 def getPageinfo(self, current, start=None, rows=None, cols=None, docinfo=None, viewMode=None, tocMode=None):
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
814 """returns pageinfo with the given parameters"""
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
815 pageinfo = {}
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
816 current = getInt(current)
338
0576f524e2ee *** empty log message ***
abukhman
parents: 337
diff changeset
817
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
818 pageinfo['current'] = current
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
819 rows = int(rows or self.thumbrows)
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
820 pageinfo['rows'] = rows
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
821 cols = int(cols or self.thumbcols)
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
822 pageinfo['cols'] = cols
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
823 grpsize = cols * rows
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
824 pageinfo['groupsize'] = grpsize
61
f3d2f240692c fixed bug in calculation of group numbers
casties
parents: 59
diff changeset
825 start = getInt(start, default=(math.ceil(float(current)/float(grpsize))*grpsize-(grpsize-1)))
f3d2f240692c fixed bug in calculation of group numbers
casties
parents: 59
diff changeset
826 # int(current / grpsize) * grpsize +1))
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
827 pageinfo['start'] = start
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
828 pageinfo['end'] = start + grpsize
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
829 if (docinfo is not None) and ('numPages' in docinfo):
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
830 np = int(docinfo['numPages'])
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
831 pageinfo['end'] = min(pageinfo['end'], np)
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
832 pageinfo['numgroups'] = int(np / grpsize)
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
833 if np % grpsize > 0:
128
4db49915d825 Last lemma
abukhman
parents: 127
diff changeset
834 pageinfo['numgroups'] += 1
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
835 pageinfo['viewMode'] = viewMode
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
836 pageinfo['tocMode'] = tocMode
405
b8fb4c750d74 fix for characternormalization default
casties
parents: 404
diff changeset
837 pageinfo['characterNormalization'] = self.REQUEST.get('characterNormalization','regPlusNorm')
398
55f9eeebc338 *** empty log message ***
abukhman
parents: 397
diff changeset
838 pageinfo['optionToggle'] = self.REQUEST.get('optionToggle','')
55f9eeebc338 *** empty log message ***
abukhman
parents: 397
diff changeset
839 pageinfo['query'] = self.REQUEST.get('query','')
384
4ec393062711 *** empty log message ***
abukhman
parents: 382
diff changeset
840 pageinfo['queryType'] = self.REQUEST.get('queryType','')
95
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
841 pageinfo['querySearch'] =self.REQUEST.get('querySearch', 'fulltext')
99
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
842 pageinfo['textPN'] = self.REQUEST.get('textPN','1')
384
4ec393062711 *** empty log message ***
abukhman
parents: 382
diff changeset
843 pageinfo['highlightQuery'] = self.REQUEST.get('highlightQuery','')
95
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
844 pageinfo['tocPageSize'] = self.REQUEST.get('tocPageSize', '30')
105
6bffb612cd6a *** empty log message ***
abukhman
parents: 104
diff changeset
845 pageinfo['queryPageSize'] =self.REQUEST.get('queryPageSize', '10')
90
6a4a72033d58 new version with new full-text infrastructure and some more changed templates
casties
parents: 84
diff changeset
846 pageinfo['tocPN'] = self.REQUEST.get('tocPN', '1')
99
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
847 toc = int (pageinfo['tocPN'])
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
848 pageinfo['textPages'] =int (toc)
158
4f4fe4e56ffe characterNormalization
abukhman
parents: 157
diff changeset
849
362
1ed87e862806 *** empty log message ***
abukhman
parents: 356
diff changeset
850
326
446cb6197547 *** empty log message ***
abukhman
parents: 310
diff changeset
851
99
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
852 if 'tocSize_%s'%tocMode in docinfo:
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
853 tocSize = int(docinfo['tocSize_%s'%tocMode])
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
854 tocPageSize = int(pageinfo['tocPageSize'])
128
4db49915d825 Last lemma
abukhman
parents: 127
diff changeset
855 # cached toc
99
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
856 if tocSize%tocPageSize>0:
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
857 tocPages=tocSize/tocPageSize+1
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
858 else:
4738a696d265 Search function update
abukhman
parents: 97
diff changeset
859 tocPages=tocSize/tocPageSize
128
4db49915d825 Last lemma
abukhman
parents: 127
diff changeset
860 pageinfo['tocPN'] = min (tocPages,toc)
95
db6d594aa4d9 Last update with search function (getSearch)
abukhman
parents: 90
diff changeset
861 pageinfo['searchPN'] =self.REQUEST.get('searchPN','1')
112
d48c1d507556 *** empty log message ***
abukhman
parents: 109
diff changeset
862 pageinfo['sn'] =self.REQUEST.get('sn','')
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
863 return pageinfo
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
864
128
4db49915d825 Last lemma
abukhman
parents: 127
diff changeset
865 def changeDocumentViewer(self,title="",digilibBaseUrl=None,thumbrows=2,thumbcols=5,authgroups='mpiwg',RESPONSE=None):
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
866 """init document viewer"""
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
867 self.title=title
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
868 self.digilibBaseUrl = digilibBaseUrl
25
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
869 self.thumbrows = thumbrows
e93fb8cadd3a new, less preliminary version 0.2
casties
parents: 22
diff changeset
870 self.thumbcols = thumbcols
32
b25c89d693cf version 0.2.3 - first version with access control!
casties
parents: 31
diff changeset
871 self.authgroups = [s.strip().lower() for s in authgroups.split(',')]
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
872 if RESPONSE is not None:
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
873 RESPONSE.redirect('manage_main')
0
dwinter
parents:
diff changeset
874
dwinter
parents:
diff changeset
875 def manage_AddDocumentViewerForm(self):
dwinter
parents:
diff changeset
876 """add the viewer form"""
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
877 pt=PageTemplateFile('zpt/addDocumentViewer', globals()).__of__(self)
0
dwinter
parents:
diff changeset
878 return pt()
dwinter
parents:
diff changeset
879
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
880 def manage_AddDocumentViewer(self,id,imageScalerUrl="",textServerName="",title="",RESPONSE=None):
0
dwinter
parents:
diff changeset
881 """add the viewer"""
84
a6e4f9b6729a first version with new full-text infrastructure and slightly changed templates
casties
parents: 83
diff changeset
882 newObj=documentViewer(id,imageScalerUrl=imageScalerUrl,title=title,textServerName=textServerName)
0
dwinter
parents:
diff changeset
883 self._setObject(id,newObj)
dwinter
parents:
diff changeset
884
dwinter
parents:
diff changeset
885 if RESPONSE is not None:
dwinter
parents:
diff changeset
886 RESPONSE.redirect('manage_main')
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
887
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
888 ## DocumentViewerTemplate class
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
889 class DocumentViewerTemplate(ZopePageTemplate):
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
890 """Template for document viewer"""
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
891 meta_type="DocumentViewer Template"
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
892
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
893
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
894 def manage_addDocumentViewerTemplateForm(self):
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
895 """Form for adding"""
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
896 pt=PageTemplateFile('zpt/addDocumentViewerTemplate', globals()).__of__(self)
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
897 return pt()
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
898
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
899 def manage_addDocumentViewerTemplate(self, id='viewer_main', title=None, text=None,
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
900 REQUEST=None, submit=None):
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
901 "Add a Page Template with optional file content."
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
902
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
903 self._setObject(id, DocumentViewerTemplate(id))
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
904 ob = getattr(self, id)
53
f4e0af8c281d NEW - # 44: ECHO - vollst?ndige bibliographische Angabe
dwinter
parents: 52
diff changeset
905 txt=file(os.path.join(package_home(globals()),'zpt/viewer_main.zpt'),'r').read()
167
7e2b97941a66 characterNormalization
abukhman
parents: 166
diff changeset
906 logging.info("txt %s:"%txt)
53
f4e0af8c281d NEW - # 44: ECHO - vollst?ndige bibliographische Angabe
dwinter
parents: 52
diff changeset
907 ob.pt_edit(txt,"text/html")
22
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
908 if title:
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
909 ob.pt_setTitle(title)
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
910 try:
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
911 u = self.DestinationURL()
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
912 except AttributeError:
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
913 u = REQUEST['URL1']
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
914
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
915 u = "%s/%s" % (u, urllib.quote(id))
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
916 REQUEST.RESPONSE.redirect(u+'/manage_main')
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
917 return ''
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
918
b139f9937e97 preliminary version 0.2
casties
parents: 20
diff changeset
919
41
0c8ee8fcfd76 some more logging
casties
parents: 40
diff changeset
920