Context Navigation

source: documentViewer/documentViewer.py @ 137:2fa9d30f4ab0

Last change on this file since 137:2fa9d30f4ab0 was 137:2fa9d30f4ab0, checked in by casties, 14 years ago
debugging user authentication
File size: 30.5 KB

Line
1
2	from OFS.Folder import Folder
3	from Products.PageTemplates.ZopePageTemplate import ZopePageTemplate
4	from Products.PageTemplates.PageTemplateFile import PageTemplateFile
5	from AccessControl import ClassSecurityInfo
6	from AccessControl import getSecurityManager
7	from Globals import package_home
8
9	from Ft.Xml import EMPTY_NAMESPACE, Parse
10	import Ft.Xml.Domlette
11	import os.path
12	import sys
13	import urllib
14	import urllib2
15	import logging
16	import math
17	import urlparse
18	import cStringIO
19
def logger(txt,method,txt2):
    """Log ``txt`` immediately followed by ``txt2`` at INFO level.

    ``method`` is accepted so existing callers keep working, but it is
    not used: the message always goes to ``logging.info``.
    """
    message = txt + txt2
    logging.info(message)
23
24
def getInt(number, default=0):
    """Convert ``number`` to an int, falling back to ``int(default)``.

    @param number: value to convert (typically a request parameter)
    @param default: value used when ``number`` cannot be converted
    @return: ``int(number)``, or ``int(default)`` on conversion failure
    """
    try:
        return int(number)
    except (TypeError, ValueError, OverflowError):
        # only conversion problems trigger the fallback; anything else
        # (e.g. KeyboardInterrupt) must not be swallowed here
        return int(default)
31
def getTextFromNode(nodename):
    """Return the concatenated text of the direct text children of a node.

    @param nodename: DOM node (despite the name) or None
    @return: joined ``data`` of all child nodes whose type is TEXT_NODE;
        the empty string if ``nodename`` is None or has no text children
    """
    if nodename is None:
        return ""
    pieces = [child.data
              for child in nodename.childNodes
              if child.nodeType == child.TEXT_NODE]
    return "".join(pieces)
42
def serializeNode(node, encoding='utf-8'):
    """Serialize a DOM node to an XML string.

    The node is printed with ``Ft.Xml.Domlette.Print`` into an in-memory
    buffer using the given encoding; the buffer content is returned.
    """
    out = cStringIO.StringIO()
    Ft.Xml.Domlette.Print(node, stream=out, encoding=encoding)
    xml = out.getvalue()
    out.close()
    return xml
50
51
def getParentDir(path):
    """Return ``path`` without its last '/'-separated component.

    A path containing no '/' yields the empty string.
    """
    lastSlash = path.rfind('/')
    if lastSlash < 0:
        return ''
    return path[:lastSlash]
55
56
57	def getHttpData(url, data=None, num_tries=3, timeout=10):
58	"""returns result from url+data HTTP request"""
59	# we do GET (by appending data to url)
60	if isinstance(data, str) or isinstance(data, unicode):
61	# if data is string then append
62	url = "%s?%s"%(url,data)
63	elif isinstance(data, dict) or isinstance(data, list) or isinstance(data, tuple):
64	# urlencode
65	url = "%s?%s"%(url,urllib.urlencode(data))
66
67	response = None
68	errmsg = None
69	for cnt in range(num_tries):
70	try:
71	logging.debug("getHttpData(#%s %ss) url=%s"%(cnt+1,timeout,url))
72	if sys.version_info < (2, 6):
73	# set timeout on socket -- ugly :-(
74	import socket
75	socket.setdefaulttimeout(float(timeout))
76	response = urllib2.urlopen(url)
77	else:
78	response = urllib2.urlopen(url,timeout=float(timeout))
79	# check result?
80	break
81	except urllib2.HTTPError, e:
82	logging.error("getHttpData: HTTP error(%s): %s"%(e.code,e))
83	errmsg = str(e)
84	# stop trying
85	break
86	except urllib2.URLError, e:
87	logging.error("getHttpData: URLLIB error(%s): %s"%(e.reason,e))
88	errmsg = str(e)
89	# stop trying
90	#break
91
92	if response is not None:
93	data = response.read()
94	response.close()
95	return data
96
97	raise IOError("ERROR fetching HTTP data from %s: %s"%(url,errmsg))
98	#return None
99
100
101
102	##
103	## documentViewer class
104	##
class documentViewer(Folder):
    """Document viewer: a Zope Folder that renders documents through the
    page templates declared below."""
    meta_type="Document viewer"

    security=ClassSecurityInfo()
    # add a 'main config' tab (changeDocumentViewerForm) to the Folder tabs
    manage_options=Folder.manage_options+(
        {'label':'main config','action':'changeDocumentViewerForm'},
        )

    # templates and forms
    viewer_main = PageTemplateFile('zpt/viewer_main', globals())
    toc_thumbs = PageTemplateFile('zpt/toc_thumbs', globals())
    toc_text = PageTemplateFile('zpt/toc_text', globals())
    toc_figures = PageTemplateFile('zpt/toc_figures', globals())
    page_main_images = PageTemplateFile('zpt/page_main_images', globals())
    page_main_text = PageTemplateFile('zpt/page_main_text', globals())
    page_main_text_dict = PageTemplateFile('zpt/page_main_text_dict', globals())
    page_main_xml = PageTemplateFile('zpt/page_main_xml', globals())
    head_main = PageTemplateFile('zpt/head_main', globals())
    docuviewer_css = PageTemplateFile('css/docuviewer.css', globals())
    info_xml = PageTemplateFile('zpt/info_xml', globals())


    thumbs_main_rss = PageTemplateFile('zpt/thumbs_main_rss', globals())
    # the configuration form requires the 'View management screens' permission
    security.declareProtected('View management screens','changeDocumentViewerForm')
    changeDocumentViewerForm = PageTemplateFile('zpt/changeDocumentViewer', globals())
131
132
133	def __init__(self,id,imageScalerUrl=None,textServerName=None,title="",digilibBaseUrl=None,thumbcols=2,thumbrows=5,authgroups="mpiwg"):
134	"""init document viewer"""
135	self.id=id
136	self.title=title
137	self.thumbcols = thumbcols
138	self.thumbrows = thumbrows
139	# authgroups is list of authorized groups (delimited by ,)
140	self.authgroups = [s.strip().lower() for s in authgroups.split(',')]
141	# create template folder so we can always use template.something
142
143	templateFolder = Folder('template')
144	#self['template'] = templateFolder # Zope-2.12 style
145	self._setObject('template',templateFolder) # old style
146	try:
147	import MpdlXmlTextServer
148	textServer = MpdlXmlTextServer.MpdlXmlTextServer(id='fulltextclient',serverName=textServerName)
149	#templateFolder['fulltextclient'] = xmlRpcClient
150	templateFolder._setObject('fulltextclient',textServer)
151	except Exception, e:
152	logging.error("Unable to create MpdlXmlTextServer for fulltextclient: "+str(e))
153	try:
154	from Products.zogiLib.zogiLib import zogiLib
155	zogilib = zogiLib(id="zogilib", title="zogilib for docuviewer", dlServerURL=imageScalerUrl, layout="book")
156	#templateFolder['zogilib'] = zogilib
157	templateFolder._setObject('zogilib',zogilib)
158	except Exception, e:
159	logging.error("Unable to create zogiLib for zogilib: "+str(e))
160
161
162	# proxy text server methods to fulltextclient
def getTextPage(self, **args):
    """Forward getTextPage to template.fulltextclient."""
    client = self.template.fulltextclient
    return client.getTextPage(**args)

def getQuery(self, **args):
    """Forward getQuery to template.fulltextclient."""
    client = self.template.fulltextclient
    return client.getQuery(**args)

def getSearch(self, **args):
    """Forward getSearch to template.fulltextclient."""
    client = self.template.fulltextclient
    return client.getSearch(**args)

def getNumPages(self, docinfo):
    """Forward getNumPages(docinfo) to template.fulltextclient."""
    client = self.template.fulltextclient
    return client.getNumPages(docinfo)

def getTranslate(self, **args):
    """Forward getTranslate to template.fulltextclient."""
    client = self.template.fulltextclient
    return client.getTranslate(**args)

def getLemma(self, **args):
    """Forward getLemma to template.fulltextclient."""
    client = self.template.fulltextclient
    return client.getLemma(**args)

def getToc(self, **args):
    """Forward getToc to template.fulltextclient."""
    client = self.template.fulltextclient
    return client.getToc(**args)

def getTocPage(self, **args):
    """Forward getTocPage to template.fulltextclient."""
    client = self.template.fulltextclient
    return client.getTocPage(**args)
194
195
196	security.declareProtected('View','thumbs_rss')
def thumbs_rss(self,mode,url,viewMode="auto",start=None,pn=1):
    '''
    render the thumbnail overview with the thumbs_main_rss template
    @param mode: defines how to access the document behind url
    @param url: url which contains display information
    @param viewMode: text, images or auto (default); auto selects text if
        the docinfo has a text URL and images otherwise
    @param start: first page of the thumbnail group, passed to getPageinfo
    @param pn: current page number, passed to getPageinfo
    '''
    logging.debug("HHHHHHHHHHHHHH:load the rss")
    logging.info("documentViewer (index)" + "mode: %s url:%s start:%s pn:%s"%(mode,url,start,pn))

    if not hasattr(self, 'template'):
        # create template folder if it doesn't exist
        self.manage_addFolder('template')

    # the attribute may be missing entirely, so read it defensively
    if not getattr(self, 'digilibBaseUrl', None):
        self.digilibBaseUrl = self.findDigilibUrl() or "http://nausikaa.mpiwg-berlin.mpg.de/digitallibrary"

    docinfo = self.getDocinfo(mode=mode,url=url)
    pageinfo = self.getPageinfo(start=start,current=pn,docinfo=docinfo)
    pt = getattr(self.template, 'thumbs_main_rss')

    if viewMode=="auto": # auto mode selected
        if ("textURL" in docinfo) or ('textURLPath' in docinfo): # a text URL is set
            viewMode="text"
        else:
            viewMode="images"

    return pt(docinfo=docinfo,pageinfo=pageinfo,viewMode=viewMode)
226
227	security.declareProtected('View','index_html')
def index_html(self,url,mode="texttool",viewMode="auto",tocMode="thumbs",start=None,pn=1,mk=None, query=None, querySearch=None):
    '''
    main view: render the document with the viewer_main template
    @param url: url which contains display information
    @param mode: defines how to access the document behind url
    @param viewMode: text, images or auto (default); auto selects text_dict
        if the docinfo has a text URL and images otherwise
    @param tocMode: type of 'table of contents' for navigation (thumbs, text, figures, none)
    @param start: first page of the thumbnail group, passed to getPageinfo
    @param pn: current page number, passed to getPageinfo
    @param mk: mark or list of marks, handed to generateMarks
    @param query: not used by this method itself
    @param querySearch: type of different search modes (fulltext, fulltextMorph, xpath, xquery, ftIndex, ftIndexMorph, fulltextMorphLemma); not used by this method itself
    '''

    logging.debug("documentViewer (index) mode: %s url:%s start:%s pn:%s"%(mode,url,start,pn))

    # without the template folder nothing can be rendered
    if not hasattr(self, 'template'):
        logging.error("template folder missing!")
        return "ERROR: template folder missing!"

    configuredUrl = getattr(self, 'digilibBaseUrl', None)
    if not configuredUrl:
        self.digilibBaseUrl = self.findDigilibUrl() or "http://digilib.mpiwg-berlin.mpg.de/digitallibrary"

    docinfo = self.getDocinfo(mode=mode,url=url)

    # every toc except the thumbnails has to be fetched
    if tocMode != "thumbs":
        docinfo = self.getToc(mode=tocMode, docinfo=docinfo)

    if viewMode == "auto":
        # auto mode: show text when a text URL is known, images otherwise
        hasText = ('textURL' in docinfo) or ('textURLPath' in docinfo)
        if hasText:
            viewMode = "text_dict"
        else:
            viewMode = "images"

    pageinfo = self.getPageinfo(start=start,current=pn,docinfo=docinfo,viewMode=viewMode,tocMode=tocMode)

    template = getattr(self.template, 'viewer_main')
    marks = self.generateMarks(mk)
    return template(docinfo=docinfo,pageinfo=pageinfo,viewMode=viewMode,mk=marks)
264
def generateMarks(self,mk):
    # Builds the "mk=..." string passed to the viewer_main template:
    # None gives "", a single value is treated as a one-element list and
    # every element contributes "mk=<value>", concatenated without any
    # separator.
    # NOTE(review): kept without a docstring like the original; in Zope 2
    # adding one may make the method publishable by URL -- confirm first.
    if mk is None:
        return ""
    if isinstance(mk, list):
        marks = mk
    else:
        marks = [mk]
    return "".join(["mk=%s"%m for m in marks])
274
275
def findDigilibUrl(self):
    """Return the digilib base URL reported by template.zogilib."""
    return self.template.zogilib.getDLBaseUrl()
280
def getDocumentViewerURL(self):
    """Return the absolute URL of this viewer instance."""
    viewerUrl = self.absolute_url()
    return viewerUrl
284
def getStyle(self, idx, selected, style=""):
    """Return ``style``, with 'sel' appended when ``idx`` equals ``selected``."""
    if idx != selected:
        return style
    return style + 'sel'
292
def getLink(self,param=None,val=None):
    """Return a link to this viewer built from the current request form.

    With ``param`` given, that parameter is set to ``str(val)``, or
    removed from the query when ``val`` is None.
    """
    query = self.REQUEST.form.copy()
    if param is not None:
        if val is not None:
            query[param] = str(val)
        elif param in query:
            del query[param]

    # if the first call used mode=filepath, switch to imagepath from now on
    if query.get("mode", None) == "filepath":
        query["mode"] = "imagepath"
        query["url"] = getParentDir(query["url"])

    # quote values and assemble into query string
    ps = urllib.urlencode(query)
    return self.REQUEST['URL1']+"?"+ps
312
def getLinkAmp(self,param=None,val=None):
    """Return a link to this viewer built from the current request form.

    With ``param`` given, that parameter is set to ``str(val)``, or
    removed from the query when ``val`` is None. Only the values are
    quoted (with urllib.quote); keys are used as they are.
    """
    query = self.REQUEST.form.copy()
    if param is not None:
        if val is not None:
            query[param] = str(val)
        elif param in query:
            del query[param]

    # quote values and assemble into query string
    logging.debug("XYXXXXX: %s"%repr(query.items()))
    pairs = ["%s=%s"%(k,urllib.quote(v)) for (k, v) in query.items()]
    ps = "&".join(pairs)
    return self.REQUEST['URL1']+"?"+ps
328
def getInfo_xml(self,url,mode):
    """Return info about the document as rendered by the info_xml template.

    @param url: url which contains display information
    @param mode: defines how to access the document behind url
    """

    # the attribute may be missing entirely, so read it defensively
    if not getattr(self, 'digilibBaseUrl', None):
        self.digilibBaseUrl = self.findDigilibUrl() or "http://nausikaa.mpiwg-berlin.mpg.de/digitallibrary"

    docinfo = self.getDocinfo(mode=mode,url=url)
    pt = getattr(self.template, 'info_xml')
    return pt(docinfo=docinfo)
338
339
def isAccessible(self, docinfo):
    """Decide whether access to the resource described by docinfo is granted.

    Access type 'free' is always granted. A missing access type, or one
    listed in self.authgroups, is granted to any user whose name is not
    "Anonymous User". Every other access type is denied.
    """
    access = docinfo.get('accessType', None)
    logging.debug("documentViewer (accessOK) access type %s"%access)

    if access == 'free':
        logging.debug("documentViewer (accessOK) access is free")
        return True

    if access is not None and access not in self.authgroups:
        logging.error("documentViewer (accessOK) unknown access type %s"%access)
        return False

    # only local access -- only logged in users
    user = getSecurityManager().getUser()
    logging.debug("documentViewer (accessOK) user=%s ip=%s"%(user,self.REQUEST.getClientAddr()))
    if user is None:
        return False
    return (user.getUserName() != "Anonymous User")
359
360
def getDirinfoFromDigilib(self,path,docinfo=None,cut=0):
    """Read directory information for ``path`` from digilib's dirInfo-xml.jsp.

    @param path: image directory path
    @param docinfo: dict to update; a new one is created if None
    @param cut: number of trailing path components to strip first
    @return: docinfo with 'numPages' set to the reported directory size
        (0 if the answer contains no size)
    @raise IOError: if the information could not be fetched
    """
    if docinfo is None:
        docinfo = {}

    for x in range(cut):
        path=getParentDir(path)

    infoUrl=self.digilibBaseUrl+"/dirInfo-xml.jsp?mo=dir&fn="+path

    logging.debug("documentViewer (getparamfromdigilib) dirInfo from %s"%(infoUrl))

    txt = getHttpData(infoUrl)
    if txt is None:
        raise IOError("Unable to get dir-info from %s"%(infoUrl))

    dom = Parse(txt)
    sizes=dom.xpath("//dir/size")
    # the format string needs a placeholder, otherwise sizes is never shown
    logging.debug("documentViewer (getparamfromdigilib) dirInfo:size %s"%(sizes,))

    if sizes:
        docinfo['numPages'] = int(getTextFromNode(sizes[0]))
    else:
        docinfo['numPages'] = 0

    # TODO: produce and keep list of image names and numbers

    return docinfo
390
391
def getIndexMeta(self, url):
    """Fetch and parse the index.meta document at ``url``.

    @param url: either a complete http(s) URL or an online path, which
        is read through digilib's Texter servlet
    @return: parsed DOM of the document
    @raise IOError: if the document could not be fetched
    """
    dom = None
    metaUrl = None
    if url.startswith("http://") or url.startswith("https://"):
        # real URL
        metaUrl = url
    else:
        # online path
        server=self.digilibBaseUrl+"/servlet/Texter?fn="
        metaUrl=server+url.replace("/mpiwg/online","")
        # NOTE(review): nesting reconstructed from a flattened listing;
        # the suffix is assumed to be added for online paths only
        if not metaUrl.endswith("index.meta"):
            metaUrl += "/index.meta"

    logging.debug("(getIndexMeta): METAURL: %s"%metaUrl)
    txt=getHttpData(metaUrl)
    if txt is None:
        raise IOError("Unable to read index meta from %s"%(url))

    dom = Parse(txt)
    return dom
413
def getPresentationInfoXML(self, url):
    """Fetch and parse the presentation info.xml document at ``url``.

    @param url: either a complete http(s) URL or an online path, which
        is read through digilib's Texter servlet
    @return: parsed DOM of the document
    @raise IOError: if the document could not be fetched
    """
    dom = None
    metaUrl = None
    if url.startswith("http://") or url.startswith("https://"):
        # real URL
        metaUrl = url
    else:
        # online path
        server=self.digilibBaseUrl+"/servlet/Texter?fn="
        metaUrl=server+url.replace("/mpiwg/online","")

    txt=getHttpData(metaUrl)
    if txt is None:
        raise IOError("Unable to read infoXMLfrom %s"%(url))

    dom = Parse(txt)
    return dom
432
433
def getAuthinfoFromIndexMeta(self,path,docinfo=None,dom=None,cut=0):
    """Read the access type from an index.meta document.

    @param path: path of the index.meta file; only read if dom is None
    @param docinfo: dict to update; a new one is created if None
    @param dom: already parsed index.meta, if available
    @param cut: number of trailing path components to strip before
        fetching (only used if dom is None)
    @return: docinfo with 'accessType' set to the type attribute of the
        access element, to the lower-cased name of the group/institution
        for those two types, or to None if there is no access element
    """
    logging.debug("documentViewer (getauthinfofromindexmeta) path: %s"%(path))

    access = None

    if docinfo is None:
        docinfo = {}

    if dom is None:
        for x in range(cut):
            path=getParentDir(path)
        dom = self.getIndexMeta(path)

    acctype = dom.xpath("//access-conditions/access/@type")
    if acctype:
        access=acctype[0].value
        if access in ['group', 'institution']:
            names = dom.xpath("//access-conditions/access/name")
            if names:
                access = getTextFromNode(names[0]).lower()
            else:
                # keep the bare type instead of failing with an IndexError
                logging.warning("documentViewer (getauthinfofromindexmeta) access name missing in: %s"%(path))

    docinfo['accessType'] = access
    return docinfo
456
457
def getBibinfoFromIndexMeta(self,path,docinfo=None,dom=None,cut=0):
    """Read bibliographical information from an index.meta document.

    @param path: path of the index.meta file; only read if dom is None
    @param docinfo: dict to update; a new one is created if None
    @param dom: already parsed index.meta, if available
    @param cut: number of trailing path components to strip before
        fetching (only used if dom is None)
    @return: docinfo with 'bib' (all raw bib fields, if any), 'bib_type'
        and, where the metadata mapping allows it, 'author', 'title',
        'year' and 'lang'
    """
    logging.debug("documentViewer (getbibinfofromindexmeta) path: %s"%(path))

    if docinfo is None:
        docinfo = {}

    if dom is None:
        for x in range(cut):
            path=getParentDir(path)
        dom = self.getIndexMeta(path)

    logging.debug("documentViewer (getbibinfofromindexmeta cutted) path: %s"%(path))
    # put in all raw bib fields as dict "bib"
    bib = dom.xpath("//bib/*")
    if bib:
        bibinfo = {}
        for e in bib:
            bibinfo[e.localName] = getTextFromNode(e)
        docinfo['bib'] = bibinfo

    # extract some fields (author, title, year) according to their mapping
    metaData=self.metadata.main.meta.bib
    bibtype=dom.xpath("//bib/@type")
    if bibtype:
        bibtype=bibtype[0].value
    else:
        bibtype="generic"

    bibtype=bibtype.replace("-"," ") # index.meta uses "-" where the mapping uses " "
    docinfo['bib_type'] = bibtype
    bibmap=metaData.generateMappingForType(bibtype)
    # if there is no mapping bibmap is empty (mapping sometimes has empty fields)
    if len(bibmap) > 0 and len(bibmap['author'][0]) > 0:
        for field in ('author', 'title', 'year'):
            try:
                docinfo[field]=getTextFromNode(dom.xpath("//bib/%s"%bibmap[field][0])[0])
            except Exception:
                # best effort: a field that is unmapped or absent is skipped
                pass
        logging.debug("documentViewer (getbibinfofromindexmeta) using mapping for %s"%bibtype)
        # NOTE(review): nesting reconstructed from a flattened listing; the
        # language lookup is assumed to belong to this branch -- confirm
        try:
            docinfo['lang']=getTextFromNode(dom.xpath("//bib/lang")[0])
        except Exception:
            docinfo['lang']=''

    return docinfo
508
509
def getDocinfoFromTextTool(self, url, dom=None, docinfo=None):
    """Build docinfo from the resource and texttool entries of an index.meta.

    @param url: location of the index.meta; it is fetched if dom is None
    @param dom: already parsed index.meta, if available
    @param docinfo: dict to update; a new one is created if None
    @return: docinfo, extended where the entries exist with image, viewer
        and text URLs plus bibliographical and access information
    @raise IOError: if no archive path can be determined
    """
    # NOTE(review): block nesting was reconstructed from a flattened
    # listing -- verify against the repository before relying on it
    logging.debug("documentViewer (getdocinfofromtexttool) url: %s" % (url))
    if docinfo is None:
        docinfo = {}
    if docinfo.get('lang', None) is None:
        docinfo['lang'] = '' # default: no language set
    if dom is None:
        dom = self.getIndexMeta(url)

    archivePath = None
    archiveName = None

    archiveNames = dom.xpath("//resource/name")
    if archiveNames and (len(archiveNames) > 0):
        archiveName = getTextFromNode(archiveNames[0])
    else:
        logging.warning("documentViewer (getdocinfofromtexttool) resource/name missing in: %s" % (url))

    archivePaths = dom.xpath("//resource/archive-path")
    if archivePaths and (len(archivePaths) > 0):
        archivePath = getTextFromNode(archivePaths[0])
        # clean up archive path
        if archivePath[0] != '/':
            archivePath = '/' + archivePath
        if archiveName and (not archivePath.endswith(archiveName)):
            archivePath += "/" + archiveName
    else:
        # try to get archive-path from url
        logging.warning("documentViewer (getdocinfofromtexttool) resource/archive-path missing in: %s" % (url))
        if (not url.startswith('http')):
            archivePath = url.replace('index.meta', '')

    if archivePath is None:
        # we balk without archive-path
        raise IOError("Missing archive-path (for text-tool) in %s" % (url))

    imageDirs = dom.xpath("//texttool/image")
    if imageDirs and (len(imageDirs) > 0):
        imageDir = getTextFromNode(imageDirs[0])

    else:
        # we balk with no image tag / not necessary anymore because textmode is now standard
        #raise IOError("No text-tool info in %s"%(url))
        imageDir = ""
        #xquery="//pb"
        docinfo['imagePath'] = "" # no images
        docinfo['imageURL'] = ""

    if imageDir and archivePath:
        #print "image: ", imageDir, " archivepath: ", archivePath
        imageDir = os.path.join(archivePath, imageDir)
        imageDir = imageDir.replace("/mpiwg/online", '')
        docinfo = self.getDirinfoFromDigilib(imageDir, docinfo=docinfo)
        docinfo['imagePath'] = imageDir

        docinfo['imageURL'] = self.digilibBaseUrl + "/servlet/Scaler?fn=" + imageDir

    viewerUrls = dom.xpath("//texttool/digiliburlprefix")
    if viewerUrls and (len(viewerUrls) > 0):
        viewerUrl = getTextFromNode(viewerUrls[0])
        docinfo['viewerURL'] = viewerUrl

    # old style text URL
    textUrls = dom.xpath("//texttool/text")
    if textUrls and (len(textUrls) > 0):
        textUrl = getTextFromNode(textUrls[0])
        if urlparse.urlparse(textUrl)[0] == "": # no scheme, so not a URL
            textUrl = os.path.join(archivePath, textUrl)
        # fix URLs starting with /mpiwg/online
        if textUrl.startswith("/mpiwg/online"):
            textUrl = textUrl.replace("/mpiwg/online", '', 1)

        docinfo['textURL'] = textUrl

    # new style text-url-path
    textUrls = dom.xpath("//texttool/text-url-path")
    if textUrls and (len(textUrls) > 0):
        textUrl = getTextFromNode(textUrls[0])
        docinfo['textURLPath'] = textUrl
        # NOTE(review): 'imagePath' is only set above when there is no
        # image tag or the image tag has text; an empty image tag looks
        # like it would raise KeyError here -- confirm
        if not docinfo['imagePath']:
            # text-only, no page images
            docinfo = self.getNumPages(docinfo)

    presentationUrls = dom.xpath("//texttool/presentation")
    docinfo = self.getBibinfoFromIndexMeta(url, docinfo=docinfo, dom=dom) # get info from bib tag

    if presentationUrls and (len(presentationUrls) > 0): # override these with the presentation information
        # the presentation URL is obtained by replacing index.meta in the
        # metadata URL with the relative path to the presentation info
        presentationPath = getTextFromNode(presentationUrls[0])
        if url.endswith("index.meta"):
            presentationUrl = url.replace('index.meta', presentationPath)
        else:
            presentationUrl = url + "/" + presentationPath

        docinfo = self.getBibinfoFromTextToolPresentation(presentationUrl, docinfo=docinfo, dom=dom)

    docinfo = self.getAuthinfoFromIndexMeta(url, docinfo=docinfo, dom=dom) # get access info

    return docinfo
611
612
def getBibinfoFromTextToolPresentation(self,url,docinfo=None,dom=None):
    """Read author, title and year from the texttool presentation info.

    @param url: location of the presentation info XML, which is always
        fetched from there
    @param docinfo: dict to update; a new one is created if None
    @param dom: accepted for compatibility; not used
    @return: docinfo with 'author', 'title' and 'year' set from the
        first //author, //title and //date element, where present
    """
    if docinfo is None:
        # without this every assignment below failed silently and the
        # method returned None
        docinfo = {}
    dom=self.getPresentationInfoXML(url)
    for key, expr in (('author', "//author"), ('title', "//title"), ('year', "//date")):
        try:
            nodes = dom.xpath(expr)
            if nodes:
                docinfo[key]=getTextFromNode(nodes[0])
        except Exception:
            # best effort: a field that cannot be read is left as it was
            logging.debug("documentViewer (getbibinfofromtexttoolpresentation) unable to read %s"%expr, exc_info=True)
    return docinfo
630
def getDocinfoFromImagePath(self,path,docinfo=None,cut=0):
    """Build docinfo for a directory of page images.

    ``path`` is the path to the images; the index.meta file is assumed
    to be one level higher. ``cut`` is the number of trailing path
    components to strip for the image URL and the directory lookup.
    """
    logging.debug("documentViewer (getdocinfofromimagepath) path: %s"%(path))
    if docinfo is None:
        docinfo = {}
    imagePath = path.replace("/mpiwg/online","")
    docinfo['imagePath'] = imagePath
    docinfo = self.getDirinfoFromDigilib(imagePath,docinfo=docinfo,cut=cut)

    # the scaler URL uses the shortened path; imagePath stays uncut
    scalerPath = imagePath
    for step in range(cut):
        scalerPath = getParentDir(scalerPath)
    logging.debug("documentViewer (getdocinfofromimagepath) PATH:"+scalerPath)
    docinfo['imageURL'] = self.digilibBaseUrl+"/servlet/Scaler?fn="+scalerPath

    # index.meta is looked up one level above the (cut) image directory
    metaCut = cut+1
    docinfo = self.getBibinfoFromIndexMeta(imagePath,docinfo=docinfo,cut=metaCut)
    docinfo = self.getAuthinfoFromIndexMeta(imagePath,docinfo=docinfo,cut=metaCut)
    return docinfo
651
652
def getDocinfo(self, mode, url):
    """Return the docinfo for ``url``, read according to ``mode``.

    A docinfo stored in the session is reused when its mode and url
    match; otherwise a new one is built and stored in the session.
    Raises ValueError for a mode other than 'texttool', 'imagepath' or
    'filepath'.
    """
    logging.debug("documentViewer (getdocinfo) mode: %s, url: %s"%(mode,url))
    # look for cached docinfo in session
    session = self.REQUEST.SESSION
    cached = session.get('docinfo', None)
    # check if its still current
    if cached is not None and cached.get('mode') == mode and cached.get('url') == url:
        logging.debug("documentViewer (getdocinfo) docinfo in session: %s"%cached)
        return cached

    # new docinfo
    docinfo = {'mode': mode, 'url': url}
    if mode == "texttool":
        # index.meta with texttool information
        docinfo = self.getDocinfoFromTextTool(url, docinfo=docinfo)
    elif mode == "imagepath":
        docinfo = self.getDocinfoFromImagePath(url, docinfo=docinfo)
    elif mode == "filepath":
        docinfo = self.getDocinfoFromImagePath(url, docinfo=docinfo,cut=1)
    else:
        logging.error("documentViewer (getdocinfo) unknown mode: %s!"%mode)
        raise ValueError("Unknown mode %s! Has to be one of 'texttool','imagepath','filepath'."%(mode))

    logging.debug("documentViewer (getdocinfo) docinfo: %s"%docinfo)
    session['docinfo'] = docinfo
    return docinfo
678
def getPageinfo(self, current, start=None, rows=None, cols=None, docinfo=None, viewMode=None, tocMode=None):
    """Assemble the pageinfo dict used by the page templates.

    @param current: current page number
    @param start: first page of the thumbnail group; by default the
        first page of the group that contains ``current``
    @param rows: thumbnail rows (default self.thumbrows)
    @param cols: thumbnail columns (default self.thumbcols)
    @param docinfo: document info dict; may be None
    @param viewMode: stored in the result as 'viewMode'
    @param tocMode: stored in the result as 'tocMode' and used to look
        up the 'tocSize_<tocMode>' entry of docinfo
    @return: dict with the paging values plus query, search and toc
        parameters read from the request
    """
    pageinfo = {}
    current = getInt(current)
    pageinfo['current'] = current
    rows = int(rows or self.thumbrows)
    pageinfo['rows'] = rows
    cols = int(cols or self.thumbcols)
    pageinfo['cols'] = cols
    grpsize = cols * rows
    pageinfo['groupsize'] = grpsize
    start = getInt(start, default=(math.ceil(float(current)/float(grpsize))*grpsize-(grpsize-1)))
    # int(current / grpsize) * grpsize +1))
    pageinfo['start'] = start
    pageinfo['end'] = start + grpsize
    if (docinfo is not None) and ('numPages' in docinfo):
        numPages = int(docinfo['numPages'])
        pageinfo['end'] = min(pageinfo['end'], numPages)
        # number of groups, rounded up
        pageinfo['numgroups'] = numPages // grpsize
        if numPages % grpsize > 0:
            pageinfo['numgroups'] += 1
    pageinfo['viewMode'] = viewMode
    pageinfo['tocMode'] = tocMode
    pageinfo['query'] = self.REQUEST.get('query',' ')
    pageinfo['queryType'] = self.REQUEST.get('queryType',' ')
    pageinfo['querySearch'] =self.REQUEST.get('querySearch', 'fulltext')
    pageinfo['textPN'] = self.REQUEST.get('textPN','1')
    pageinfo['highlightQuery'] = self.REQUEST.get('highlightQuery','')
    pageinfo['tocPageSize'] = self.REQUEST.get('tocPageSize', '30')
    pageinfo['queryPageSize'] =self.REQUEST.get('queryPageSize', '10')
    pageinfo['tocPN'] = self.REQUEST.get('tocPN', '1')
    toc = int(pageinfo['tocPN'])
    pageinfo['textPages'] = toc

    # docinfo defaults to None, so it must be checked before the lookup
    tocKey = 'tocSize_%s'%tocMode
    if (docinfo is not None) and (tocKey in docinfo):
        tocSize = int(docinfo[tocKey])
        tocPageSize = int(pageinfo['tocPageSize'])
        # cached toc: number of toc pages, rounded up
        tocPages = tocSize // tocPageSize
        if tocSize % tocPageSize > 0:
            tocPages += 1
        # never point beyond the last toc page
        pageinfo['tocPN'] = min(tocPages,toc)
    pageinfo['searchPN'] =self.REQUEST.get('searchPN','1')
    pageinfo['sn'] =self.REQUEST.get('sn','')
    return pageinfo
725
def changeDocumentViewer(self,title="",digilibBaseUrl=None,thumbrows=2,thumbcols=5,authgroups='mpiwg',RESPONSE=None):
    """Store new configuration values for the viewer.

    ``authgroups`` is a comma-separated list of group names; they are
    stored stripped and lower-cased. If RESPONSE is given, it is
    redirected to manage_main afterwards.
    """
    self.title = title
    self.digilibBaseUrl = digilibBaseUrl
    self.thumbrows = thumbrows
    self.thumbcols = thumbcols
    groups = []
    for name in authgroups.split(','):
        groups.append(name.strip().lower())
    self.authgroups = groups
    if RESPONSE is None:
        return
    RESPONSE.redirect('manage_main')
735
def manage_AddDocumentViewerForm(self):
    """Render the form for adding a document viewer."""
    form = PageTemplateFile('zpt/addDocumentViewer', globals())
    return form.__of__(self)()
740
def manage_AddDocumentViewer(self,id,imageScalerUrl="",textServerName="",title="",RESPONSE=None):
    """Create a document viewer with the given id and add it to ``self``.

    If RESPONSE is given, it is redirected to manage_main afterwards.
    """
    viewer = documentViewer(id,imageScalerUrl=imageScalerUrl,title=title,textServerName=textServerName)
    self._setObject(id,viewer)

    if RESPONSE is None:
        return
    RESPONSE.redirect('manage_main')
748
749	## DocumentViewerTemplate class
class DocumentViewerTemplate(ZopePageTemplate):
    """Page template for the document viewer, with its own meta_type."""
    meta_type = "DocumentViewer Template"
753
754
def manage_addDocumentViewerTemplateForm(self):
    """Render the form for adding a document viewer template."""
    form = PageTemplateFile('zpt/addDocumentViewerTemplate', globals())
    return form.__of__(self)()
759
def manage_addDocumentViewerTemplate(self, id='viewer_main', title=None, text=None,
                                     REQUEST=None, submit=None):
    """Add a DocumentViewerTemplate filled with the packaged viewer_main.zpt.

    @param id: id of the new template object
    @param title: optional title of the template
    @param text: not used
    @param REQUEST: if given, it is redirected to the manage_main page
        of the new template
    @param submit: not used
    @return: the empty string
    """

    self._setObject(id, DocumentViewerTemplate(id))
    ob = getattr(self, id)
    templatePath = os.path.join(package_home(globals()),'zpt/viewer_main.zpt')
    templateFile = open(templatePath,'r')
    try:
        txt = templateFile.read()
    finally:
        # do not leave the file handle open
        templateFile.close()
    logging.info("txt %s:"%txt)
    ob.pt_edit(txt,"text/html")
    if title:
        ob.pt_setTitle(title)

    if REQUEST is None:
        # called from code rather than through the web: nothing to redirect
        return ''

    try:
        u = self.DestinationURL()
    except AttributeError:
        u = REQUEST['URL1']

    u = "%s/%s" % (u, urllib.quote(id))
    REQUEST.RESPONSE.redirect(u+'/manage_main')
    return ''
779
780
781

Note: See TracBrowser for help on using the repository browser.

Download in other formats: