--- documentViewer/documentViewer.py 2005/12/23 14:01:29 1.2
+++ documentViewer/documentViewer.py 2006/04/10 11:23:18 1.6
@@ -16,6 +16,15 @@ import Ft.Xml.XPath
import os.path
import cgi
import urllib
+import zLOG
+
+def getInt(number, default=0):
+    """Convert number to an int, falling back to default.
+
+    @param number: value to convert (e.g. a string from a request, or None)
+    @param default: value returned when the conversion fails (0 if omitted)
+    @return: int(number), or default if number cannot be converted
+    """
+    try:
+        return int(number)
+    except (TypeError, ValueError, OverflowError):
+        # only conversion failures are swallowed; anything else should surface
+        return default
+
def getTextFromNode(nodename):
nodelist=nodename.childNodes
@@ -34,199 +43,256 @@ def urlopen(url):
socket.setdefaulttimeout(5)
return ret
-def getParamFromDigilib(path,param):
- """gibt param von dlInfo aus"""
- imageUrl=genericDigilib+"/dlInfo-xml.jsp?fn="+path
-
- try:
- dom = NonvalidatingReader.parseUri(imageUrl)
- except:
- return None
-
-
- params=dom.xpath("//document-parameters/parameter[@name='%s']/@value"%param)
-
- if params:
- return params[0].value
-
-def parseUrlTextTool(url):
- """parse index meta"""
-
- try:
- dom = NonvalidatingReader.parseUri(url)
- except:
- zLOG.LOG("documentViewer (parseUrlTexttool)", zLOG.INFO,"%s (%s)"%sys.exc_info()[0:2])
- return (None,None,None)
-
- archivePaths=dom.xpath("//resource/archive-path")
-
- if archivePaths and (len(archivePaths)>0):
- archivePath=getTextFromNode(archivePaths[0])
- else:
- archivePath=None
-
- images=dom.xpath("//texttool/image")
-
- if images and (len(images)>0):
- image=getTextFromNode(images[0])
- else:
- image=None
-
- if image and archivePath:
- image=os.path.join(archivePath,image)
- image=image.replace("/mpiwg/online",'')
- pt=getParamFromDigilib(image,'pt')
-
- else:
- image=None
-
- viewerUrls=dom.xpath("//texttool/digiliburlprefix")
-
- if viewerUrls and (len(viewerUrls)>0):
- viewerUrl=getTextFromNode(viewerUrls[0])
- else:
- viewerUrl=None
-
-
- textUrls=dom.xpath("//texttool/text")
-
- if textUrls and (len(textUrls)>0):
- textUrl=getTextFromNode(textUrls[0])
- else:
- textUrl=None
- return viewerUrl,(image,pt),textUrl
-class documentViewer(ZopePageTemplate):
+##
+## documentViewer class
+##
+class documentViewer(Folder):
"""document viewer"""
meta_type="Document viewer"
security=ClassSecurityInfo()
- manage_options=ZopePageTemplate.manage_options+(
+ manage_options=Folder.manage_options+(
{'label':'main config','action':'changeDocumentViewerForm'},
)
- _default_content_fn = os.path.join(package_home(globals()),'zpt','documentViewer_template.zpt')
+ # templates and forms
+ # each template is a PageTemplateFile whose path is given relative to this module's globals()
+ viewer_main = PageTemplateFile('zpt/viewer_main', globals())
+ thumbs_main = PageTemplateFile('zpt/thumbs_main', globals())
+ image_main = PageTemplateFile('zpt/image_main', globals())
+ head_main = PageTemplateFile('zpt/head_main', globals())
+ docuviewer_css = PageTemplateFile('css/docuviewer.css', globals())
+
+ # the configuration form requires the 'View management screens' permission
+ security.declareProtected('View management screens','changeDocumentViewerForm')
+ changeDocumentViewerForm = PageTemplateFile('zpt/changeDocumentViewer', globals())
+
- def __init__(self,id,imageViewerUrl,title=""):
+ def __init__(self,id,imageViewerUrl,title="",digilibBaseUrl=None,thumbcols=2,thumbrows=10):
"""init document viewer"""
self.id=id
self.title=title
self.imageViewerUrl=imageViewerUrl
+ # no digilib base URL given: try to discover it through findDigilibUrl(),
+ # which returns None on failure (index_html retries in that case)
+ if not digilibBaseUrl:
+ self.digilibBaseUrl = self.findDigilibUrl()
+ else:
+ self.digilibBaseUrl = digilibBaseUrl
+ # size of the thumbnail grid; getPageinfo() falls back to these values
+ self.thumbcols = thumbcols
+ self.thumbrows = thumbrows
+ # add template folder so we can always use template.something
+ self.manage_addFolder('template')
+
+
+ security.declareProtected('View','index_html')
+ def index_html(self,mode,url,start=None,pn=1):
+     '''
+     Render the main viewer page for a document.
+
+     @param mode: defines which type of document is behind url
+                  ("texttool" or "imagepath", see getDocinfo)
+     @param url: url which contains display information
+     @param start: first page of the thumbnail group (None: derived from pn
+                   by getPageinfo)
+     @param pn: number of the current page
+     @return: the rendered viewer_main template, called with docinfo and pageinfo
+     '''
- security.declareProtected('View management screens','changeDocumentViewerForm')
- def changeDocumentViewerForm(self):
- """change it"""
- pt=PageTemplateFile(os.path.join(package_home(globals()),'zpt','changeDocumentViewer.zpt')).__of__(self)
- return pt()
+     zLOG.LOG("documentViewer (index)", zLOG.INFO, "mode: %s url:%s start:%s pn:%s"%(mode,url,start,pn))
+
+     if not hasattr(self, 'template'):
+         # create template folder if it doesn't exist
+         # (reported through zLOG rather than printed to the server's stdout)
+         zLOG.LOG("documentViewer (index)", zLOG.INFO, "no template folder -- creating")
+         self.manage_addFolder('template')
+
+     if not self.digilibBaseUrl:
+         # nothing configured: ask the image viewer first, then use the fixed fallback
+         self.digilibBaseUrl = self.findDigilibUrl() or "http://nausikaa.mpiwg-berlin.mpg.de/digitallibrary"
+
+     docinfo = self.getDocinfo(mode=mode,url=url)
+     pageinfo = self.getPageinfo(start=start,current=pn,docinfo=docinfo)
+     pt = getattr(self.template, 'viewer_main')
+     return pt(docinfo=docinfo,pageinfo=pageinfo)
- def changeDocumentViewer(self,imageViewerUrl,title="",RESPONSE=None):
- """init document viewer"""
- self.title=title
- self.imageViewerUrl=imageViewerUrl
+ def getLink(self,param=None,val=None):
+     """Return the URL of the current request with one query parameter changed.
+
+     @param param: name of the query parameter to change (None: keep the query as is)
+     @param val: new value for param; None removes param from the query
+     @return: REQUEST['URL'] followed by "?" and the re-encoded query string
+     """
+     params=cgi.parse_qs(self.REQUEST['QUERY_STRING'])
+     if param is not None:
+         if val is None:
+             # val=None means "remove"; a parameter that is absent stays absent
+             # (this case used to store None and produce "param=None" in the link)
+             if params.has_key(param):
+                 del params[param]
+         else:
+             params[param] = val
- if RESPONSE is not None:
- RESPONSE.redirect('manage_main')
-
+     # parse_qs yields lists of values, hence doseq=True
+     url=self.REQUEST['URL']+"?"+urllib.urlencode(params, doseq=True)
+     return url
+
- def imageLink(self,nr):
- """link hinter den images"""
- paramsTmp=cgi.parse_qs(self.REQUEST['QUERY_STRING'])
- params={}
- for x in paramsTmp.iteritems():
- params[x[0]]=x[1][0]
-
- params['pn']=nr
- newUrl=self.REQUEST['URL']+"?"+urllib.urlencode(params)
- return newUrl
-
-
- def thumbruler(self,cols,rows,start,maximum):
- """ruler for thumbs"""
- ret=""
- paramsTmp=cgi.parse_qs(self.REQUEST['QUERY_STRING'])
- params={}
- for x in paramsTmp.iteritems():
-
- if not x[0]=="start":
- params[x[0]]=x[1][0]
-
- newUrlSelect=self.REQUEST['URL']+"?"+urllib.urlencode(params)
- if start>0:
- newStart=max(start-cols*rows,0)
- params['start']=newStart
- newUrl=self.REQUEST['URL']+"?"+urllib.urlencode(params)
- ret+="""prev"""%newUrl
-
-
- ret+=""""
+ def getStyle(self, idx, selected, style=""):
+     """Return style, with 'sel' appended when idx equals selected."""
+     if idx == selected:
+         return style + 'sel'
+     return style
- if startnext"""%newUrl
- return ret
+ def getParamFromDigilib(self,path,param):
+ """returns the text of the element //dir/<param> from digilib's dirInfo-xml.jsp for path
+
+ @param path: value passed as the fn parameter of dirInfo-xml.jsp
+ @param param: name of the child element of <dir> to read
+ @return: text of the first matching element; None if the document cannot be
+ fetched or parsed, or if no such element exists
+ """
+ imageUrl=self.digilibBaseUrl+"/dirInfo-xml.jsp?mo=dir&fn="+path
+
+ zLOG.LOG("documentViewer (getparamfromdigilib)", zLOG.INFO, "dirInfo (%s) from %s"%(param,imageUrl))
- def textToolThumb(self,url,start=0):
- """understands the texttool format
- @param url: url to index.meta with texttool tag
- """
- (viewerUrl,imagepath,textpath)=parseUrlTextTool(url)
+ # any failure while fetching or parsing is reported to the caller as None
+ try:
+ dom = NonvalidatingReader.parseUri(imageUrl)
+ except:
+ return None
- imageUrl=genericDigilib+"/servlet/Scaler?fn=%s"%imagepath[0]
+ params=dom.xpath("//dir/%s"%param)
+ zLOG.LOG("documentViewer (getparamfromdigilib)", zLOG.INFO, "dirInfo:%s"%params)
- pt=PageTemplateFile(os.path.join(package_home(globals()),'zpt','thumbs.zpt')).__of__(self)
- return pt(imageUrl=imageUrl,pt=imagepath[1],start=start)
+ # no match: fall through and return None implicitly
+ if params:
+ return getTextFromNode(params[0])
+
- def imagePathThumb(self,path,start=0):
- """path ist the path to the images it is assumes that the index.meta file is one level higher."""
+ def getBibinfoFromIndexMeta(self,path,docinfo=None,dom=None):
+ """gets bibliographical info from the index.meta file at path or given by dom
+
+ @param path: only used when dom is None: its last segment is dropped and
+ "/index.meta" is appended to locate the file
+ @param docinfo: dict to extend (a new dict is created if None)
+ @param dom: already parsed index.meta document; fetched through the Texter servlet if None
+ @return: docinfo, with 'author', 'title' and 'year' set when a mapping for the
+ bib type exists; returned as passed in if index.meta cannot be fetched or parsed
+ """
+ zLOG.LOG("documentViewer (getbibinfofromindexmeta)", zLOG.INFO,"path: %s"%(path))
- path=path.replace("/mpiwg/online","")
- pt=getParamFromDigilib(path,'pt')
- imageUrl=genericDigilib+"/servlet/Scaler?fn=%s"%path
-
- pageT=PageTemplateFile(os.path.join(package_home(globals()),'zpt','thumbs.zpt')).__of__(self)
- return pageT(imageUrl=imageUrl,pt=pt,start=start)
-
- def headerFromIndexMeta(self,path):
- """gibt header from index meta out"""
+ if docinfo is None:
+ docinfo = {}
+
+ if dom is None:
+ # NOTE(review): the server URL is hard-coded here rather than derived from self.digilibBaseUrl -- confirm this is intended
+ server="http://nausikaa.mpiwg-berlin.mpg.de/digitallibrary/servlet/Texter?fn="
+ path="/".join(path.split("/")[0:-1])
+ metaUrl=server+path+"/index.meta"
+ try:
+ dom = NonvalidatingReader.parseUri(metaUrl)
+ except:
+ return docinfo
metaData=self.metadata.main.meta.bib
- server="http://foxridge.mpiwg-berlin.mpg.de"
- path="/".join(path.split("/")[0:-1])
- metaUrl=server+path+"/index.meta"
-
- dom = NonvalidatingReader.parseUri(metaUrl)
- type=dom.xpath("//bib/@type")
- if type and (len(type)>0):
- type=type[0].value
+ # bib type from the document, "generic" if the attribute is missing
+ bibtype=dom.xpath("//bib/@type")
+ if bibtype and (len(bibtype)>0):
+ bibtype=bibtype[0].value
else:
- type="generic"
- type=type.replace("-"," ")# wrong typesiin index meta "-" instead of " "
- hash=metaData.generateMappingForType(type)
-
- author=getTextFromNode(dom.xpath("//bib/%s"%hash['author'][0])[0])
- title=getTextFromNode(dom.xpath("//bib/%s"%hash['title'][0])[0])
- year=getTextFromNode(dom.xpath("//bib/%s"%hash['year'][0])[0])
-
- return author,title,year
-
+ bibtype="generic"
+ bibtype=bibtype.replace("-"," ") # types in index.meta use "-" instead of " " (not wrong! ROC)
+ bibmap=metaData.generateMappingForType(bibtype)
+ if len(bibmap) > 0:
+ # NOTE(review): each xpath result is indexed with [0]; an index.meta lacking one
+ # of these elements would presumably raise IndexError here -- confirm
+ docinfo['author']=getTextFromNode(dom.xpath("//bib/%s"%bibmap['author'][0])[0])
+ docinfo['title']=getTextFromNode(dom.xpath("//bib/%s"%bibmap['title'][0])[0])
+ docinfo['year']=getTextFromNode(dom.xpath("//bib/%s"%bibmap['year'][0])[0])
+
+ return docinfo
+
+
+ def getDocinfoFromTextTool(self,url,docinfo=None):
+     """Fill docinfo from the texttool section of an index.meta file.
+
+     @param url: url of the index.meta file
+     @param docinfo: dict to extend (a new dict is created if None)
+     @return: docinfo; depending on what the file contains it gains the keys
+              'imagePath', 'numPages', 'imageURL' and 'textURL', plus whatever
+              getBibinfoFromIndexMeta adds. Returned as passed in if the file
+              cannot be fetched or parsed.
+     """
+     zLOG.LOG("documentViewer (getdocinfofromtexttool)", zLOG.INFO,"url: %s"%(url))
+     if docinfo is None:
+         docinfo = {}
+
+     try:
+         dom = NonvalidatingReader.parseUri(url)
+     except:
+         # best effort: log the problem and hand back what we have so far
+         zLOG.LOG("documentViewer (parseUrlTexttool)", zLOG.INFO,"%s (%s)"%sys.exc_info()[0:2])
+         return docinfo
+
+     archivePath=None
+     archivePaths=dom.xpath("//resource/archive-path")
+     if archivePaths:
+         archivePath=getTextFromNode(archivePaths[0])
+
+     image=None
+     images=dom.xpath("//texttool/image")
+     if images:
+         image=getTextFromNode(images[0])
+
+     # the image directory is only known when both parts are present
+     if image and archivePath:
+         image=os.path.join(archivePath,image)
+         image=image.replace("/mpiwg/online",'')
+         pt=self.getParamFromDigilib(image,'size')
+         docinfo['imagePath'] = image
+         docinfo['numPages'] = pt
+
+     viewerUrls=dom.xpath("//texttool/digiliburlprefix")
+     if viewerUrls:
+         # previously assigned the undefined name "viewerURL" (NameError)
+         viewerUrl=getTextFromNode(viewerUrls[0])
+         docinfo['imageURL'] = viewerUrl
+
+     textUrls=dom.xpath("//texttool/text")
+     if textUrls:
+         # previously assigned the undefined name "textURL" (NameError)
+         textUrl=getTextFromNode(textUrls[0])
+         docinfo['textURL'] = textUrl
+
+     # the bibliographical data lives in the same document, so pass the dom along
+     docinfo = self.getBibinfoFromIndexMeta(url,docinfo=docinfo,dom=dom)
+     return docinfo
+
+
+ def getDocinfoFromImagePath(self,path,docinfo=None):
+     """Build docinfo for a directory of images.
+
+     path is the path to the images; the index.meta file is assumed to be one
+     level higher.
+
+     @param path: path to the image directory (a "/mpiwg/online" part is removed)
+     @param docinfo: dict to extend (a new dict is created if None)
+     @return: docinfo with 'imagePath', 'numPages' and 'imageURL' set, extended
+              by getBibinfoFromIndexMeta
+     """
+     zLOG.LOG("documentViewer (getdocinfofromimagepath)", zLOG.INFO,"path: %s"%(path))
+     if docinfo is None:
+         docinfo = {}
+     imgPath = path.replace("/mpiwg/online","")
+     docinfo['imagePath'] = imgPath
+     # digilib reports the number of images in the directory as 'size'
+     docinfo['numPages'] = self.getParamFromDigilib(imgPath,'size')
+     docinfo['imageURL'] = self.digilibBaseUrl+"/servlet/Scaler?fn=%s"%imgPath
+
+     return self.getBibinfoFromIndexMeta(imgPath,docinfo=docinfo)
+
+
+ def getDocinfo(self, mode, url):
+     """Return the docinfo dict for url, built according to mode.
+
+     A docinfo stored in the session is reused when its 'mode' and 'url' match;
+     otherwise a new one is built and stored in the session.
+
+     @param mode: "texttool" (url points to an index.meta with texttool
+                  information) or "imagepath"; other values are logged as errors
+     @param url: url or path of the document
+     @return: docinfo dict containing at least 'mode' and 'url'
+     """
+     zLOG.LOG("documentViewer (getdocinfo)", zLOG.INFO,"mode: %s, url: %s"%(mode,url))
+     session = self.REQUEST.SESSION
+     # a cached docinfo is only good if it describes the same document
+     if session.has_key('docinfo'):
+         cached = session['docinfo']
+         if cached is not None and cached.get('mode') == mode and cached.get('url') == url:
+             zLOG.LOG("documentViewer (getdocinfo)", zLOG.INFO,"docinfo in session: %s"%cached)
+             return cached
+     # nothing usable cached: start a fresh docinfo
+     docinfo = {'mode': mode, 'url': url}
+     if mode=="imagepath":
+         docinfo = self.getDocinfoFromImagePath(url, docinfo=docinfo)
+     elif mode=="texttool": #index.meta with texttool information
+         docinfo = self.getDocinfoFromTextTool(url, docinfo=docinfo)
+     else:
+         zLOG.LOG("documentViewer (getdocinfo)", zLOG.ERROR,"unknown mode!")
+     zLOG.LOG("documentViewer (getdocinfo)", zLOG.INFO,"docinfo: %s"%docinfo)
+     session['docinfo'] = docinfo
+     return docinfo
+
+
+ def getPageinfo(self, current, start=None, rows=None, cols=None, docinfo=None):
+     """Return a dict describing the thumbnail paging state.
+
+     @param current: number of the current page (anything getInt cannot
+                     convert counts as 0)
+     @param start: first page of the displayed thumbnail group; if missing or
+                   not a number, the start of the group containing current is used
+     @param rows: thumbnail rows (default: self.thumbrows)
+     @param cols: thumbnail columns (default: self.thumbcols)
+     @param docinfo: docinfo dict; its 'numPages' limits 'end' and yields 'numgroups'
+     @return: dict with the keys 'current', 'rows', 'cols', 'groupsize', 'start',
+              'end' and, if docinfo is given, 'numgroups'
+     """
+     pageinfo = {}
+     current = getInt(current)
+     pageinfo['current'] = current
+     rows = int(rows or self.thumbrows)
+     pageinfo['rows'] = rows
+     cols = int(cols or self.thumbcols)
+     pageinfo['cols'] = cols
+     grpsize = cols * rows
+     pageinfo['groupsize'] = grpsize
+     # groups are 1..grpsize, grpsize+1..2*grpsize, ...; the former default
+     # int(current / grpsize) * grpsize + 1 put the last page of every group
+     # (current == k*grpsize) into the following group
+     groupStart = ((max(current, 1) - 1) // grpsize) * grpsize + 1
+     start = getInt(start, default=groupStart)
+     pageinfo['start'] = start
+     # NOTE(review): whether 'end' is meant to be inclusive is not visible here -- confirm against the templates
+     pageinfo['end'] = start + grpsize
+     if docinfo is not None:
+         np = int(docinfo['numPages'])
+         pageinfo['end'] = min(pageinfo['end'], np)
+         # number of groups, counting a trailing partial group as one
+         pageinfo['numgroups'] = np // grpsize
+         if np % grpsize > 0:
+             pageinfo['numgroups'] += 1
+
+     return pageinfo
+
def text(self,mode,url,pn):
"""give text"""
if mode=="texttool": #index.meta with texttool information
@@ -279,51 +345,36 @@ class documentViewer(ZopePageTemplate):
# PrettyPrint(x)
#
# return list
-#
- def image(self,mode,url,pn):
- """give image out"""
- if mode=="texttool": #index.meta with texttool information
- (viewerUrl,imagepath,textpath)=parseUrlTextTool(url)
- if not viewerUrl:
- viewerUrl=self.imageViewerUrl
- url=viewerUrl+"pn=%s&fn=%s"%(pn,imagepath[0])
- ret=""""""%url
- return url
- elif mode=="imagepath":
- url=url.replace("/mpiwg/online","")
- url=self.imageViewerUrl+"pn=%s&fn=%s"%(pn,url)
- ret=""""""%url
- return url
-
-
- def thumbs(self,mode,url,start):
- """give thumbs out"""
- if mode=="texttool": #index.meta with texttool information
- return self.textToolThumb(url,int(start))
- elif mode=="imagepath":
- return self.imagePathThumb(url,int(start))
-
- security.declareProtected('View','index_html')
-
+#
+
+ def findDigilibUrl(self):
+     """Ask the image viewer (zogilib) for its scaler URL and derive the digilib URL.
+
+     @return: the text served at imageViewerUrl (without its last character)
+              plus "/getScalerUrl", with "/servlet/Scaler?" removed; None if
+              anything goes wrong
+     """
+     scalerQuery = self.imageViewerUrl[:-1] + "/getScalerUrl"
+     try:
+         return urlopen(scalerQuery).read().replace("/servlet/Scaler?", "")
+     except:
+         return None
- def index_html(self,mode,url,start=0,pn=1):
- '''
- view it
- @param mode: defines which type of document is behind url
- @param url: url which contains display information
- '''
+ def changeDocumentViewer(self,imageViewerUrl,title="",digilibBaseUrl=None,thumbrows=2,thumbcols=10,RESPONSE=None):
+     """Store new configuration values; redirect to manage_main if RESPONSE is given.
+
+     NOTE(review): the thumbrows/thumbcols defaults here (2/10) are the reverse
+     of those in __init__ (thumbrows=10, thumbcols=2) -- confirm which is intended.
+     """
+     self.imageViewerUrl=imageViewerUrl
+     self.digilibBaseUrl = digilibBaseUrl
+     self.title=title
+     self.thumbcols = thumbcols
+     self.thumbrows = thumbrows
+     if RESPONSE is None:
+         return
+     RESPONSE.redirect('manage_main')
+
- pt=PageTemplateFile(os.path.join(package_home(globals()),'zpt','documentViewer_template.zpt')).__of__(self)
- return pt(mode=mode,url=url,start=start,pn=pn)
-
# security.declareProtected('View management screens','renameImageForm')
def manage_AddDocumentViewerForm(self):
"""add the viewer form"""
- pt=PageTemplateFile(os.path.join(package_home(globals()),'zpt','addDocumentViewer.zpt')).__of__(self)
+ # __of__(self) wraps the template in the context of self before it is rendered
+ pt=PageTemplateFile('zpt/addDocumentViewer', globals()).__of__(self)
return pt()
def manage_AddDocumentViewer(self,id,imageViewerUrl="",title="",RESPONSE=None):
@@ -333,4 +384,38 @@ def manage_AddDocumentViewer(self,id,ima
if RESPONSE is not None:
RESPONSE.redirect('manage_main')
+
+
+##
+## DocumentViewerTemplate class
+##
+class DocumentViewerTemplate(ZopePageTemplate):
+    """ZopePageTemplate subclass with its own meta_type, used for viewer templates."""
+    meta_type="DocumentViewer Template"
+
+
+def manage_addDocumentViewerTemplateForm(self):
+    """Render the form for adding a DocumentViewerTemplate."""
+    addForm = PageTemplateFile('zpt/addDocumentViewerTemplate', globals())
+    return addForm.__of__(self)()
+
+def manage_addDocumentViewerTemplate(self, id='viewer_main', title=None, text=None,
+                                     REQUEST=None, submit=None):
+    """Add a DocumentViewerTemplate initialised from zpt/viewer_main.zpt.
+
+    @param id: id of the new template object
+    @param title: optional title for the new template
+    @param text: accepted but not used; the content always comes from the
+                 packaged viewer_main.zpt
+    @param REQUEST: if given, its response is redirected to the new object's
+                    manage_main
+    @param submit: not used
+    @return: empty string
+    """
+    self._setObject(id, DocumentViewerTemplate(id))
+    ob = getattr(self, id)
+    # read the packaged template and close the file explicitly instead of
+    # leaving the handle to the garbage collector
+    templateFile = open(os.path.join(package_home(globals()),'zpt/viewer_main.zpt'))
+    try:
+        templateText = templateFile.read()
+    finally:
+        templateFile.close()
+    ob.pt_edit(templateText,None)
+    if title:
+        ob.pt_setTitle(title)
+    if REQUEST is None:
+        # called from code rather than through the web: nothing to redirect
+        return ''
+    try:
+        u = self.DestinationURL()
+    except AttributeError:
+        u = REQUEST['URL1']
+
+    u = "%s/%s" % (u, urllib.quote(id))
+    REQUEST.RESPONSE.redirect(u+'/manage_main')
+    return ''
+
+
\ No newline at end of file