documentViewer/documentViewer.py - diff

Return to documentViewer.py CVS log

Up to [Repository] / documentViewer

Diff for /documentViewer/documentViewer.py between versions 1.26 and 1.35

version 1.26, 2007/05/04 13:17:02	version 1.35, 2008/11/04 20:23:49
Line 18 import sys	Line 18 import sys
import cgi	import cgi
import urllib	import urllib
import logging	import logging
	import math

import urlparse	import urlparse

Line 31 def getInt(number, default=0):	Line 32 def getInt(number, default=0):
try:	try:
return int(number)	return int(number)
except:	except:
return default	return int(default)

def getTextFromNode(nodename):	def getTextFromNode(nodename):
"""get the cdata content of a node"""	"""get the cdata content of a node"""
Line 82 class documentViewer(Folder):	Line 83 class documentViewer(Folder):
docuviewer_css = PageTemplateFile('css/docuviewer.css', globals())	docuviewer_css = PageTemplateFile('css/docuviewer.css', globals())
info_xml = PageTemplateFile('zpt/info_xml', globals())	info_xml = PageTemplateFile('zpt/info_xml', globals())

	thumbs_main_rss = PageTemplateFile('zpt/thumbs_main_rss', globals())
security.declareProtected('View management screens','changeDocumentViewerForm')	security.declareProtected('View management screens','changeDocumentViewerForm')
changeDocumentViewerForm = PageTemplateFile('zpt/changeDocumentViewer', globals())	changeDocumentViewerForm = PageTemplateFile('zpt/changeDocumentViewer', globals())

Line 105 class documentViewer(Folder):	Line 107 class documentViewer(Folder):
self.manage_addFolder('template')	self.manage_addFolder('template')


	security.declareProtected('View','thumbs_rss')
	def thumbs_rss(self,mode,url,viewMode="auto",start=None,pn=1):
	'''
	view it
	@param mode: defines how to access the document behind url
	@param url: url which contains display information
	@param viewMode: if images display images, if text display text, default is images (text,images or auto)

	'''
	logging.info("HHHHHHHHHHHHHH:load the rss")
	logger("documentViewer (index)", logging.INFO, "mode: %s url:%s start:%s pn:%s"%(mode,url,start,pn))

	if not hasattr(self, 'template'):
	# create template folder if it doesn't exist
	self.manage_addFolder('template')

	if not self.digilibBaseUrl:
	self.digilibBaseUrl = self.findDigilibUrl() or "http://nausikaa.mpiwg-berlin.mpg.de/digitallibrary"

	docinfo = self.getDocinfo(mode=mode,url=url)
	pageinfo = self.getPageinfo(start=start,current=pn,docinfo=docinfo)
	pt = getattr(self.template, 'thumbs_main_rss')

	if viewMode=="auto": # automodus gewaehlt
	if docinfo.get("textURL",'') and self.textViewerUrl: #texturl gesetzt und textViewer konfiguriert
	viewMode="text"
	else:
	viewMode="images"

	return pt(docinfo=docinfo,pageinfo=pageinfo,viewMode=viewMode)

security.declareProtected('View','index_html')	security.declareProtected('View','index_html')
def index_html(self,mode,url,viewMode="auto",start=None,pn=1):	def index_html(self,mode,url,viewMode="auto",start=None,pn=1):
'''	'''
Line 152 class documentViewer(Folder):	Line 185 class documentViewer(Folder):
url=self.REQUEST['URL1']+"?"+ps	url=self.REQUEST['URL1']+"?"+ps
return url	return url

	def getLinkAmp(self,param=None,val=None):
	"""link to documentviewer with parameter param set to val"""
	params=self.REQUEST.form.copy()
	if param is not None:
	if val is None:
	if params.has_key(param):
	del params[param]
	else:
	params[param] = str(val)

	# quote values and assemble into query string
	logging.info("XYXXXXX: %s"%repr(params.items()))
	ps = "&".join(["%s=%s"%(k,urllib.quote(v)) for (k, v) in params.items()])
	url=self.REQUEST['URL1']+"?"+ps
	return url
def getInfo_xml(self,url,mode):	def getInfo_xml(self,url,mode):
"""returns info about the document as XML"""	"""returns info about the document as XML"""

Line 193 class documentViewer(Folder):	Line 240 class documentViewer(Folder):
return False	return False


def getDirinfoFromDigilib(self,path,docinfo=None):	def getDirinfoFromDigilib(self,path,docinfo=None,cut=0):
"""gibt param von dlInfo aus"""	"""gibt param von dlInfo aus"""
num_retries = 3	num_retries = 3
if docinfo is None:	if docinfo is None:
docinfo = {}	docinfo = {}

	for x in range(cut):
	path=getParentDir(path)
infoUrl=self.digilibBaseUrl+"/dirInfo-xml.jsp?mo=dir&fn="+path	infoUrl=self.digilibBaseUrl+"/dirInfo-xml.jsp?mo=dir&fn="+path

logger("documentViewer (getparamfromdigilib)", logging.INFO, "dirInfo from %s"%(infoUrl))	logger("documentViewer (getparamfromdigilib)", logging.INFO, "dirInfo from %s"%(infoUrl))
Line 285 class documentViewer(Folder):	Line 334 class documentViewer(Folder):
return dom	return dom


def getAuthinfoFromIndexMeta(self,path,docinfo=None,dom=None):	def getAuthinfoFromIndexMeta(self,path,docinfo=None,dom=None,cut=0):
"""gets authorization info from the index.meta file at path or given by dom"""	"""gets authorization info from the index.meta file at path or given by dom"""
logger("documentViewer (getauthinfofromindexmeta)", logging.INFO,"path: %s"%(path))	logger("documentViewer (getauthinfofromindexmeta)", logging.INFO,"path: %s"%(path))

Line 295 class documentViewer(Folder):	Line 344 class documentViewer(Folder):
docinfo = {}	docinfo = {}

if dom is None:	if dom is None:
dom = self.getIndexMeta(getParentDir(path))	for x in range(cut+1):
	path=getParentDir(path)
	dom = self.getIndexMeta(path)

acctype = dom.xpath("//access-conditions/access/@type")	acctype = dom.xpath("//access-conditions/access/@type")
if acctype and (len(acctype)>0):	if acctype and (len(acctype)>0):
Line 307 class documentViewer(Folder):	Line 358 class documentViewer(Folder):
return docinfo	return docinfo


def getBibinfoFromIndexMeta(self,path,docinfo=None,dom=None):	def getBibinfoFromIndexMeta(self,path,docinfo=None,dom=None,cut=0):
"""gets bibliographical info from the index.meta file at path or given by dom"""	"""gets bibliographical info from the index.meta file at path or given by dom"""
logger("documentViewer (getbibinfofromindexmeta)", logging.INFO,"path: %s"%(path))	logging.debug("documentViewer (getbibinfofromindexmeta) path: %s"%(path))

if docinfo is None:	if docinfo is None:
docinfo = {}	docinfo = {}

if dom is None:	if dom is None:
dom = self.getIndexMeta(getParentDir(path))	for x in range(cut+1):
	path=getParentDir(path)
	dom = self.getIndexMeta(path)

	# put in all raw bib fields as dict "bib"
	bib = dom.xpath("//bib/*")
	if bib and len(bib)>0:
	bibinfo = {}
	for e in bib:
	bibinfo[e.localName] = getTextFromNode(e)
	docinfo['bib'] = bibinfo

	# extract some fields (author, title, year) according to their mapping
metaData=self.metadata.main.meta.bib	metaData=self.metadata.main.meta.bib
bibtype=dom.xpath("//bib/@type")	bibtype=dom.xpath("//bib/@type")
if bibtype and (len(bibtype)>0):	if bibtype and (len(bibtype)>0):
bibtype=bibtype[0].value	bibtype=bibtype[0].value
else:	else:
bibtype="generic"	bibtype="generic"

bibtype=bibtype.replace("-"," ") # wrong typesiin index meta "-" instead of " " (not wrong! ROC)	bibtype=bibtype.replace("-"," ") # wrong typesiin index meta "-" instead of " " (not wrong! ROC)
	docinfo['bib_type'] = bibtype
bibmap=metaData.generateMappingForType(bibtype)	bibmap=metaData.generateMappingForType(bibtype)
#print "bibmap: ", bibmap, " for: ", bibtype
# if there is no mapping bibmap is empty (mapping sometimes has empty fields)	# if there is no mapping bibmap is empty (mapping sometimes has empty fields)
if len(bibmap) > 0 and len(bibmap['author'][0]) > 0:	if len(bibmap) > 0 and len(bibmap['author'][0]) > 0:
	try:
docinfo['author']=getTextFromNode(dom.xpath("//bib/%s"%bibmap['author'][0])[0])	docinfo['author']=getTextFromNode(dom.xpath("//bib/%s"%bibmap['author'][0])[0])
	except: pass
	try:
docinfo['title']=getTextFromNode(dom.xpath("//bib/%s"%bibmap['title'][0])[0])	docinfo['title']=getTextFromNode(dom.xpath("//bib/%s"%bibmap['title'][0])[0])
	except: pass
	try:
docinfo['year']=getTextFromNode(dom.xpath("//bib/%s"%bibmap['year'][0])[0])	docinfo['year']=getTextFromNode(dom.xpath("//bib/%s"%bibmap['year'][0])[0])
	except: pass
logging.info("bla")	logging.debug("documentViewer (getbibinfofromindexmeta) using mapping for %s"%bibtype)
try:	try:
docinfo['lang']=getTextFromNode(dom.xpath("//bib/lang")[0])	docinfo['lang']=getTextFromNode(dom.xpath("//bib/lang")[0])
except:	except:
docinfo['lang']=''	docinfo['lang']=''

return docinfo	return docinfo


Line 408 class documentViewer(Folder):	Line 477 class documentViewer(Folder):
textUrl=getTextFromNode(textUrls[0])	textUrl=getTextFromNode(textUrls[0])
if urlparse.urlparse(textUrl)[0]=="": #keine url	if urlparse.urlparse(textUrl)[0]=="": #keine url
textUrl=os.path.join(archivePath,textUrl)	textUrl=os.path.join(archivePath,textUrl)
	# fix URLs starting with /mpiwg/online
	if textUrl.startswith("/mpiwg/online"):
	textUrl = textUrl.replace("/mpiwg/online",'',1)

docinfo['textURL'] = textUrl	docinfo['textURL'] = textUrl

Line 415 class documentViewer(Folder):	Line 487 class documentViewer(Folder):
docinfo = self.getBibinfoFromIndexMeta(url,docinfo=docinfo,dom=dom) # get info von bib tag	docinfo = self.getBibinfoFromIndexMeta(url,docinfo=docinfo,dom=dom) # get info von bib tag

if presentationUrls and (len(presentationUrls)>0): # ueberschreibe diese durch presentation informationen	if presentationUrls and (len(presentationUrls)>0): # ueberschreibe diese durch presentation informationen
# presentation url ergiebt sich ersetzen von index.meta in der url der f�r die Metadaten	# presentation url ergiebt sich ersetzen von index.meta in der url der fuer die Metadaten
# durch den relativen Pfad auf die presentation infos	# durch den relativen Pfad auf die presentation infos
presentationUrl=url.replace('index.meta',getTextFromNode(presentationUrls[0]))	presentationUrl=url.replace('index.meta',getTextFromNode(presentationUrls[0]))
docinfo = self.getBibinfoFromTextToolPresentation(presentationUrl,docinfo=docinfo,dom=dom)	docinfo = self.getBibinfoFromTextToolPresentation(presentationUrl,docinfo=docinfo,dom=dom)
Line 428 class documentViewer(Folder):	Line 500 class documentViewer(Folder):
"""gets the bibliographical information from the preseantion entry in texttools	"""gets the bibliographical information from the preseantion entry in texttools
"""	"""
dom=self.getPresentationInfoXML(url)	dom=self.getPresentationInfoXML(url)
	try:
docinfo['author']=getTextFromNode(dom.xpath("//author")[0])	docinfo['author']=getTextFromNode(dom.xpath("//author")[0])
	except:
	pass
	try:
docinfo['title']=getTextFromNode(dom.xpath("//title")[0])	docinfo['title']=getTextFromNode(dom.xpath("//title")[0])
	except:
	pass
	try:
docinfo['year']=getTextFromNode(dom.xpath("//date")[0])	docinfo['year']=getTextFromNode(dom.xpath("//date")[0])
	except:
	pass
return docinfo	return docinfo

def getDocinfoFromImagePath(self,path,docinfo=None):	def getDocinfoFromImagePath(self,path,docinfo=None,cut=0):
"""path ist the path to the images it assumes that the index.meta file is one level higher."""	"""path ist the path to the images it assumes that the index.meta file is one level higher."""
logger("documentViewer (getdocinfofromimagepath)", logging.INFO,"path: %s"%(path))	logger("documentViewer (getdocinfofromimagepath)", logging.INFO,"path: %s"%(path))
if docinfo is None:	if docinfo is None:
docinfo = {}	docinfo = {}
path=path.replace("/mpiwg/online","")	path=path.replace("/mpiwg/online","")
docinfo['imagePath'] = path	docinfo['imagePath'] = path
docinfo=self.getDirinfoFromDigilib(path,docinfo=docinfo)	docinfo=self.getDirinfoFromDigilib(path,docinfo=docinfo,cut=cut)
imageUrl=self.digilibBaseUrl+"/servlet/Scaler?fn="+path	imageUrl=self.digilibBaseUrl+"/servlet/Scaler?fn="+path
docinfo['imageURL'] = imageUrl	docinfo['imageURL'] = imageUrl

docinfo = self.getBibinfoFromIndexMeta(path,docinfo=docinfo)	docinfo = self.getBibinfoFromIndexMeta(path,docinfo=docinfo,cut=cut)
docinfo = self.getAuthinfoFromIndexMeta(path,docinfo=docinfo)	docinfo = self.getAuthinfoFromIndexMeta(path,docinfo=docinfo,cut=cut)
return docinfo	return docinfo


Line 465 class documentViewer(Folder):	Line 546 class documentViewer(Folder):
docinfo = self.getDocinfoFromTextTool(url, docinfo=docinfo)	docinfo = self.getDocinfoFromTextTool(url, docinfo=docinfo)
elif mode=="imagepath":	elif mode=="imagepath":
docinfo = self.getDocinfoFromImagePath(url, docinfo=docinfo)	docinfo = self.getDocinfoFromImagePath(url, docinfo=docinfo)
	elif mode=="filepath":
	docinfo = self.getDocinfoFromImagePath(url, docinfo=docinfo,cut=2)
else:	else:
logger("documentViewer (getdocinfo)", logging.ERROR,"unknown mode!")	logger("documentViewer (getdocinfo)", logging.ERROR,"unknown mode!")
raise ValueError("Unknown mode %s"%(mode))	raise ValueError("Unknown mode %s"%(mode))
Line 485 class documentViewer(Folder):	Line 568 class documentViewer(Folder):
pageinfo['cols'] = cols	pageinfo['cols'] = cols
grpsize = cols * rows	grpsize = cols * rows
pageinfo['groupsize'] = grpsize	pageinfo['groupsize'] = grpsize
start = getInt(start, default=(int(current / grpsize) * grpsize +1))	start = getInt(start, default=(math.ceil(float(current)/float(grpsize))*grpsize-(grpsize-1)))
	# int(current / grpsize) * grpsize +1))
pageinfo['start'] = start	pageinfo['start'] = start
pageinfo['end'] = start + grpsize	pageinfo['end'] = start + grpsize
if docinfo is not None:	if docinfo is not None:

FreeBSD-CVSweb <freebsd-cvsweb@FreeBSD.org>

Removed from v.1.26
changed lines
	Added in v.1.35