documentViewer: documentViewer.py comparison

comparison documentViewer.py @ 166:ffb5c62bd459

characterNormalization

author	abukhman
date	Tue, 24 Aug 2010 14:34:32 +0200
parents	820a2a4b23c3
children	7e2b97941a66

comparison

equal deleted inserted replaced

-:820a2a4b23c3
+:ffb5c62bd459
 response = None
 errmsg = None
 for cnt in range(num_tries):
 try:
-logging.debug("getHttpData(#%s %ss) url=%s"%(cnt+1,timeout,url))
+#logging.debug("getHttpData(#%s %ss) url=%s"%(cnt+1,timeout,url))
 if sys.version_info < (2, 6):
 # set timeout on socket -- ugly :-(
 import socket
 socket.setdefaulttimeout(float(timeout))
 response = urllib2.urlopen(url)
 else:
 response = urllib2.urlopen(url,timeout=float(timeout))
 # check result?
 break
 except urllib2.HTTPError, e:
-logging.error("getHttpData: HTTP error(%s): %s"%(e.code,e))
+#logging.error("getHttpData: HTTP error(%s): %s"%(e.code,e))
 errmsg = str(e)
 # stop trying
 break
 except urllib2.URLError, e:
-logging.error("getHttpData: URLLIB error(%s): %s"%(e.reason,e))
+#logging.error("getHttpData: URLLIB error(%s): %s"%(e.reason,e))
 errmsg = str(e)
 # stop trying
 #break
 if response is not None:
 @param mode: defines how to access the document behind url
 @param url: url which contains display information
 @param viewMode: if images display images, if text display text, default is images (text,images or auto)
 '''
-logging.debug("HHHHHHHHHHHHHH:load the rss")
+#logging.debug("HHHHHHHHHHHHHH:load the rss")
-logger("documentViewer (index)", logging.INFO, "mode: %s url:%s start:%s pn:%s"%(mode,url,start,pn))
+#logger("documentViewer (index)", logging.INFO, "mode: %s url:%s start:%s pn:%s"%(mode,url,start,pn))
 if not hasattr(self, 'template'):
 # create template folder if it doesn't exist
 self.manage_addFolder('template')
 @param tocMode: type of 'table of contents' for navigation (thumbs, text, figures, none)
 @param characterNormalization type of text display (reg, norm, none)
 @param querySearch: type of different search modes (fulltext, fulltextMorph, xpath, xquery, ftIndex, ftIndexMorph, fulltextMorphLemma)
 '''
-logging.debug("documentViewer (index) mode: %s url:%s start:%s pn:%s"%(mode,url,start,pn))
+#logging.debug("documentViewer (index) mode: %s url:%s start:%s pn:%s"%(mode,url,start,pn))
 if not hasattr(self, 'template'):
 # this won't work
 logging.error("template folder missing!")
 return "ERROR: template folder missing!"
 del params[param]
 else:
 params[param] = str(val)
 # quote values and assemble into query string
-logging.debug("XYXXXXX: %s"%repr(params.items()))
+#logging.debug("XYXXXXX: %s"%repr(params.items()))
 ps = "&amp;".join(["%s=%s"%(k,urllib.quote(v)) for (k, v) in params.items()])
 url=self.REQUEST['URL1']+"?"+ps
 return url
 def getInfo_xml(self,url,mode):
 def isAccessible(self, docinfo):
 """returns if access to the resource is granted"""
 access = docinfo.get('accessType', None)
-logging.debug("documentViewer (accessOK) access type %s"%access)
+#logging.debug("documentViewer (accessOK) access type %s"%access)
 if access is not None and access == 'free':
-logging.debug("documentViewer (accessOK) access is free")
+#logging.debug("documentViewer (accessOK) access is free")
 return True
 elif access is None or access in self.authgroups:
 # only local access -- only logged in users
 user = getSecurityManager().getUser()
-logging.debug("documentViewer (accessOK) user=%s ip=%s"%(user,self.REQUEST.getClientAddr()))
+#logging.debug("documentViewer (accessOK) user=%s ip=%s"%(user,self.REQUEST.getClientAddr()))
 if user is not None:
 #print "user: ", user
 return (user.getUserName() != "Anonymous User")
 else:
 return False
-logging.error("documentViewer (accessOK) unknown access type %s"%access)
+#logging.error("documentViewer (accessOK) unknown access type %s"%access)
 return False
 def getDirinfoFromDigilib(self,path,docinfo=None,cut=0):
 """gibt param von dlInfo aus"""
 path=getParentDir(path)
 infoUrl=self.digilibBaseUrl+"/dirInfo-xml.jsp?mo=dir&fn="+path
-logging.debug("documentViewer (getparamfromdigilib) dirInfo from %s"%(infoUrl))
+#logging.debug("documentViewer (getparamfromdigilib) dirInfo from %s"%(infoUrl))
 txt = getHttpData(infoUrl)
 if txt is None:
 raise IOError("Unable to get dir-info from %s"%(infoUrl))
 dom = Parse(txt)
 sizes=dom.xpath("//dir/size")
-logging.debug("documentViewer (getparamfromdigilib) dirInfo:size"%sizes)
+#logging.debug("documentViewer (getparamfromdigilib) dirInfo:size"%sizes)
 if sizes:
 docinfo['numPages'] = int(getTextFromNode(sizes[0]))
 else:
 docinfo['numPages'] = 0
 server=self.digilibBaseUrl+"/servlet/Texter?fn="
 metaUrl=server+url.replace("/mpiwg/online","")
 if not metaUrl.endswith("index.meta"):
 metaUrl += "/index.meta"
-logging.debug("(getIndexMeta): METAURL: %s"%metaUrl)
+#logging.debug("(getIndexMeta): METAURL: %s"%metaUrl)
 txt=getHttpData(metaUrl)
 if txt is None:
 raise IOError("Unable to read index meta from %s"%(url))
 dom = Parse(txt)
 return dom
 def getAuthinfoFromIndexMeta(self,path,docinfo=None,dom=None,cut=0):
 """gets authorization info from the index.meta file at path or given by dom"""
-logging.debug("documentViewer (getauthinfofromindexmeta) path: %s"%(path))
+#logging.debug("documentViewer (getauthinfofromindexmeta) path: %s"%(path))
 access = None
 if docinfo is None:
 docinfo = {}
 return docinfo
 def getBibinfoFromIndexMeta(self,path,docinfo=None,dom=None,cut=0):
 """gets bibliographical info from the index.meta file at path or given by dom"""
-logging.debug("documentViewer (getbibinfofromindexmeta) path: %s"%(path))
+#logging.debug("documentViewer (getbibinfofromindexmeta) path: %s"%(path))
 if docinfo is None:
 docinfo = {}
 if dom is None:
 for x in range(cut):
 path=getParentDir(path)
 dom = self.getIndexMeta(path)
-logging.debug("documentViewer (getbibinfofromindexmeta cutted) path: %s"%(path))
+#logging.debug("documentViewer (getbibinfofromindexmeta cutted) path: %s"%(path))
 # put in all raw bib fields as dict "bib"
 bib = dom.xpath("//bib/*")
 if bib and len(bib)>0:
 bibinfo = {}
 for e in bib:
 docinfo['title']=getTextFromNode(dom.xpath("//bib/%s"%bibmap['title'][0])[0])
 except: pass
 try:
 docinfo['year']=getTextFromNode(dom.xpath("//bib/%s"%bibmap['year'][0])[0])
 except: pass
-logging.debug("documentViewer (getbibinfofromindexmeta) using mapping for %s"%bibtype)
+#logging.debug("documentViewer (getbibinfofromindexmeta) using mapping for %s"%bibtype)
 try:
 docinfo['lang']=getTextFromNode(dom.xpath("//bib/lang")[0])
 except:
 docinfo['lang']=''
 return docinfo
 def getDocinfoFromTextTool(self, url, dom=None, docinfo=None):
 """parse texttool tag in index meta"""
-logging.debug("documentViewer (getdocinfofromtexttool) url: %s" % (url))
+#logging.debug("documentViewer (getdocinfofromtexttool) url: %s" % (url))
 if docinfo is None:
 docinfo = {}
 if docinfo.get('lang', None) is None:
 docinfo['lang'] = '' # default keine Sprache gesetzt
 if dom is None:
 archivePath = '/' + archivePath
 if archiveName and (not archivePath.endswith(archiveName)):
 archivePath += "/" + archiveName
 else:
 # try to get archive-path from url
-logging.warning("documentViewer (getdocinfofromtexttool) resource/archive-path missing in: %s" % (url))
+#logging.warning("documentViewer (getdocinfofromtexttool) resource/archive-path missing in: %s" % (url))
 if (not url.startswith('http')):
 archivePath = url.replace('index.meta', '')
 if archivePath is None:
 # we balk without archive-path
 pass
 return docinfo
 def getDocinfoFromImagePath(self,path,docinfo=None,cut=0):
 """path ist the path to the images it assumes that the index.meta file is one level higher."""
-logging.debug("documentViewer (getdocinfofromimagepath) path: %s"%(path))
+#logging.debug("documentViewer (getdocinfofromimagepath) path: %s"%(path))
 if docinfo is None:
 docinfo = {}
 path=path.replace("/mpiwg/online","")
 docinfo['imagePath'] = path
 docinfo=self.getDirinfoFromDigilib(path,docinfo=docinfo,cut=cut)
 pathorig=path
 for x in range(cut):
 path=getParentDir(path)
-logging.debug("documentViewer (getdocinfofromimagepath) PATH:"+path)
+#logging.debug("documentViewer (getdocinfofromimagepath) PATH:"+path)
 imageUrl=self.digilibBaseUrl+"/servlet/Scaler?fn="+path
 docinfo['imageURL'] = imageUrl
 #path ist the path to the images it assumes that the index.meta file is one level higher.
 docinfo = self.getBibinfoFromIndexMeta(pathorig,docinfo=docinfo,cut=cut+1)
 return docinfo
 def getDocinfo(self, mode, url):
 """returns docinfo depending on mode"""
-logging.debug("documentViewer (getdocinfo) mode: %s, url: %s"%(mode,url))
+#logging.debug("documentViewer (getdocinfo) mode: %s, url: %s"%(mode,url))
 # look for cached docinfo in session
 if self.REQUEST.SESSION.has_key('docinfo'):
 docinfo = self.REQUEST.SESSION['docinfo']
 # check if its still current
 if docinfo is not None and docinfo.get('mode') == mode and docinfo.get('url') == url:
-logging.debug("documentViewer (getdocinfo) docinfo in session: %s"%docinfo)
+#logging.debug("documentViewer (getdocinfo) docinfo in session: %s"%docinfo)
 return docinfo
 # new docinfo
 docinfo = {'mode': mode, 'url': url}
 if mode=="texttool": #index.meta with texttool information
 docinfo = self.getDocinfoFromTextTool(url, docinfo=docinfo)
 elif mode=="imagepath":
 docinfo = self.getDocinfoFromImagePath(url, docinfo=docinfo)
 elif mode=="filepath":
 docinfo = self.getDocinfoFromImagePath(url, docinfo=docinfo,cut=1)
 else:
-logging.error("documentViewer (getdocinfo) unknown mode: %s!"%mode)
+#logging.error("documentViewer (getdocinfo) unknown mode: %s!"%mode)
 raise ValueError("Unknown mode %s! Has to be one of 'texttool','imagepath','filepath'."%(mode))
-logging.debug("documentViewer (getdocinfo) docinfo: %s"%docinfo)
+#logging.debug("documentViewer (getdocinfo) docinfo: %s"%docinfo)
 self.REQUEST.SESSION['docinfo'] = docinfo
 return docinfo
 def getPageinfo(self, current, start=None, rows=None, cols=None, docinfo=None, viewMode=None, tocMode=None):
 """returns pageinfo with the given parameters"""
 "Add a Page Template with optional file content."
 self._setObject(id, DocumentViewerTemplate(id))
 ob = getattr(self, id)
 txt=file(os.path.join(package_home(globals()),'zpt/viewer_main.zpt'),'r').read()
-logging.info("txt %s:"%txt)
+#logging.info("txt %s:"%txt)
 ob.pt_edit(txt,"text/html")
 if title:
 ob.pt_setTitle(title)
 try:
 u = self.DestinationURL()

Mercurial > hg > documentViewer

comparison documentViewer.py @ 166:ffb5c62bd459