--- documentViewer/MpdlXmlTextServer.py 2011/01/06 15:44:18 1.222 +++ documentViewer/MpdlXmlTextServer.py 2011/02/14 14:41:12 1.225 @@ -3,6 +3,7 @@ from OFS.SimpleItem import SimpleItem from Products.PageTemplates.PageTemplateFile import PageTemplateFile from Ft.Xml import EMPTY_NAMESPACE, Parse +import md5 import sys import logging import urllib @@ -54,9 +55,7 @@ class MpdlXmlTextServer(SimpleItem): optionToggle = pageinfo['optionToggle'] tocPN = pageinfo['tocPN'] selfurl = self.absolute_url() - data = self.getServerData("doc-query.xql","document=%s&mode=%s&queryType=%s&query=%s&queryResultPageSize=%s&queryResultPN=%s&sn=%s&viewMode=%s&characterNormalization=%s&optionToggle=%s&highlightQuery=%s"%(docpath, 'text', queryType, urllib.quote(query), pagesize, pn, sn, viewMode,characterNormalization,optionToggle ,urllib.quote(highlightQuery))) - pagexml = data.replace('?document=%s'%str(docpath),'?url=%s'%url) pagedom = Parse(pagexml) @@ -86,6 +85,7 @@ class MpdlXmlTextServer(SimpleItem): selfurl = self.absolute_url() pagexml=href.replace('mode=text','mode=texttool&viewMode=%s&queryType=%s&query=%s&queryResultPageSize=%s&queryResultPN=%s&tocMode=%s&searchPN=%s&tocPN=%s&optionToggle=%s&characterNormalization=%s'%(viewMode,queryType,urllib.quote(query),pagesize,pn,tocMode,pn,tocPN,optionToggle,characterNormalization)) hrefNode.nodeValue = pagexml.replace('page-fragment.xql','%s'%selfurl) + logging.debug("PUREXML :%s"%(serializeNode(pagenode))) return serializeNode(pagenode) if (queryType=="fulltextMorph"): pagedivs = pagedom.xpath("//div[@class='queryResult']") @@ -176,17 +176,17 @@ class MpdlXmlTextServer(SimpleItem): return myList - def getTextPage(self, docinfo=None, pageinfo=None): + def getTextPage(self, mode="text", pn=1, docinfo=None, pageinfo=None): """returns single page from fulltext""" docpath = docinfo['textURLPath'] path = docinfo['textURLPath'] url = docinfo.get('url',None) name = docinfo.get('name',None) pn =pageinfo['current'] - #viewMode= pageinfo['viewMode'] + viewMode= pageinfo['viewMode'] sn = pageinfo['sn'] highlightQuery = pageinfo['highlightQuery'] - mode = pageinfo ['viewMode'] + #mode = pageinfo ['viewMode'] tocMode = pageinfo['tocMode'] characterNormalization=pageinfo['characterNormalization'] tocPN = pageinfo['tocPN'] @@ -363,7 +363,22 @@ class MpdlXmlTextServer(SimpleItem): hrefNode.nodeValue = href.replace('#note-',"?url=%s&viewMode=%s&tocMode=%s&tocPN=%s&pn=%s#note-"%(url,viewMode,tocMode,tocPN,pn)) return serializeNode(pagenode) return "no text here" - + + def getText(self, mode="text", pn=1, docinfo=None, pageinfo=None): + data = self.getTextPage(mode="text", pn=1 ,docinfo=docinfo, pageinfo=pageinfo) + logging.debug("TEXT ALL data: %s"%(data)) + return data + + def getXML(self, mode="xml", pn=1, docinfo=None, pageinfo=None): + data = self.getTextPage(mode="xml", pn=1 ,docinfo=docinfo, pageinfo=pageinfo) + logging.debug("TEXT ALL data: %s"%(data)) + return data + + def getDictionary(self, mode="text_dict", pn=1, docinfo=None, pageinfo=None): + data = self.getTextPage(mode="text_dict", pn=1 ,docinfo=docinfo, pageinfo=pageinfo) + logging.debug("TEXT ALL data: %s"%(data)) + return data + def getTranslate(self, query=None, language=None): """translate into another languages""" data = self.getServerData("lt/lex.xql","document=&language="+str(language)+"&query="+urllib.quote(query)) @@ -456,7 +471,7 @@ class MpdlXmlTextServer(SimpleItem): page = data.replace('page-fragment.xql?document=%s'%str(path),'%s?url=%s&viewMode=%s&tocMode=%s&tocPN=%s&optionToggle=1'%(selfurl,url, viewMode, tocMode, tocPN)) text = page.replace('mode=image','mode=texttool') #logging.debug("documentViewer (characterNormalization) characterNormalization: %s"%(characterNormalization)) - + logging.debug("TEXT %s"%(text)) return text def manage_changeMpdlXmlTextServer(self,title="",serverUrl="http://mpdl-proto.mpiwg-berlin.mpg.de/mpdl/interface/",timeout=40,RESPONSE=None): @@ -478,7 +493,4 @@ def manage_addMpdlXmlTextServer(self,id, newObj = MpdlXmlTextServer(id,title,serverUrl,timeout) self.Destination()._setObject(id, newObj) if RESPONSE is not None: - RESPONSE.redirect('manage_main') - - - + RESPONSE.redirect('manage_main') \ No newline at end of file