version 1.229, 2011/03/01 14:53:15
|
version 1.230, 2011/03/07 14:08:07
|
Line 85 class MpdlXmlTextServer(SimpleItem):
|
Line 85 class MpdlXmlTextServer(SimpleItem):
|
selfurl = self.absolute_url() |
selfurl = self.absolute_url() |
pagexml=href.replace('mode=text','mode=texttool&viewMode=%s&queryType=%s&query=%s&queryResultPageSize=%s&queryResultPN=%s&tocMode=%s&searchPN=%s&tocPN=%s&optionToggle=%s&characterNormalization=%s'%(viewMode,queryType,urllib.quote(query),pagesize,pn,tocMode,pn,tocPN,optionToggle,characterNormalization)) |
pagexml=href.replace('mode=text','mode=texttool&viewMode=%s&queryType=%s&query=%s&queryResultPageSize=%s&queryResultPN=%s&tocMode=%s&searchPN=%s&tocPN=%s&optionToggle=%s&characterNormalization=%s'%(viewMode,queryType,urllib.quote(query),pagesize,pn,tocMode,pn,tocPN,optionToggle,characterNormalization)) |
hrefNode.nodeValue = pagexml.replace('page-fragment.xql','%s'%selfurl) |
hrefNode.nodeValue = pagexml.replace('page-fragment.xql','%s'%selfurl) |
logging.debug("PUREXML :%s"%(serializeNode(pagenode))) |
#logging.debug("PUREXML :%s"%(serializeNode(pagenode))) |
return serializeNode(pagenode) |
return serializeNode(pagenode) |
if (queryType=="fulltextMorph"): |
if (queryType=="fulltextMorph"): |
pagedivs = pagedom.xpath("//div[@class='queryResult']") |
pagedivs = pagedom.xpath("//div[@class='queryResult']") |
Line 150 class MpdlXmlTextServer(SimpleItem):
|
Line 150 class MpdlXmlTextServer(SimpleItem):
|
href= hrefNode.nodeValue |
href= hrefNode.nodeValue |
hrefList.append(href) |
hrefList.append(href) |
myList = ",".join(hrefList) |
myList = ",".join(hrefList) |
logging.debug("getGisPlaces :%s"%(myList)) |
#logging.debug("getGisPlaces :%s"%(myList)) |
return myList |
return myList |
|
|
def getAllGisPlaces (self, docinfo=None, pageinfo=None): |
def getAllGisPlaces (self, docinfo=None, pageinfo=None): |
Line 171 class MpdlXmlTextServer(SimpleItem):
|
Line 171 class MpdlXmlTextServer(SimpleItem):
|
href= hrefNode.nodeValue |
href= hrefNode.nodeValue |
hrefList.append(href) |
hrefList.append(href) |
myList = ",".join(hrefList) |
myList = ",".join(hrefList) |
logging.debug("getALLGisPlaces :%s"%(myList)) |
#logging.debug("getALLGisPlaces :%s"%(myList)) |
return myList |
return myList |
|
|
|
|
Line 202 class MpdlXmlTextServer(SimpleItem):
|
Line 202 class MpdlXmlTextServer(SimpleItem):
|
dom = Parse(pagexml) |
dom = Parse(pagexml) |
#original Pages |
#original Pages |
pagedivs = dom.xpath("//div[@class='pageNumberOrig']") |
pagedivs = dom.xpath("//div[@class='pageNumberOrig']") |
if pagedivs == dom.xpath("//div[@class='pageNumberOrig']"): |
"""if pagedivs == dom.xpath("//div[@class='pageNumberOrig']"): |
if len(pagedivs)>0: |
if len(pagedivs)>0: |
docinfo['pageNumberOrig']= getTextFromNode(pagedivs[0]) |
docinfo['pageNumberOrig']= getTextFromNode(pagedivs[0]) |
|
logging.debug("ORIGINAL PAGE: %s"%(docinfo['pageNumberOrig'])) |
|
|
#original Pages Norm |
#original Pages Norm |
pagedivs = dom.xpath("//div[@class='pageNumberOrigNorm']") |
pagedivs = dom.xpath("//div[@class='pageNumberOrigNorm']") |
if pagedivs == dom.xpath("//div[@class='pageNumberOrigNorm']"): |
if pagedivs == dom.xpath("//div[@class='pageNumberOrigNorm']"): |
if len(pagedivs)>0: |
if len(pagedivs)>0: |
docinfo['pageNumberOrigNorm']= getTextFromNode(pagedivs[0]) |
docinfo['pageNumberOrigNorm']= getTextFromNode(pagedivs[0]) |
|
logging.debug("ORIGINAL PAGE NORM: %s"%(docinfo['pageNumberOrigNorm'])) |
|
""" |
#figureEntries |
#figureEntries |
pagedivs = dom.xpath("//div[@class='countFigureEntries']") |
pagedivs = dom.xpath("//div[@class='countFigureEntries']") |
if pagedivs == dom.xpath("//div[@class='countFigureEntries']"): |
if pagedivs == dom.xpath("//div[@class='countFigureEntries']"): |
Line 363 class MpdlXmlTextServer(SimpleItem):
|
Line 365 class MpdlXmlTextServer(SimpleItem):
|
return serializeNode(pagenode) |
return serializeNode(pagenode) |
return "no text here" |
return "no text here" |
|
|
|
def getOrigPages(self, docinfo=None, pageinfo=None):
    """Look up the original page number of the current page.

    Requests "page-fragment.xql" through self.getServerData for the
    document docinfo['textURLPath'] and the page pageinfo['current'],
    parses the response and reads the text of the first
    div with class 'pageNumberOrig'.

    If such a div exists, its text is stored in docinfo['pageNumberOrig']
    and returned. If it does not exist, docinfo is left unchanged and the
    value already stored under that key is returned (None when there is
    none).

    Both docinfo and pageinfo are indexed unconditionally, so the None
    defaults are not usable values; callers must pass both mappings.
    """
    docpath = docinfo['textURLPath']
    pn = pageinfo['current']

    pagexml = self.getServerData("page-fragment.xql", "document=%s&pn=%s" % (docpath, pn))
    dom = Parse(pagexml)

    # A single XPath evaluation suffices: comparing the result with a second
    # run of the identical query cannot tell us anything new.
    pagedivs = dom.xpath("//div[@class='pageNumberOrig']")
    if len(pagedivs) > 0:
        docinfo['pageNumberOrig'] = getTextFromNode(pagedivs[0])

    # NOTE(review): assumes docinfo is a dict (it is item-assigned above).
    # .get keeps a missing div from surfacing as a KeyError.
    return docinfo.get('pageNumberOrig')
|
|
|
def getOrigPagesNorm(self, docinfo=None, pageinfo=None):
    """Look up the normalized original page number of the current page.

    Requests "page-fragment.xql" through self.getServerData for the
    document docinfo['textURLPath'] and the page pageinfo['current'],
    parses the response and reads the text of the first
    div with class 'pageNumberOrigNorm'.

    If such a div exists, its text is stored in
    docinfo['pageNumberOrigNorm'] and returned. If it does not exist,
    docinfo is left unchanged and the value already stored under that key
    is returned (None when there is none).

    Both docinfo and pageinfo are indexed unconditionally, so the None
    defaults are not usable values; callers must pass both mappings.
    """
    docpath = docinfo['textURLPath']
    pn = pageinfo['current']

    pagexml = self.getServerData("page-fragment.xql", "document=%s&pn=%s" % (docpath, pn))
    dom = Parse(pagexml)

    # A single XPath evaluation suffices: comparing the result with a second
    # run of the identical query cannot tell us anything new.
    pagedivs = dom.xpath("//div[@class='pageNumberOrigNorm']")
    if len(pagedivs) > 0:
        docinfo['pageNumberOrigNorm'] = getTextFromNode(pagedivs[0])

    # NOTE(review): assumes docinfo is a dict (it is item-assigned above).
    # .get keeps a missing div from surfacing as a KeyError.
    return docinfo.get('pageNumberOrigNorm')
|
|
|
|
def getTranslate(self, query=None, language=None): |
def getTranslate(self, query=None, language=None): |
"""translate into another languages""" |
"""translate into another languages""" |
data = self.getServerData("lt/lex.xql","document=&language="+str(language)+"&query="+urllib.quote(query)) |
data = self.getServerData("lt/lex.xql","document=&language="+str(language)+"&query="+urllib.quote(query)) |