version 1.156, 2010/10/15 13:39:15
|
version 1.157, 2010/10/15 13:42:09
|
Line 189 class MpdlXmlTextServer(SimpleItem):
|
Line 189 class MpdlXmlTextServer(SimpleItem):
|
dom =Parse(text) |
dom =Parse(text) |
pagedivs = dom.xpath("//div[@class='pageNumberOrig']") |
pagedivs = dom.xpath("//div[@class='pageNumberOrig']") |
logging.debug("getOrigPages :%s"%(pagedivs)) |
logging.debug("getOrigPages :%s"%(pagedivs)) |
for l in pagedivs: |
original =getTextFromNode(pagedivs[0]) |
hrefNode = l.getAttributeNodeNS(None, u"div") |
logging.debug("XXXXXXXXXXXgetOrigPagesXXXXXXXX :%s"%(original)) |
href=hrefNode.nodeValue |
return original |
logging.debug("XXXXXXXXXXXgetOrigPagesXXXXXXXX :%s"%(href)) |
|
return "pagedivs" |
|
|
|
def getTextPage(self, mode="text", pn=1, docinfo=None, pageinfo=None, highlightQuery=None,sn=None, viewMode=None, tocMode=None, tocPN=None, characterNormalization=""): |
def getTextPage(self, mode="text", pn=1, docinfo=None, pageinfo=None, highlightQuery=None,sn=None, viewMode=None, tocMode=None, tocPN=None, characterNormalization=""): |
"""returns single page from fulltext""" |
"""returns single page from fulltext""" |