# HG changeset patch # User abukhman # Date 1297768359 -3600 # Node ID 630a4581992a90941f780197bdd2adfa8079e929 # Parent d6a2125a4b0937d7f98f794747f6004b48c5cc8d *** empty log message *** diff -r d6a2125a4b09 -r 630a4581992a MpdlXmlTextServer.py --- a/MpdlXmlTextServer.py Mon Feb 14 15:41:13 2011 +0100 +++ b/MpdlXmlTextServer.py Tue Feb 15 12:12:39 2011 +0100 @@ -209,7 +209,15 @@ if len(pagedivs)>0: docinfo['pageNumberOrig']= getTextFromNode(pagedivs[0]) logging.debug("ORIGINAL PAGES: %s"%(docinfo['pageNumberOrig'])) - + + #original Pages Norm + pagedivs = dom.xpath("//div[@class='pageNumberOrigNorm']") + if pagedivs == dom.xpath("//div[@class='pageNumberOrigNorm']"): + if len(pagedivs)>0: + docinfo['pageNumberOrigNorm']= getTextFromNode(pagedivs[0]) + logging.debug("ORIGINAL PAGES: %s"%(docinfo['pageNumberOrigNorm'])) + + #figureEntries pagedivs = dom.xpath("//div[@class='countFigureEntries']") if pagedivs == dom.xpath("//div[@class='countFigureEntries']"): @@ -288,6 +296,7 @@ docinfo['countPlaces'] = 0 docinfo['countTocEntries'] = 0 docinfo['numPages'] = 0 + docinfo['pageNumberOrigNorm'] = 0 #return docinfo # plain text mode