Changeset 469:15394486ab75 in documentViewer for MpdlXmlTextServer.py
- Timestamp: Aug 3, 2011, 7:04:18 PM (14 years ago)
- Branch: elementtree
- File: 1 edited
Legend:
- Unmodified
- Added
- Removed
-
MpdlXmlTextServer.py
r465 r469
 228  228       def processPageInfo(self, dom, docinfo, pageinfo):
 229  229           """processes page info divs from dom and stores in docinfo and pageinfo"""
 230      -         # process all toplevel divs
 231      -         alldivs = dom.findall(".//div")
 232      -         pagediv = None
      230 +         # assume first second level div is pageMeta
      231 +         alldivs = dom.find("div")
 233  232           for div in alldivs:
 234  233               dc = div.get('class')
 235  234
 236      -             # page content div
 237      -             if dc == 'pageContent':
 238      -                 pagediv = div
 239      -
 240  235               # pageNumberOrig
 241      -             elif dc == 'pageNumberOrig':
      236 +             if dc == 'pageNumberOrig':
 242  237                   pageinfo['pageNumberOrig'] = div.text
 243  238
   …    …
 248  243               # pageNumberOrigNorm
 249  244               elif dc == 'countFigureEntries':
 250      -                 docinfo[' countFigureEntries'] = getInt(div.text)
      245 +                 docinfo['numFigureEntries'] = getInt(div.text)
 251  246
 252  247               # pageNumberOrigNorm
 253  248               elif dc == 'countTocEntries':
 254  249                   # WTF: s1 = int(s)/30+1
 255      -                 docinfo['countTocEntries'] = getInt(div.text)
      250 +                 docinfo['numTocEntries'] = getInt(div.text)
      251 +
      252 +             # pageHeaderTitle
      253 +             elif dc == 'pageHeaderTitle':
      254 +                 docinfo['pageHeaderTitle'] = div.text
 256  255
 257  256               # numTextPages
   …    …
 312  311           pagediv = None
 313  312           # ElementTree 1.2 in Python 2.6 can't do div[@class='pageContent']
 314      -         alldivs = dom.findall(".//div")
      313 +         # so we look at the second level divs
      314 +         alldivs = dom.findall("div")
 315  315           for div in alldivs:
 316  316               dc = div.get('class')
Note: See TracChangeset
for help on using the changeset viewer.