documentViewer: MpiwgXmlTextServer.py comparison

comparison MpiwgXmlTextServer.py @ 579:fc861a6cef17

Update for the change in w-tag format.

author	casties
date	Fri, 26 Oct 2012 12:53:43 +0200
parents	9251719154a3
children	ca0274423382

comparison

Legend: equal | deleted | inserted | replaced

-:024b75162437
+:fc861a6cef17
 # TODO: change values in form
 if normMode == 'regPlusNorm':
 normMode = 'norm'
 # TODO: this should not be necessary when the backend is fixed
-textParams['normalization'] = normMode
+#textParams['normalization'] = normMode
 if not mode:
 # default is dict
 mode = 'text'
 # the text is in div@class=text
 pagediv = dom.find(".//div[@class='text']")
 logging.debug("pagediv: %s"%repr(pagediv))
 if pagediv is not None:
 # add textmode and normMode classes
-pagediv.set('class', 'text %s %s'%(textmode, normMode))
+#pagediv.set('class', 'text %s %s'%(textmode, normMode))
 self._processWTags(textmode, normMode, pagediv)
 #self._processPbTag(pagediv, pageinfo)
 self._processFigures(pagediv, docinfo)
 #self._fixEmptyDivs(pagediv)
 # get full url assuming documentViewer is parent
 l.set('href', re.sub(r'doc=[\w+/=]+', 'doc=%s'%doc, href))
 l.set('target', '_blank')
 return serialize(pagediv)
-logging.error("getTextPage: error in text mode %s or text!"%(textmode))
+logging.error("getTextPage: error in text mode %s or in text!"%(textmode))
 return None
 def _processWTags(self, textMode, normMode, pagediv):
 """selects the necessary information from w-spans and removes the rest from pagediv"""
 logging.debug("processWTags(textMode=%s,norm=%s,pagediv"%(repr(textMode),repr(normMode)))
 # delete non-a-tags
 wtag.remove(wtag.find("span[@class='nodictionary orig']"))
 wtag.remove(wtag.find("span[@class='nodictionary reg']"))
 wtag.remove(wtag.find("span[@class='nodictionary norm']"))
 # delete non-matching children of a-tag and suppress remaining tag name
-atag = wtag.find("a[@class='dictionary']")
+atag = wtag.find("*[@class='dictionary']")
 if normMode == 'orig':
 atag.remove(atag.find("span[@class='reg']"))
 atag.remove(atag.find("span[@class='norm']"))
 atag.find("span[@class='orig']").tag = None
 elif normMode == 'reg':
 atag.remove(atag.find("span[@class='reg']"))
 atag.find("span[@class='norm']").tag = None
 else:
 # delete a-tag
-wtag.remove(wtag.find("a[@class='dictionary']"))
+wtag.remove(wtag.find("*[@class='dictionary']"))
 # delete non-matching children and suppress remaining tag name
 if normMode == 'orig':
 wtag.remove(wtag.find("span[@class='nodictionary reg']"))
 wtag.remove(wtag.find("span[@class='nodictionary norm']"))
 wtag.find("span[@class='nodictionary orig']").tag = None

Mercurial > hg > documentViewer

comparison MpiwgXmlTextServer.py @ 579:fc861a6cef17