version 1.9, 2006/09/10 22:57:38
|
version 1.10, 2006/09/11 14:43:23
|
Line 24 import urllib
|
Line 24 import urllib
|
try: |
try: |
from Ft.Xml.Xslt.Processor import Processor |
from Ft.Xml.Xslt.Processor import Processor |
from Ft.Xml import InputSource, EMPTY_NAMESPACE,Parse |
from Ft.Xml import InputSource, EMPTY_NAMESPACE,Parse |
|
from Ft.Xml.Domlette import NonvalidatingReader |
except: |
except: |
print "4suite has to be installed" |
print "4suite has to be installed" |
|
|
Line 144 class ECHO_xslt(ECHO_pageTemplate,ECHO_l
|
Line 145 class ECHO_xslt(ECHO_pageTemplate,ECHO_l
|
|
|
meta_type="ECHO_xslt" |
meta_type="ECHO_xslt" |
|
|
cache=ECHO_cache() |
cache=ECHO_cache() # cache for analysed pages |
|
caching="yes" |
|
|
|
appendQueryString=True # add query string to the cgiUrl can be changed with addChanges |
|
|
|
passURL=False #use url from querystring parameter fn to retrieve the text and not the url in cgi-url can be changed with addChanges |
|
|
|
|
results={} |
results={} |
manage_options=ECHO_pageTemplate.manage_options+( |
manage_options=ECHO_pageTemplate.manage_options+( |
Line 164 class ECHO_xslt(ECHO_pageTemplate,ECHO_l
|
Line 171 class ECHO_xslt(ECHO_pageTemplate,ECHO_l
|
pt=zptFile(self, 'zpt/ChangeECHO_xsltForm.zpt') |
pt=zptFile(self, 'zpt/ChangeECHO_xsltForm.zpt') |
return pt() |
return pt() |
|
|
def addChanges(self,cgiUrl,RESPONSE=None): |
def addChanges(self,cgiUrl,appendQueryString=False,passURL=False,caching=False,RESPONSE=None): |
"""change the xslt, ueberschriebt addChanges in ECHO_PageTemplate""" |
"""change the xslt, ueberschriebt addChanges in ECHO_PageTemplate""" |
|
|
if urlparse.urlparse(cgiUrl)[0]=="":#relative url in absolute |
if urlparse.urlparse(cgiUrl)[0]=="":#relative url in absolute |
self.cgiUrl=urlparse.urljoin(self.absolute_url(), cgiUrl) |
self.cgiUrl=urlparse.urljoin(self.absolute_url(), cgiUrl) |
else: |
else: |
self.cgiUrl=cgiUrl |
self.cgiUrl=cgiUrl |
|
|
|
if appendQueryString: |
|
self.appendQueryString=True |
|
else: |
|
self.appendQueryString=False |
|
|
|
if passURL: |
|
self.passURL=True |
|
else: |
|
self.passURL=False |
|
|
|
if caching: |
|
self.caching="yes" |
|
else: |
|
self.caching="No" |
|
|
|
|
if RESPONSE: |
if RESPONSE: |
RESPONSE.redirect("manage_main") |
RESPONSE.redirect("manage_main") |
|
|
Line 218 class ECHO_xslt(ECHO_pageTemplate,ECHO_l
|
Line 242 class ECHO_xslt(ECHO_pageTemplate,ECHO_l
|
return self._v_xmltrans.getResult() |
return self._v_xmltrans.getResult() |
|
|
|
|
|
def getText(self): |
|
"""print nur den text""" |
|
qs,baseUri=self.getTextInput() |
|
self.REQUEST.RESPONSE.redirect(qs) |
|
|
def deleteCache(self): |
def deleteCache(self): |
"""deletefrom cache""" |
"""deletefrom cache""" |
fn=self.REQUEST['fn'] |
fn=self.REQUEST['fn'] |
self.cache.deleteObject(fn) |
self.cache.deleteObject(fn) |
|
|
def getPageLex(self,_pn="1",_caching="yes"): |
def getPageLex(self,_pn="1",_caching=None): |
"""getpage mit lexikalischer analyse und xslt transform |
"""getpage mit lexikalischer analyse und xslt transform |
if _caching=yes dann wird die lwxikalisch analysierte seite in einem cache abgespeichert |
if _caching=yes dann wird die lwxikalisch analysierte seite in einem cache abgespeichert |
""" |
""" |
|
|
|
if not _caching: |
|
_caching=self.caching |
|
|
fn=self.REQUEST['fn'] |
fn=self.REQUEST['fn'] |
|
|
|
|
fromCache=self.cache.retrieveObject(fn,_pn) |
fromCache=self.cache.retrieveObject(fn,_pn) |
|
|
if fromCache and _caching=="yes": |
if fromCache and _caching=="yes": |
print "retrieve",fn,_pn |
|
txt = fromCache |
txt = fromCache |
else: |
else: |
txt=self.tagLex(nr=_pn) |
txt=self.tagLex(nr=_pn) |
print "store",fn,_pn |
|
self.cache.storeObject(fn,_pn,txt[0:]) |
self.cache.storeObject(fn,_pn,txt[0:]) |
|
|
|
|
xsl=self.xslt() |
xsl=self.xslt() |
|
|
xsltproc=Processor() |
xsltproc=Processor() |
Line 255 class ECHO_xslt(ECHO_pageTemplate,ECHO_l
|
Line 287 class ECHO_xslt(ECHO_pageTemplate,ECHO_l
|
|
|
return tmp[0:] |
return tmp[0:] |
|
|
|
def getTextInput(self): |
|
"""get the text |
|
wie der text geholt wird liegt an der konfiguration, |
|
is appendQueryString gesetzt, dann wir jeweils der Querystring an vorgebenen url gesetzt, erwartet wird fn= |
|
fźr den Pfad, is passURL gesetzt, dann wird falls fn= eine vollstŠndige url enthŠlt, diese anstelle der in cgiurl definierten genommen. |
|
""" |
|
|
|
if getattr(self,'passURL',False) and self.REQUEST.has_key('fn') and (urlparse.urlparse(self.REQUEST['fn'])[0]=='http'): |
|
qs=self.REQUEST['fn'] |
|
baseUri=qs |
|
elif getattr(self,'pappendQueryString',True): |
|
qs="%s%s"%(self.cgiUrl,self.REQUEST['QUERY_STRING']) |
|
baseUri=self.cgiUrl |
|
else: |
|
qs="%s"%(self.cgiUrl) |
|
baseUri=self.cgiUrl |
|
|
|
#fact= InputSource.DefaultFactory.fromUri(qs) |
|
return qs,baseUri |
|
#return InputSource.InputSource(fact) |
|
#xmlt=urllib.urlopen(qs).read() |
|
|
def getPage(self,_pn,REQUEST=None): |
def getPage(self,_pn,REQUEST=None,_caching=None): |
"""get a page from an xml""" |
"""get a page from an xml""" |
|
|
|
if not _caching: |
|
_caching=self.caching |
|
|
pn=int(_pn)-1 |
pn=int(_pn)-1 |
if pn<0: |
if pn<0: |
if REQUEST: |
if REQUEST: |
return "Sorry, pagenumbers have to be greater than 0" |
return "Sorry, pagenumbers have to be greater than 0" |
else: |
else: |
return None |
return None |
impl=xml.dom.getDOMImplementation() |
|
newDoc=impl.createDocument(EMPTY_NAMESPACE,None,None |
|
) |
|
root=newDoc.createElement('page') |
|
newDoc.appendChild(root) |
|
|
|
|
xmlt,self.baseUri=self.getTextInput() |
|
|
qs="%s%s"%(self.cgiUrl,self.REQUEST['QUERY_STRING']) |
#get the text from cache, if existing |
|
fromCache=self.cache.retrieveObject(self.baseUri,"-1") |
|
if fromCache and _caching=="yes": |
|
|
|
txt = fromCache |
|
else: |
|
|
|
txt=urllib.urlopen(xmlt).read() |
|
|
|
self.cache.storeObject(self.baseUri,"-1",txt) |
|
|
xmlt=urllib.urlopen(qs).read() |
dom=NonvalidatingReader.parseString(txt,self.baseUri) |
dom=Parse(xmlt) |
|
|
|
|
#pb should have a namespache |
|
|
|
pbs=dom.xpath("//mpiwg:pb",explicitNss={'mpiwg':'http://www.mpiwg-berlin.mpg.de/namespace'}) |
|
if len(pbs)==0: # versuche nochmal ohne |
pbs=dom.xpath("//pb") |
pbs=dom.xpath("//pb") |
|
|
if pn > len(pbs): |
if pn > len(pbs): |
if REQUEST: |
if REQUEST: |
return "Sorry, pagenumber %s does not exit"%pn+1 |
return "Sorry, pagenumber %s does not exit"%(pn+1) |
else: |
else: |
return None |
return None |
|
|
Line 292 class ECHO_xslt(ECHO_pageTemplate,ECHO_l
|
Line 356 class ECHO_xslt(ECHO_pageTemplate,ECHO_l
|
else: |
else: |
endNode=None |
endNode=None |
|
|
|
|
# follower=beginNode.xpath('following::node()') |
|
# #root.appendChild(beginNode) |
|
# found=[] |
|
# |
|
# for node in endNode.xpath('preceding::node()'): |
|
# if node in follower: |
|
# found.append(node) |
|
# |
|
|
|
|
|
#rempove all children of parents which are also in the list |
|
# for x in found: |
|
# for child in x.xpath(".//*"): |
|
# try: |
|
# |
|
# nr=found.index(child) |
|
# |
|
# del(found[nr]) |
|
# except: |
|
# pass |
|
# |
|
# found.append(endNode) |
|
# |
|
deleteNodes=beginNode.xpath('preceding::node()') |
deleteNodes=beginNode.xpath('preceding::node()') |
if endNode: |
if endNode: |
deleteNodes+=endNode.xpath('following::node()') |
deleteNodes+=endNode.xpath('following::node()') |