version 1.11, 2006/09/14 14:31:53
|
version 1.19, 2007/01/31 14:12:39
|
Line 7 from ECHO_Nav import ECHO_pageTemplate
|
Line 7 from ECHO_Nav import ECHO_pageTemplate
|
from threading import Thread,Timer |
from threading import Thread,Timer |
import threading |
import threading |
from ECHO_helpers import * |
from ECHO_helpers import * |
import ECHO_language |
try: |
|
from ECHO_language import * |
|
except: |
|
print "no echo language" |
|
class ECHO_language: |
|
"""leere Klasse""" |
|
pass |
import sys |
import sys |
import urllib |
import urllib |
import urlparse |
import urlparse |
Line 19 import transaction
|
Line 25 import transaction
|
|
|
import os.path |
import os.path |
|
|
import urllib |
import urllib,cgi |
|
|
try: |
try: |
from Ft.Xml.Xslt.Processor import Processor |
from Ft.Xml.Xslt.Processor import Processor |
Line 77 class getXML(Implicit):
|
Line 83 class getXML(Implicit):
|
|
|
|
|
#print self.xsl |
#print self.xsl |
#print xsltproc.run(document) |
#< xsltproc.run(document) |
tmp=xsltproc.run(document) |
tmp=xsltproc.run(document) |
|
|
self.result=tmp[0:] |
self.result=tmp[0:] |
Line 100 from ZODB.FileStorage import FileStorage
|
Line 106 from ZODB.FileStorage import FileStorage
|
class ECHO_cache: |
class ECHO_cache: |
def __init__(self): |
def __init__(self): |
"""init the storage""" |
"""init the storage""" |
self.storage=FileStorage("/var/tmp/echo_cache.fs") |
self.storage=FileStorage(os.path.join(INSTANCE_HOME,"var/echo_cache.fs")) |
self.db=DB(self.storage) |
self.db=DB(self.storage) |
self.connection=self.db.open() |
self.connection=self.db.open() |
self.root=self.connection.root() |
self.root=self.connection.root() |
Line 137 class ECHO_cache:
|
Line 143 class ECHO_cache:
|
if not fileStore: |
if not fileStore: |
return None |
return None |
else: |
else: |
|
|
return self.root[name].get(pn,None) |
return self.root[name].get(pn,None) |
|
|
|
|
class ECHO_xslt(ECHO_pageTemplate,ECHO_language.ECHO_language): |
class ECHO_xslt(ECHO_pageTemplate,ECHO_language): |
"""ECHO_xslt classe""" |
"""ECHO_xslt classe""" |
|
|
meta_type="ECHO_xslt" |
meta_type="ECHO_xslt" |
Line 252 class ECHO_xslt(ECHO_pageTemplate,ECHO_l
|
Line 259 class ECHO_xslt(ECHO_pageTemplate,ECHO_l
|
fn=self.REQUEST['fn'] |
fn=self.REQUEST['fn'] |
self.cache.deleteObject(fn) |
self.cache.deleteObject(fn) |
|
|
def getPageLex(self,_pn="1",_id=None,_caching=None): |
|
|
def createLinkNode(self,url,dom): |
|
"""createa a link node""" |
|
txt=dom.createTextNode("<XMLLink>") |
|
node=dom.createElementNS("http://test.de","a") |
|
node.setAttributeNS("http://test.de","href",url) |
|
node.appendChild(txt) |
|
return node |
|
|
|
def forwardLink(self,linkid,url,type="target",RESPONSE=None): |
|
"""forward to link""" |
|
if RESPONSE: |
|
RESPONSE.redirect(self.getLink(linkid,url,type=type)) |
|
|
|
else: |
|
return self.getLink(linkid,url,type=type) |
|
def getLink(self,linkid,url,type="target"): |
|
"""get target for linkid""" |
|
dom=NonvalidatingReader.parseUri(url) |
|
|
|
masterurl=dom.xpath("//mpiwg:masterurl/@ref",explicitNss={'mpiwg':'http://www.mpiwg-berlin.mpg.de/namespace'})[0].value |
|
slaveurl=dom.xpath("//mpiwg:slaveurl/@ref",explicitNss={'mpiwg':'http://www.mpiwg-berlin.mpg.de/namespace'})[0].value |
|
|
|
#check now if there are in the link file |
|
|
|
xp="//mpiwg:link[@id='%s']"%linkid |
|
|
|
if type=="target": |
|
for link in dom.xpath(xp,explicitNss={'mpiwg':'http://www.mpiwg-berlin.mpg.de/namespace'}): |
|
fn=link.xpath("mpiwg:target/@filename",explicitNss={'mpiwg':'http://www.mpiwg-berlin.mpg.de/namespace'})[0].value |
|
|
|
if urlparse.urlparse(urllib.unquote(fn))[0]=="http": # fn ist eine url |
|
return urllib.unquote(fn) # dann gibt diese zurueck |
|
|
|
ref=link.xpath("mpiwg:target/@refid",explicitNss={'mpiwg':'http://www.mpiwg-berlin.mpg.de/namespace'})[0].value |
|
|
|
ref2=link.xpath("mpiwg:target/mpiwg:pagelink/@refid",explicitNss={'mpiwg':'http://www.mpiwg-berlin.mpg.de/namespace'})[0].value |
|
selectionNodeIndex=link.xpath("mpiwg:target/mpiwg:pagelink/@selectionNodeIndex",explicitNss={'mpiwg':'http://www.mpiwg-berlin.mpg.de/namespace'})[0].value |
|
|
|
|
|
|
|
lstr=slaveurl+'fn='+fn+'&_id='+ref+'&_pagelink=%s///%s/%s/%s'%(ref2,selectionNodeIndex,linkid,'target') |
|
lstr+="&_links="+urllib.quote(url) |
|
|
|
else: |
|
for link in dom.xpath(xp,explicitNss={'mpiwg':'http://www.mpiwg-berlin.mpg.de/namespace'}): |
|
fn=link.xpath("mpiwg:source/@filename",explicitNss={'mpiwg':'http://www.mpiwg-berlin.mpg.de/namespace'})[0].value |
|
if urlparse.urlparse(urllib.unquote(fn))[0]=="http": # fn ist eine url |
|
return urllib.unquote(fn) # dann gibt diese zurueck |
|
|
|
ref=link.xpath("mpiwg:source/@refid",explicitNss={'mpiwg':'http://www.mpiwg-berlin.mpg.de/namespace'})[0].value |
|
|
|
ref2=link.xpath("mpiwg:source/mpiwg:pagelink/@refid",explicitNss={'mpiwg':'http://www.mpiwg-berlin.mpg.de/namespace'})[0].value |
|
selectionNodeIndex=link.xpath("mpiwg:source/mpiwg:pagelink/@selectionNodeIndex",explicitNss={'mpiwg':'http://www.mpiwg-berlin.mpg.de/namespace'})[0].value |
|
|
|
lstr=masterurl+'fn='+fn+'&_id='+ref+'&_pagelink=%s///%s/%s/%s'%(ref2,selectionNodeIndex,linkid,'source') |
|
lstr+="&_links="+urllib.quote(url) |
|
return lstr |
|
|
|
def addLinksUrl(self,txt,url): |
|
"""add reference to links to url""" |
|
ret=[] |
|
dom=NonvalidatingReader.parseUri(url) |
|
textDom=NonvalidatingReader.parseString(txt) |
|
|
|
#find ids in txt |
|
ids=textDom.xpath("//*[@id]") |
|
|
|
for textid in ids: |
|
xp="//mpiwg:link[mpiwg:source/@refid='%s']"%textid.xpath("@id")[0].value |
|
for link in dom.xpath(xp,explicitNss={'mpiwg':'http://www.mpiwg-berlin.mpg.de/namespace'}): |
|
ref2=link.xpath("mpiwg:source/mpiwg:pagelink/@refid",explicitNss={'mpiwg':'http://www.mpiwg-berlin.mpg.de/namespace'})[0].value |
|
selectionNodeIndex=link.xpath("mpiwg:source/mpiwg:pagelink/@selectionNodeIndex",explicitNss={'mpiwg':'http://www.mpiwg-berlin.mpg.de/namespace'})[0].value |
|
linkid=link.xpath("@id")[0].value |
|
ret.append('%s///%s/%s/%s'%(ref2,selectionNodeIndex,linkid,'source')) |
|
|
|
xp="//mpiwg:link[mpiwg:target/@refid='%s']"%textid.xpath("@id")[0].value |
|
for link in dom.xpath(xp,explicitNss={'mpiwg':'http://www.mpiwg-berlin.mpg.de/namespace'}): |
|
ref2=link.xpath("mpiwg:target/mpiwg:pagelink/@refid",explicitNss={'mpiwg':'http://www.mpiwg-berlin.mpg.de/namespace'})[0].value |
|
selectionNodeIndex=link.xpath("mpiwg:target/mpiwg:pagelink/@selectionNodeIndex",explicitNss={'mpiwg':'http://www.mpiwg-berlin.mpg.de/namespace'})[0].value |
|
linkid=link.xpath("@id")[0].value |
|
ret.append('%s///%s/%s/%s'%(ref2,selectionNodeIndex,linkid,'target')) |
|
|
|
|
|
return ret |
|
|
|
def addLinks(self,txt,url="http://127.0.0.1:8080/HFQP/linkCreator/getCollectionXML?collection=commentary2"): |
|
"""add links to a page from xml linkfile""" |
|
|
|
dom=NonvalidatingReader.parseUri(url) |
|
textDom=NonvalidatingReader.parseString(txt) |
|
|
|
#find ids in txt |
|
ids=textDom.xpath("//*[@id]") |
|
masterurl=dom.xpath("//mpiwg:masterurl/@ref",explicitNss={'mpiwg':'http://www.mpiwg-berlin.mpg.de/namespace'})[0].value |
|
slaveurl=dom.xpath("//mpiwg:slaveurl/@ref",explicitNss={'mpiwg':'http://www.mpiwg-berlin.mpg.de/namespace'})[0].value |
|
|
|
#check now if there are in the link file |
|
for textid in ids: |
|
xp="//mpiwg:link[mpiwg:source/@refid='%s']"%textid.xpath("@id")[0].value |
|
for link in dom.xpath(xp,explicitNss={'mpiwg':'http://www.mpiwg-berlin.mpg.de/namespace'}): |
|
fn=link.xpath("mpiwg:target/@filename",explicitNss={'mpiwg':'http://www.mpiwg-berlin.mpg.de/namespace'})[0].value |
|
print fn |
|
if urlparse.urlparse(urllib.unquote(fn))[0]=="http": # fn ist eine url |
|
lstr=urllib.unquote(fn) # dann gibt diese zurueck |
|
else: |
|
try: |
|
ref=link.xpath("mpiwg:target/@refid",explicitNss={'mpiwg':'http://www.mpiwg-berlin.mpg.de/namespace'})[0].value |
|
|
|
ref2=link.xpath("mpiwg:target/mpiwg:pagelink/@refid",explicitNss={'mpiwg':'http://www.mpiwg-berlin.mpg.de/namespace'})[0].value |
|
selectionNodeIndex=link.xpath("mpiwg:target/mpiwg:pagelink/@selectionNodeIndex",explicitNss={'mpiwg':'http://www.mpiwg-berlin.mpg.de/namespace'})[0].value |
|
linkid=link.xpath("@id")[0].value |
|
lstr=slaveurl+'fn='+fn+'&_id='+ref+'&_pagelink=%s///%s/%s/%s'%(ref2,selectionNodeIndex,linkid,'target') |
|
lstr+="&_links="+urllib.quote(url) |
|
except: |
|
lstr="" |
|
node=self.createLinkNode(lstr,textDom) |
|
textid.parentNode.insertBefore(node,textid) |
|
|
|
|
|
xp="//mpiwg:link[mpiwg:target/@refid='%s']"%textid.xpath("@id")[0].value |
|
for link in dom.xpath(xp,explicitNss={'mpiwg':'http://www.mpiwg-berlin.mpg.de/namespace'}): |
|
fn=link.xpath("mpiwg:source/@filename",explicitNss={'mpiwg':'http://www.mpiwg-berlin.mpg.de/namespace'})[0].value |
|
if urlparse.urlparse(urllib.unquote(fn))[0]=="http": # fn ist eine url |
|
lstr=urllib.unquote(fn) # dann gibt diese zurueck |
|
else: |
|
|
|
ref=link.xpath("mpiwg:source/@refid",explicitNss={'mpiwg':'http://www.mpiwg-berlin.mpg.de/namespace'})[0].value |
|
|
|
ref2=link.xpath("mpiwg:source/mpiwg:pagelink/@refid",explicitNss={'mpiwg':'http://www.mpiwg-berlin.mpg.de/namespace'})[0].value |
|
selectionNodeIndex=link.xpath("mpiwg:source/mpiwg:pagelink/@selectionNodeIndex",explicitNss={'mpiwg':'http://www.mpiwg-berlin.mpg.de/namespace'})[0].value |
|
linkid=link.xpath("@id")[0].value |
|
lstr=masterurl+'fn='+fn+'&_id='+ref+'&_pagelink=%s///%s/%s/%s'%(ref2,selectionNodeIndex,linkid,"source") |
|
lstr+="&_links="+urllib.quote(url) |
|
|
|
node=self.createLinkNode(lstr,textDom) |
|
textid.parentNode.insertBefore(node,textid) |
|
|
|
|
|
|
|
strio = StringIO() |
|
PrettyPrint(textDom,strio) |
|
xmlstr = strio.getvalue() |
|
|
|
return xmlstr |
|
|
|
|
|
|
|
def getPageLex(self,_pn="1",_id=None,_caching=None,_links=None,_showall="no",_displaylinks="yes"): |
"""getpage mit lexikalischer analyse und xslt transform |
"""getpage mit lexikalischer analyse und xslt transform |
if _caching=yes dann wird die lwxikalisch analysierte seite in einem cache abgespeichert |
if _caching=yes dann wird die lwxikalisch analysierte seite in einem cache abgespeichert |
""" |
""" |
|
def encode(hash): |
|
ret=[] |
|
for x in hash.keys(): |
|
value=hash[x] |
|
|
|
if type(value) is ListType: |
|
for z in value: |
|
ret.append("%s=%s"%(x,z)) |
|
else: |
|
ret.append("%s=%s"%(x,value)) |
|
return "&".join(ret) |
|
|
|
|
|
|
if not _caching: |
if not _caching: |
_caching=self.caching |
_caching=self.caching |
Line 263 class ECHO_xslt(ECHO_pageTemplate,ECHO_l
|
Line 431 class ECHO_xslt(ECHO_pageTemplate,ECHO_l
|
fn=self.REQUEST['fn'] |
fn=self.REQUEST['fn'] |
|
|
if not _id: |
if not _id: |
|
|
fromCache=self.cache.retrieveObject(fn,_pn) |
fromCache=self.cache.retrieveObject(fn,_pn) |
|
|
if fromCache and _caching=="yes": |
if fromCache and _caching=="yes": |
Line 276 class ECHO_xslt(ECHO_pageTemplate,ECHO_l
|
Line 445 class ECHO_xslt(ECHO_pageTemplate,ECHO_l
|
else: |
else: |
txt=self.tagLex(id=_id) |
txt=self.tagLex(id=_id) |
|
|
|
if _showall=="yes": |
|
params=cgi.parse_qs(self.REQUEST['QUERY_STRING']) |
|
|
|
params['_pagelink']=self.addLinksUrl(txt,url=_links) |
|
params['_showall']='no' |
|
|
|
print self.absolute_url()+"?"+encode(params) |
|
self.REQUEST.RESPONSE.redirect(self.absolute_url()+"/getPageLex?"+encode(params)) |
|
|
|
|
xsl=self.xslt() |
xsl=self.xslt() |
|
|
xsltproc=Processor() |
xsltproc=Processor() |
Line 286 class ECHO_xslt(ECHO_pageTemplate,ECHO_l
|
Line 465 class ECHO_xslt(ECHO_pageTemplate,ECHO_l
|
stylesheet = InputSource.DefaultFactory.fromString(xsl) |
stylesheet = InputSource.DefaultFactory.fromString(xsl) |
xsltproc.appendStylesheet(stylesheet) |
xsltproc.appendStylesheet(stylesheet) |
tmp=xsltproc.run(document) |
tmp=xsltproc.run(document) |
|
|
|
if _links and (_displaylinks=='yes'): |
|
_links=urllib.unquote(_links) |
|
tmp=self.addLinks(tmp,url=_links) |
|
|
#bugfix for digilib images which doesn't accept & |
#bugfix for digilib images which doesn't accept & |
tmp=tmp.replace("&","&") |
tmp=tmp.replace("&","&") |
|
|
|
|
return tmp[0:] |
return tmp[0:] |
|
|
def getTextInput(self): |
def getTextInput(self): |
Line 328 class ECHO_xslt(ECHO_pageTemplate,ECHO_l
|
Line 514 class ECHO_xslt(ECHO_pageTemplate,ECHO_l
|
xmlt,self.baseUri=self.getTextInput() |
xmlt,self.baseUri=self.getTextInput() |
|
|
#get the text from cache, if existing |
#get the text from cache, if existing |
|
try: |
fromCache=self.cache.retrieveObject(self.baseUri,"-1") |
fromCache=self.cache.retrieveObject(self.baseUri,"-1") |
|
except: |
|
fromCache=None |
if fromCache and _caching=="yes": |
if fromCache and _caching=="yes": |
|
|
txt = fromCache |
txt = fromCache |
Line 338 class ECHO_xslt(ECHO_pageTemplate,ECHO_l
|
Line 527 class ECHO_xslt(ECHO_pageTemplate,ECHO_l
|
|
|
self.cache.storeObject(self.baseUri,"-1",txt) |
self.cache.storeObject(self.baseUri,"-1",txt) |
|
|
|
|
dom=NonvalidatingReader.parseString(txt,self.baseUri) |
dom=NonvalidatingReader.parseString(txt,self.baseUri) |
|
|
#pb should have a namespache |
#pb should have a namespache |
Line 351 class ECHO_xslt(ECHO_pageTemplate,ECHO_l
|
Line 541 class ECHO_xslt(ECHO_pageTemplate,ECHO_l
|
#suche wieviele pb for der id |
#suche wieviele pb for der id |
|
|
|
|
idpb=dom.xpath("//*[@id='%s']/preceding::node()/mpiwg:pb"%_id,explicitNss={'html':'http://test.de','mpiwg':'http://www.mpiwg-berlin.mpg.de/namespace'}) |
idpb=dom.xpath("//*[@id='%s']/preceding::node()/mpiwg:pb"%_id,explicitNss={'html':'http://www.w3.org/1999/xhtml','mpiwg':'http://www.mpiwg-berlin.mpg.de/namespace'}) |
if len(idpb)==0: |
if len(idpb)==0: |
idpb=dom.xpath("//*[@id='%s']/preceding::node()/pb"%_id) |
idpb=dom.xpath("//*[@id='%s']/preceding::node()/pb"%_id) |
|
|
if len(idpb)==0: |
if len(idpb)==0: |
k=0 |
k=0 |
for node in dom.xpath("//*[@id='%s']//preceding::node()"%_id,explicitNss={'html':'http://test.de','mpiwg':'http://www.mpiwg-berlin.mpg.de/namespace'}): |
for node in dom.xpath("//*[@id='%s']//preceding::node()"%_id,explicitNss={'html':'http://www.w3.org/1999/xhtml','mpiwg':'http://www.mpiwg-berlin.mpg.de/namespace'}): |
if getattr(node,'tagName',"")=="mpiwg:pb": |
if getattr(node,'tagName',"")=="mpiwg:pb": |
k+=1 |
k+=1 |
else: |
else: |
k=len(idpb) |
k=len(idpb) |
|
#pn=k-1 #-1 wegen Seitenzahlzaehlung startet mit 0 |
pn=k-1 #-1 wegen Seitenzahlzaehlung startet mit 0 |
pn=k-1 #-1 wegen Seitenzahlzaehlung startet mit 0 |
|
|
if pn > len(pbs): |
if pn > len(pbs): |
if REQUEST: |
if REQUEST: |
return "Sorry, pagenumber %s does not exit"%(pn+1) |
return "Sorry, pagenumber %s does not exit"%(pn+1) |
Line 387 class ECHO_xslt(ECHO_pageTemplate,ECHO_l
|
Line 577 class ECHO_xslt(ECHO_pageTemplate,ECHO_l
|
if parent: |
if parent: |
parent[0].removeChild(node) |
parent[0].removeChild(node) |
except: |
except: |
zLOG.LOG("ECHO_Resource (getAccessRightMD)", zLOG.INFO,"%s (%s)"%sys.exc_info()[0:2]) |
logger("ECHO_Resource (getAccessRightMD)", logging.INFO,"%s (%s)"%sys.exc_info()[0:2]) |
strio = StringIO() |
strio = StringIO() |
PrettyPrint(dom,strio) |
PrettyPrint(dom,strio) |
xmlstr = strio.getvalue() |
xmlstr = strio.getvalue() |
Line 445 def manage_addECHO_xslt(self, id, label,
|
Line 635 def manage_addECHO_xslt(self, id, label,
|
u = "%s/%s" % (u, quote(id)) |
u = "%s/%s" % (u, quote(id)) |
REQUEST.RESPONSE.redirect(u+'/manage_main') |
REQUEST.RESPONSE.redirect(u+'/manage_main') |
return '' |
return '' |
|
|