1: """
2: This module contains extensions which where originally made for the VLP.
3: """
4: from OFS.Cache import Cacheable
5: from Products.PageTemplates.PageTemplateFile import PageTemplateFile
6: from Products.PageTemplates.PageTemplate import PageTemplate
7: from Products.PageTemplates.ZopePageTemplate import ZopePageTemplate
8: from OFS.Image import File
9: import xml.dom.minidom
10: import urllib
11: import xmlrpclib
12: import vlp_xmlhelpers
13: import sys
14: import os
15: from stat import *
16: from types import *
17: from Globals import package_home
18: import transaction
19: import Acquisition
20:
21: from Products.ECHO_content.ECHO_collection import *
22: from vlp_xmlhelpers import *
23: try:
24: from Products.zogiLib import zogiLib
25: except:
26: print "Zogilib not installed, VLP_resource will not work"
27:
28:
def lemmatize(str):
    """Wrap every space-separated word of ``str`` in a ``<w>`` element.

    The words are produced by splitting on a single space and are joined
    with a single space again, so the word separation of the input is kept.

    The previous implementation called ``.join()`` on a list, which does not
    exist, so it raised AttributeError on every call.  It also created an
    XML-RPC proxy for the dictionary service that was only truth-tested and
    never queried; that proxy was removed (NOTE(review): truth-testing a
    Python 2 ``xmlrpclib.ServerProxy`` is presumably forwarded to the remote
    server as a method call -- confirm before re-introducing it).

    :param str: text to mark up.
    :returns: the text with each word wrapped as ``<w>word</w>``.
    """
    words = str.split(" ")
    return " ".join(["<w>%s</w>" % word for word in words])
36:
37:
38:
39:
def makeXML(str):
    """Return ``str`` as an XML document.

    If ``str`` already parses as XML it is returned unchanged.  Otherwise
    every ampersand that is followed by a space is escaped as ``&amp;`` and
    the text is wrapped in a ``<page>`` element with an XML declaration and
    an XHTML doctype.  The wrapped result is not parsed again, so it may
    still be malformed for other reasons.

    :param str: text or XML markup.
    :returns: ``str`` itself, or the wrapped and escaped document.
    """
    try:
        xml.dom.minidom.parseString(str)
    except Exception:
        # A bare "& " is the usual reason plain text is not well-formed; the
        # replacement has to produce the entity, otherwise it is a no-op.
        str = str.replace("& ", "&amp; ")
        return """<?xml version="1.0" encoding="utf-8" ?><!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd"><page>
%s
</page>""" % str
    return str
50:
51:
def checkXMLfrag(str):
    """Check that ``str`` is usable as an XML fragment and return it.

    The fragment is wrapped in a ``<txt>`` element (with XML declaration and
    XHTML doctype) and parsed.  If that fails, every ampersand followed by a
    space is escaped as ``&amp;`` and the check is repeated.

    :param str: candidate XML fragment.
    :returns: the fragment, possibly with escaped ampersands.
    :raises: whatever the parser raises if the fragment is still not
        well-formed after escaping.
    """
    xmltempl = """<?xml version="1.0" encoding="utf-8" ?><!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
<txt>%s</txt>"""

    try:
        xml.dom.minidom.parseString(xmltempl % utf8ify(str))
        return str
    except Exception:
        # The replacement has to yield the entity; replacing "& " by itself
        # would make the second parse fail in exactly the same way.
        str = str.replace("& ", "&amp; ")

    # Second attempt; an error here is deliberately propagated to the caller.
    xml.dom.minidom.parseString(xmltempl % utf8ify(str))
    return str
66:
67:
68:
def getText(nodelist):
    """Concatenate the ``data`` of all text nodes in ``nodelist``.

    Nodes whose ``nodeType`` is not ``TEXT_NODE`` are ignored; child nodes
    are not descended into.
    """
    pieces = [item.data for item in nodelist
              if item.nodeType == item.TEXT_NODE]
    return "".join(pieces)
76:
class sendMailForm(ZopePageTemplate):
    """Page template that mails submitted form content to configured recipients.

    Instance attributes set by ``main_config`` (and by the add function):
    ``toAddrs`` (list of recipient addresses), ``mailServer`` (SMTP host) and
    ``subjectAdd`` (optional prefix for the subject line).
    """

    meta_type = "sendMailForm"

    _default_content_fn = os.path.join(package_home(globals()), 'vlp', 'sendMail_template.zpt')

    manage_options = ZopePageTemplate.manage_options + (
        {'label': 'Main Config', 'action': 'main_configForm'},
    )

    main_configForm = PageTemplateFile(
        'vlp/changeSendMailForm', globals())

    def _cleanAddresses(self, addresses):
        # Strip surrounding whitespace (notably the "\r" left over from
        # CRLF-separated form input) and drop empty entries.
        return [addr.strip() for addr in addresses if addr.strip()]

    def _headerValue(self, value):
        # Remove every CR/LF, not only leading/trailing ones, so that a
        # submitted value can never start an additional header line.
        return value.replace("\r", "").replace("\n", "").strip("\t")

    def main_config(self, toAddrs, mailServer, subjectAdd=None, RESPONSE=None):
        """Store the mail configuration.

        ``toAddrs`` is a text with one recipient address per line,
        ``mailServer`` the SMTP host and ``subjectAdd`` an optional subject
        prefix.  Redirects to ``manage_main`` when ``RESPONSE`` is given.
        """
        self.toAddrs = self._cleanAddresses(toAddrs.splitlines())
        self.mailServer = mailServer
        self.subjectAdd = subjectAdd
        if RESPONSE:
            RESPONSE.redirect('manage_main')

    def sendForm(self, fromaddr, subject, content, nextPage="index_html", RESPONSE=None):
        """Mail ``content`` to the configured recipients.

        ``fromaddr`` and ``subject`` are used as header values and are
        stripped of line breaks first.  The configured ``subjectAdd`` is
        prepended to the subject when it is set.  Redirects to ``nextPage``
        when ``RESPONSE`` is given.  SMTP errors are propagated.
        """
        # Local import: the module has no visible top-level import of smtplib.
        import smtplib

        fromaddr = self._headerValue(fromaddr)
        subject = self._headerValue(subject)
        toaddrs = self._cleanAddresses(self.toAddrs)

        # Only add the prefix when one is configured; formatting None would
        # put the literal text "None" into the subject.
        subjectAdd = getattr(self, 'subjectAdd', None)
        if subjectAdd:
            subject = "%s %s" % (self._headerValue(subjectAdd), subject)

        msg = ("From: %s\r\nSubject: %s\r\nTo: %s\r\n\r\n"
               % (fromaddr, subject, ", ".join(toaddrs)))
        msg = msg + content

        server = smtplib.SMTP(self.mailServer)
        try:
            server.sendmail(fromaddr, toaddrs, msg)
        finally:
            # Close the connection even if sending failed.
            server.quit()

        if RESPONSE:
            RESPONSE.redirect(nextPage)
116:
manage_addSendMailFormForm = PageTemplateFile(
    'vlp/addSendMailForm', globals(), __name__='manage_addSendMailFormFrom')

from urllib import quote


def manage_addSendMailForm(self, id, toAddrs, mailServer, title=None, text=None, subjectAdd=None,
                           REQUEST=None, submit=None):
    """Add a sendMailForm page template with optional file content.

    ``toAddrs`` is a text with one recipient address per line; surrounding
    whitespace (e.g. the "\\r" of CRLF form input) and empty lines are
    dropped.  Without ``REQUEST`` the new object is created from ``text``
    and returned.  With ``REQUEST`` an uploaded ``file`` is used as content
    if present, the browser is redirected to the management screen of the
    container (or of the new object for "Add and Edit") and '' is returned.
    """
    toAddrsList = [addr.strip() for addr in toAddrs.splitlines() if addr.strip()]
    id = str(id)

    def configure(ob):
        # Settings shared by both creation paths.
        if title:
            ob.pt_setTitle(title)
        setattr(ob, 'toAddrs', toAddrsList)
        setattr(ob, 'mailServer', mailServer)
        setattr(ob, 'subjectAdd', subjectAdd)

    if REQUEST is None:
        self._setObject(id, sendMailForm(id, text))
        ob = getattr(self, id)
        configure(ob)
        return ob

    upload = REQUEST.form.get('file')
    headers = getattr(upload, 'headers', None)
    if headers is None or not upload.filename:
        zpt = sendMailForm(id)
    else:
        zpt = sendMailForm(id, upload, headers.get('content_type'))

    self._setObject(id, zpt)

    try:
        u = self.DestinationURL()
    except AttributeError:
        u = REQUEST['URL1']

    if submit == " Add and Edit ":
        u = "%s/%s" % (u, quote(id))

    configure(getattr(self, id))
    REQUEST.RESPONSE.redirect(u + '/manage_main')
    return ''
163:
164:
class VLP_collectionFolder(Folder):
    """Folder class used for the folders inside the collection."""

    meta_type = "VLP_collectionFolder"
168:
class VLP_essay(Folder):
    """Folder holding the pages of a VLP essay.

    Pages are the contained 'DTML Document' and 'File' objects, ordered by
    their ids.
    """

    meta_type = "VLP_essay"

    manage_options = Folder.manage_options + (
        {'label': 'Main Config', 'action': 'ConfigVLP_essayForm'},
        {'label': 'Generate Essay Template', 'action': 'generateEssayTemplateHTML'},
    )

    def __init__(self, id, title, label):
        """init"""
        self.id = id
        self.title = title
        self.label = label

    def _pageCount(self):
        # Number of page objects, as used by the paging helpers below.
        return len(self.ZopeFind(self, obj_metatypes=['DTML Document', 'File']))

    def _fileText(self, fileObj):
        # Content of a File object as one string.  ``data`` is either a
        # plain string or the head of a chain of chunks linked by ``next``
        # (same traversal as originally inlined in getPageXMLfrag).
        chunks = []
        data = fileObj.data
        while data is not None:
            if isinstance(data, str):
                chunks.append(data)
                break
            chunks.append(data.data)
            data = data.next
        return "".join(chunks)

    def content_html(self, type='collection'):
        """Render the content template for ``type``.

        An object named ``<type>_template`` reachable from here is used if
        present, otherwise the standard ECHO template from the file system.
        """
        templateId = type + "_template"
        if hasattr(self, templateId):
            return getattr(self, templateId)()

        zptPath = os.path.join(package_home(globals()), 'zpt',
                               'ECHO_%s_template_standard.zpt' % type)
        pt = PageTemplateFile(zptPath).__of__(self)
        pt.content_type = "text/html"
        return pt()

    def ConfigVLP_essayForm(self):
        """Render the configuration form."""
        pt = PageTemplateFile(os.path.join(package_home(globals()), 'vlp', 'ChangeVLP_essay.zpt')).__of__(self)
        return pt()

    def ChangeVLP_essay(self, title, label, description, RESPONSE=None):
        """Change title, label and description of the essay."""
        self.title = title
        self.label = label
        self.description = description

        if RESPONSE is not None:
            RESPONSE.redirect('manage_main')

    def index_html(self):
        """Show the rendered essay.

        Uses the object 'essayTemplate.html' if it exists, otherwise the
        essay template from the file system.
        """
        if hasattr(self, 'essayTemplate.html'):
            return getattr(self, 'essayTemplate.html')()

        pt = PageTemplateFile(os.path.join(package_home(globals()), 'vlp', 'essay_template.zpt')).__of__(self)
        pt.content_type = "text/html"
        return pt()

    def generateEssayTemplateHTML(self, RESPONSE=None):
        """Create the default 'essayTemplate.html' inside this essay.

        Returns "already exists!" if the object is already there; otherwise
        redirects to ``manage_main`` when ``RESPONSE`` is given.
        """
        if hasattr(self, 'essayTemplate.html'):
            return "already exists!"

        zt = ZopePageTemplate('essayTemplate.html')
        self._setObject('essayTemplate.html', zt)
        default_content_fn = os.path.join(package_home(globals()),
                                          'vlp/essay_template.zpt')
        # Close the file explicitly instead of leaving it to the garbage
        # collector.
        templateFile = open(default_content_fn)
        try:
            text = templateFile.read()
        finally:
            templateFile.close()
        zt.pt_edit(text, 'text/html')

        if RESPONSE is not None:
            RESPONSE.redirect('manage_main')

    def getPageList(self):
        """returns sorted list of (id,object) of page objects"""
        pages = self.objectItems(['DTML Document', 'File'])
        # Order by id only, as the former cmp-based comparison did.
        return sorted(pages, key=lambda item: item[0])

    def getPageXMLfrag(self, pageNum=None, pageId=None, pageObj=None):
        """returns XML fragment of page with id

        The page is selected by ``pageNum`` (1-based index into
        getPageList), by ``pageId`` or passed directly as ``pageObj``;
        ``pageId`` wins over ``pageNum`` if both are given.
        """
        xml = None

        if pageNum is not None:
            pageObj = self.getPageList()[int(pageNum) - 1][1]

        if pageId is not None:
            pageObj = getattr(self, pageId, None)

        if pageObj is not None:
            if pageObj.meta_type == 'File':
                txt = self._fileText(pageObj)
            else:
                # not a File object... perhaps it is executable
                txt = "" + pageObj()

            xml = checkXMLfrag(txt)

        return unicodify(xml)

    def getPage(self, pagenum):
        """Return essay page number ``pagenum`` (1-based) rendered as HTML.

        Pages whose id starts with "." are not counted.
        """
        found = self.ZopeFind(self, obj_metatypes=['DTML Document', 'File'])
        pages = [page for page in found if not (page[1].getId()[0] == ".")]
        pages.sort(key=lambda page: page[0])

        pageObj = pages[int(pagenum) - 1][1]
        if pageObj.meta_type == 'File':
            # Large File objects keep their data as a chain of chunks, so
            # the content has to be assembled before it can be parsed.
            txt = self._fileText(pageObj)
        else:
            txt = pageObj()
        return self.xml2html(makeXML(txt), quote="no")

    # Table cell linking to the page after ``pagenum``; None on the last page.
    def nextPage(self, pagenum, url):
        following = int(pagenum) + 1
        if following <= self._pageCount():
            retstr = url + "?p=" + str(following)
            # The opening <td> tag used to be left unclosed.
            return """<td align="right"><a href="%s">next</a></td>""" % retstr

    # Table cell linking to the page before ``pagenum``; None on the first page.
    def previousPage(self, pagenum, url):
        preceding = int(pagenum) - 1
        if preceding > 0:
            retstr = url + "?p=" + str(preceding)
            # The opening <td> tag used to be left unclosed.
            return """<td align="left"><a href="%s">previous</a></td>""" % retstr

    # URL of the page after ``pagenum``; None on the last page.
    def nextURL(self, pagenum, url):
        following = int(pagenum) + 1
        if following <= self._pageCount():
            return url + "?p=" + str(following)

    # URL of the last page.
    def lastURL(self, pagenum, url):
        return url + "?p=" + str(self._pageCount())

    # URL of the page before ``pagenum``; None on the first page.
    def previousURL(self, pagenum, url):
        preceding = int(pagenum) - 1
        if preceding > 0:
            return url + "?p=" + str(preceding)
344:
345:
def manage_addVLP_essayForm(self):
    """Render the form for adding a VLP_essay."""
    formPath = os.path.join(package_home(globals()), 'vlp', 'AddVLP_essay.zpt')
    form = PageTemplateFile(formPath).__of__(self)
    return form()
350:
def manage_addVLP_essay(self, id, title, label, RESPONSE=None):
    """Add a VLP_essay with the given id, title and label to this container.

    Redirects to ``manage_main`` when ``RESPONSE`` is given.
    """
    essay = VLP_essay(id, title, label)
    self._setObject(id, essay)

    if RESPONSE is None:
        return
    RESPONSE.redirect('manage_main')
359:
360:
class VLP_encyclopaedia(VLP_essay):
    """Essay whose pages can be (re)loaded from an uploaded XML file."""

    meta_type = "VLP_encyclopaedia"

    manage_options = VLP_essay.manage_options + (
        {'label': 'Load File', 'action': 'loadNewFileForm'},
    )

    def loadNewFileForm(self):
        """Render the form for uploading a new XML file."""
        pt = PageTemplateFile(os.path.join(package_home(globals()), 'vlp', 'VLP_newfile.zpt')).__of__(self)
        return pt()

    def loadNewFile(self, RESPONSE=None):
        """Read the uploaded file and store its text as page objects.

        The upload is taken from ``REQUEST['fileupload']`` and converted
        with ``vlp_xmlhelpers.proj2hash``.  The 'text' entries are joined
        with spaces, encoded as UTF-8 and split at ``<pb/>``.  Part number n
        (starting at 1) is stored in the File object ``page00n.xml``, which
        is updated if it exists and created otherwise.
        """
        fileupload = self.REQUEST['fileupload']
        if fileupload:
            filedata = fileupload.read()

            argv = vlp_xmlhelpers.proj2hash(self, filedata)
            # str.join replaces string.join; the separator is the same
            # single space and no module-level ``string`` name is needed.
            textsStr = " ".join(argv['text']).encode('utf-8')

            for index, text in enumerate(textsStr.split("<pb/>")):
                pageName = 'page%03d.xml' % (index + 1)
                pages = self.ZopeFind(self, obj_ids=[pageName])
                if pages:
                    pages[0][1].update_data(text)
                else:
                    zt = File(pageName, pageName, text, content_type="text/plain")
                    self._setObject(pageName, zt)

        if RESPONSE is not None:
            RESPONSE.redirect('manage_main')
402:
403:
def manage_addVLP_encycForm(self):
    """Render the form for adding a VLP_encyclopaedia."""
    formPath = os.path.join(package_home(globals()), 'vlp', 'AddVLP_encyc.zpt')
    form = PageTemplateFile(formPath).__of__(self)
    return form()
408:
def manage_addVLP_encyc(self, id, title, label, RESPONSE=None):
    """Add a VLP_encyclopaedia with the given id, title and label.

    Redirects to ``manage_main`` when ``RESPONSE`` is given.
    """
    encyclopaedia = VLP_encyclopaedia(id, title, label)
    self._setObject(id, encyclopaedia)

    if RESPONSE is None:
        return
    RESPONSE.redirect('manage_main')
417:
class VLP_subcollection(ECHO_collection):
    """Subcollection of elements."""

    meta_type = "VLP_subcollection"

    # Table of contents of this subcollection: the matching entry for the
    # subcollection itself followed by the entries whose volumeid matches
    # this id, both read from vl_literature.
    # NOTE(review): the queries are built by string formatting from ``type``
    # and the object id; make sure neither can carry untrusted input.
    def getVLPSubcollectionToc(self, type):
        # different ordering depending on the type
        sort = "startpages"
        if type == "(Collection)":
            sort = "shortreference"

        # content of journals is also displayed if not online
        online = "AND online = 1"
        if type == "(JournalVolume)":
            online = ""

        # NOTE(review): the listing has lost its indentation; this call is
        # taken to be unconditional, which overrides the ordering chosen
        # above -- confirm against the original file.
        sort = self.collectionSort(type)

        itemQuery = ("""SELECT * FROM vl_literature
WHERE volumeid ~ '%s\\\\M' """ % self.getId()
                     + """ %s AND not referenceType='%s' """ % (online, type)
                     + """ORDER BY """ + sort)
        tocQuery = ("""SELECT * FROM vl_literature
WHERE reference = '%s' """ % self.getId()
                    + """AND online = 1 AND referenceType='%s' """ % type
                    + """ORDER BY """ + sort)

        item = list(self.ZSQLSimpleSearch(itemQuery))
        tocItem = list(self.ZSQLSimpleSearch(tocQuery))

        return tocItem + item

    def checkForFrontMatter(self, item):
        """Test whether front matter exists.

        True only if ``item`` equals this object's id and this object
        contains an object with that same id.
        """
        if item == self.getId():
            return bool(self.ZopeFind(self, obj_ids=[self.getId()]))
        return False

    def generateSubCollectionFromDB(self):
        """Create an ECHO link for every vl_literature row of this volume."""
        rows = self.ZSQLSimpleSearch("select * from vl_literature where volumeid like '%s'" % self.id)
        for row in rows:
            manage_addECHO_link(self, row.reference, row.titlerefdisplay, row.titlerefdisplay)

    def index_html(self):
        """Render the subcollection.

        Uses the object 'subCollection_template.html' if it exists,
        otherwise the template from the file system.
        """
        if not hasattr(self, 'subCollection_template.html'):
            return zptFile(self, 'vlp/subCollection_template.zpt')()
        return getattr(self, 'subCollection_template.html')()
477:
478:
# Add a VLP_subcollection with the given id, title and label to ``self`` and
# redirect to manage_main when a RESPONSE is given.
def manage_addVLP_subCollection(self, id, title, label, RESPONSE=None):
    subcollection = VLP_subcollection(id, title, label)
    self._setObject(id, subcollection)

    if RESPONSE is None:
        return
    RESPONSE.redirect('manage_main')
485:
486: from zope.publisher.interfaces import IPublishTraverse
487: from zope.interface import implements
488: from zope.publisher.interfaces import NotFound
489: #from zope.app import zapi
490: from zope.component import queryMultiAdapter
491: try:
492: from ZPublisher.BaseRequest import DefaultPublishTraverse
493: except:
494: pass
495:
class VLP_collection(ECHO_collection, Acquisition.Explicit):
    """VLP-specific extension of the collection.

    Literature objects ("litNNN") are stored in nested folders named after
    the first 2, 4 and 6 digits of the zero-padded 8-digit number; URL
    traversal to a "lit..." name is redirected to the stored object.

    NOTE(review): the source listing has lost its indentation; the nesting
    of some statements below is reconstructed from context -- compare with
    the original file before relying on edge-case behaviour.
    """

    implements(IPublishTraverse)

    meta_type = "VLP_collection"
    manage_options = ECHO_collection.manage_options + (
        {'label': 'Change Path', 'action': 'VLP_path_configForm'},
        {'label': 'Update Library', 'action': 'updateCollection'},
        {'label': 'Update Metadata', 'action': 'updateCollectionMD'},
    )

    # Last URL segments for which a "lit..." name is resolved to the stored
    # literature object (besides a segment that itself starts with "lit").
    _litViewNames = ("index_html", "index_meta", "getTitle",
                     "getMetaDataLink", "hasTranscription", "transcription")

    # Folder ids for a literature name: prefixes of the zero-padded number.
    # Returns None if the name is not "lit" followed by a number.
    def _folderIdsFor(self, fileName):
        if not fileName[0:3] == "lit":
            return None
        try:
            restName = "%08d" % int(fileName[3:])
        except ValueError:
            return None
        return (restName[0:2], restName[0:4], restName[0:6])

    # Look up the object stored for ``fileName`` in the nested folders.
    # Returns None if the name is malformed or nothing is stored.
    def findObjFromLitName(self, fileName):
        folderIds = self._folderIdsFor(fileName)
        if folderIds is None:
            # Also covers names such as "literature", which used to raise
            # ValueError from int() during URL traversal.
            logging.error("findObjFromLitName wrong filename: %s" % fileName)
            return None

        current = self
        for folderId in folderIds:
            obj = getattr(current, folderId, None)
            if not obj:  # subfolder does not exist
                return None
            current = obj

        return getattr(current, fileName, None)

    def publishTraverse(self, request, name):
        """change the traversal if literature object"""
        actual_url = request['ACTUAL_URL']
        lastActual = actual_url.split("/")[-1]
        logging.debug("pub_trav:" + actual_url)

        if not name.startswith("lit"):
            # not a literature object: default traversal
            return DefaultPublishTraverse(self, request).publishTraverse(request, name)

        # Redirect to the stored object only if the lit folder itself or one
        # of its listed methods is requested.
        if lastActual.startswith("lit") or lastActual in self._litViewNames:
            ob = self.findObjFromLitName(name)
            if not ob:
                return "LIt not found"
            logging.debug("request:" + repr(ob))
            request.response.setStatus(200)
            return ob

        # otherwise continue traversal at the parent
        return self.aq_parent

    def getAllRessources(self):
        """Return [id, absolute_url] for every VLP_resource below this collection."""
        found = self.ZopeFind(self, obj_metatypes=['VLP_resource'], search_sub=1)
        return [[resId, res.absolute_url()] for resId, res in found]

    def generateSubCollections(self, errorsTXT="", forceUpdate=False, RESPONSE=None):
        """Create or refresh a subcollection for every container entry in vl_literature.

        An existing subcollection is deleted and recreated when its title or
        label differs from the database.  If a directory of the same name
        exists below ``vlp_basis`` a front matter VLP_resource is created
        inside the subcollection and its index file is (re)built.

        Progress and errors are written to the response; the error text is
        appended to ``errorsTXT`` and returned.
        """
        logging.debug("generateSubCollections")
        founds = self.ZSQLSimpleSearch("select * from vl_literature where referencetype in ('(Edited Book)','(Book)','(Collection)','(JournalVolume)','(Generic Container)')")

        if RESPONSE is not None:
            RESPONSE.setHeader('Content-Type', 'text/html')
            self.REQUEST.RESPONSE.write("<h2>Create Subcollections</h2>\n")

        for found in founds:
            # Defined before the try block so that the error handler can
            # always refer to it.
            litid = "unknown"
            try:
                litid = str(found.reference)
                foundCol = self.findObjFromLitName(litid)
                if foundCol:
                    col = foundCol
                    logging.debug("generateSubCollections: subcollection %s exists (%s)" % (repr(col), found.reference))
                    logging.debug(repr([col.title, found.titlerefdisplay, col.label, found.titlerefdisplay]))
                    if (unicodify(col.title) != unicodify(found.titlerefdisplay)) or (unicodify(col.label) != unicodify(found.titlerefdisplay)):
                        # subcollection seems to have changed
                        logging.debug("generateSubCollections: subcollection has changed, recreating!")
                        col.aq_parent.manage_delObjects([col.getId()])
                        manage_addVLP_subCollection(self.getOrCreateFolderForFile(litid), litid, found.titlerefdisplay, found.titlerefdisplay)
                else:
                    logging.debug("generateSubCollections: creating new subcollection %s" % found.reference)
                    manage_addVLP_subCollection(self.getOrCreateFolderForFile(litid), litid, found.titlerefdisplay, found.titlerefdisplay)

                # check for images of the same name on the server (front matter)
                if os.path.exists(os.path.join(self.vlp_basis, litid)):
                    logging.debug("generateSubCollections: found frontmatter in %s" % litid)
                    obj = self.findObjFromLitName(litid)
                    if not self.ZopeFind(obj, obj_ids=[litid]):
                        metalink = self.REQUEST['URL1'] + "/" + litid + "/" + litid + "/index_meta"
                        newObj = VLP_resource(litid, '', metalink, litid, litid, litid, 'generated', 'book', '', '', '', '', '', '')
                        obj._setObject(litid, newObj)

                    genObj = getattr(obj, litid)
                    genObj.createIndexFile(forceUpdate=forceUpdate)

                if RESPONSE is not None:
                    self.REQUEST.RESPONSE.write("<p>%s</p>\n" % litid)
                logging.debug("<p>%s</p>\n" % litid)

            except Exception:
                error = sys.exc_info()[0:2]
                logging.error("generateSubCollections: ERROR in %s" % litid)
                if RESPONSE is not None:
                    RESPONSE.write("<p>(ERROR updateII(%s): %s %s TXT: %s)\n</p>" % (litid, error[0], error[1], sys.exc_info()[2]))
                    RESPONSE.write("<p>(ERROR (%s): %s %s)</p>\n" % (litid, error[0], error[1]))
                logging.error("generateSubCollections: %s %s" % error)
                self.REQUEST.RESPONSE.write("(ERROR (%s): %s %s)\n" % (litid, repr(error[0]), repr(error[1])))
                errorsTXT += "<p>ERROR: No subcollection of %s (ERROR: %s %s)</p>\n" % (litid, error[0], error[1])
                errorsTXT += "<p>No subcollection of %s " % litid + "(ERROR: %s %s)</p>" % error

        return errorsTXT

    def VLP_path_configForm(self):
        """Render the form for changing the base path."""
        pt = PageTemplateFile(os.path.join(package_home(globals()), 'vlp', 'ChangeVLPPath.zpt')).__of__(self)
        return pt()

    def VLP_path_config(self, path, RESPONSE=None):
        """Set the base path (``vlp_basis``) of the collection."""
        self.vlp_basis = path
        if RESPONSE is not None:
            RESPONSE.redirect('manage_main')

    # Return the innermost folder in which ``fileName`` lives or should
    # live, creating missing folders.  Returns None for malformed names.
    def getOrCreateFolderForFile(self, fileName):
        folderIds = self._folderIdsFor(fileName)
        if folderIds is None:
            logging.error("getOrCreateFolder wrong filename: %s" % fileName)
            return None

        current = self
        for folderId in folderIds:
            obj = getattr(current, folderId, None)
            if not obj:
                current._setObject(folderId, VLP_collectionFolder(folderId))
                obj = getattr(current, folderId)
            current = obj

        return current

    # Commit the current transaction, trying up to ``attempts`` times.
    def _commitWithRetry(self, attempts=5):
        for attempt in range(attempts):
            try:
                transaction.get().commit()
                return True
            except Exception:
                logging.error("Commit: %s" % attempt)
        return False

    def changeOrAddResources(self, forceUpdate=False, RESPONSE=None):
        """Create or update a resource for every "lit..." entry below ``vlp_basis``.

        New resources are created in their nested folder, the index file of
        each resource is (re)built and ``pageSizeSum`` is updated.  The
        transaction is committed after every 100 directory entries.

        Progress is written to ``RESPONSE`` if given.  Returns the collected
        error messages as HTML text.
        """
        errorsTXT = "<h2>Errors</h2>"
        if RESPONSE is not None:
            RESPONSE.setHeader('Content-Type', 'text/html')
            RESPONSE.write("<html><body>")

        files = os.listdir(self.vlp_basis)
        i = 0
        for fileName in files:
            if i < 100:
                i += 1
            else:
                i = 0
                self._commitWithRetry()
                # RESPONSE is optional; writing without this check failed
                # for calls without a response object.
                if RESPONSE is not None:
                    RESPONSE.write("<p>committed</p>")

            if fileName[0:3] != "lit":
                continue

            metalink = self.REQUEST['URL1'] + "/" + fileName + "/index_meta"

            # the folder where fileName lives or should live
            folder = self.getOrCreateFolderForFile(fileName)
            if not folder:  # folder gave an error
                continue
            try:
                if not hasattr(folder, fileName):
                    # create new resource
                    logging.debug("updateCollection: new %s" % fileName)
                    if RESPONSE is not None:
                        RESPONSE.write("<p>new: %s</p>\n" % fileName)
                    logging.debug("new: %s \n" % fileName)
                    newObj = VLP_resource(fileName, '', metalink, fileName, fileName, fileName, 'generated', 'book', '', '', '', '', '', '')

                    folder._setObject(fileName, newObj)

                if RESPONSE is not None:
                    RESPONSE.write("<p>got: %s " % fileName)

                genObj = getattr(folder, fileName)
                logging.debug("got: %s " % fileName)

                logging.debug("updateCollection: inspecting %s" % fileName)
                # create index
                if hasattr(genObj, 'createIndexFile'):
                    try:
                        logging.debug("updateCollection: creating index for %s" % fileName)
                        msg = genObj.createIndexFile(forceUpdate=forceUpdate)
                        if msg and RESPONSE is not None:
                            RESPONSE.write(msg)
                    except Exception:
                        error = sys.exc_info()[0:2]
                        if RESPONSE is not None:
                            RESPONSE.write("(ERROR Update(%s): %s %s %s) " % (fileName, error[0], error[1], sys.exc_info()[2]))
                        errorsTXT += "<p>ERROR creating index for %s " % fileName + "(ERROR: %s %s)</p>\n" % error

                # update pageSizeSum for subcollections
                if genObj.meta_type == "VLP_subcollection":
                    if RESPONSE is not None:
                        RESPONSE.write(" is subcollection")
                    logging.debug("updateCollection: %s is subcollection" % fileName)
                    genObj.pageSizeSum = getattr(genObj, fileName).getPageSizeSum()
                else:
                    genObj.pageSizeSum = genObj.getPageSizeSum()

                if RESPONSE is not None:
                    RESPONSE.write("</p>\n")

            except Exception:
                error = sys.exc_info()[0:2]
                logging.error("updateCollection: ERROR in %s (%s %s)" % (fileName, error[0], error[1]))
                if RESPONSE is not None:
                    RESPONSE.write("(ERROR updateII(%s): %s %s %s) " % (fileName, error[0], error[1], sys.exc_info()[2]))
                errorsTXT += "<p>File not created:%s (ERROR: %s %s)</p>\n" % (fileName, error[0], error[1])
        return errorsTXT

    def updateCollection(self, forceUpdate=True, RESPONSE=None):
        """Read the directories below the base path and create or update the matching objects.

        Runs changeOrAddResources and generateSubCollections and writes the
        collected error text to ``RESPONSE`` if given.
        """
        errorsTXT = ""
        errorsTXT += self.changeOrAddResources(forceUpdate, RESPONSE)
        errorsTXT += self.generateSubCollections(forceUpdate=forceUpdate, RESPONSE=RESPONSE)
        errorsTXT += "\n"
        if RESPONSE is not None:
            RESPONSE.write(errorsTXT)
            RESPONSE.write("</body></html>")

    def updateCollectionMD(self, RESPONSE=None):
        """Refresh metadata and title of every "lit..." resource below the base path."""
        for fileName in os.listdir(self.vlp_basis):
            if fileName[0:3] != "lit":
                continue
            # Resources are stored in nested folders by
            # getOrCreateFolderForFile; fall back to that location when the
            # object is not a direct attribute of the collection.
            genObj = getattr(self, fileName, None)
            if genObj is None:
                genObj = self.findObjFromLitName(fileName)
            if genObj is None:
                logging.error("updateCollectionMD: no object for %s" % fileName)
                continue
            genObj.copyIndex_meta2echo_resource()
            genObj.generate_title()

        if RESPONSE is not None:
            RESPONSE.redirect('manage_main')

    def copyFullTextsFromDB(self, RESPONSE=None):
        """Copy the full texts from the database into the VLP_resources found here.

        With ``RESPONSE`` the per-resource messages are written to it,
        followed by "END"; otherwise the concatenated messages are returned.
        """
        ress = self.ZopeFind(self, obj_metatypes=['VLP_resource'])
        messages = []
        for res in ress:
            tmp = res[1].copyTranscriptionFromDB()
            messages.append(tmp)

            if RESPONSE:
                RESPONSE.write(tmp + "\n")

        if not RESPONSE:
            return "".join(messages)
        RESPONSE.write("END\n")
785:
786:
def manage_addVLP_collectionForm(self):
    """Render the form for adding a VLP_collection."""
    formPath = os.path.join(package_home(globals()), 'vlp', 'AddVLP_collectionForm.zpt')
    form = PageTemplateFile(formPath).__of__(self)
    return form()
791:
792:
793:
def manage_addVLP_collection(self, id, title, label, description, contentType, responsible, weight, sortfield, path, coords="", secondaryLinkTitle="", secondaryLink="", credits=None, RESPONSE=None, imageTag="", bgcolour=""):
    """Add a VLP_collection to this container.

    The arguments are passed on to the VLP_collection constructor; ``path``
    is stored as the attribute ``path`` of the new object.  Redirects to
    ``manage_main`` when ``RESPONSE`` is given.
    """
    # bgcolour used to be replaced by a hard-coded "" here, so the value
    # given by the caller was silently dropped.
    newObj = VLP_collection(id, title, label, description, contentType, responsible, credits, weight, sortfield, coords,
                            secondaryLinkTitle=secondaryLinkTitle, secondaryLink=secondaryLink,
                            imageTag=imageTag, bgcolour=bgcolour)

    self._setObject(id, newObj)
    # NOTE(review): the collection methods read ``vlp_basis`` (set through
    # VLP_path_config), not ``path`` -- confirm whether ``vlp_basis`` should
    # be initialised here as well.
    setattr(newObj, 'path', path)

    if RESPONSE is not None:
        RESPONSE.redirect('manage_main')
805:
806:
807:
808: class VLP_resource(ECHO_resource,Cacheable):
809: """VLP spezifische Erweiterung"""
810:
811: meta_type="VLP_resource"
812:
813: def _p_resolveConflict(self,oldstate,savedstate,newstate):
814: logging.debug("updateCollection: Have to resolve conflict!")
815: return newstate
816:
817: #vlp_basis="/mpiwg/online/permanent/vlp"
818:
819:
820:
821: referencetypes=[]
822:
823: manage_options=ECHO_resource.manage_options+Cacheable.manage_options+(
824: {'label':'Update Index','action':'createIndexFile'},
825: {'label':'Reset MetaLink','action':'resetMetaLink'},
826: {'label':'Generate Title','action':'generate_title'},
827: {'label':'Generate Library Template','action':'generateLibraryTemplateHTML'},
828: )
829:
def getMetaDataLink(self):
    """Return the link to the metadata: the object's URL plus '/index_meta'."""
    base = self.absolute_url()
    return base + "/index_meta"
833:
834:
def getTitle(self):
    """Return the title of the resource.

    The title is read from the first vl_literature row whose reference
    equals this object's id; it is also written to the debug log.
    """
    query = """select title from vl_literature where reference= \'%s\' """ % self.getId()
    rows = self.ZSQLSimpleSearch(query)
    title = rows[0].title
    logging.debug(title)
    return title
840:
# Determine the directory that holds the page images of this resource.
# Candidates are the sub-directories 'pageimg', 'pages' and 'pagesHi' of
# <vlp_basis>/<resourceID>; 'pageimg' is checked before 'pages'.
# Returns a directory path, or None after logging "no images".
# NOTE(review): this listing has lost its indentation, so the nesting of the
# 'pagesHi' block and the `if` that the final `else` belongs to cannot be
# determined from here -- check the original file before changing the logic.
841: def getImagePath(self):
842: """Pfad zu den Images"""
843: path=None
844:
# Prefer 'pageimg'; use 'pages' only if 'pageimg' is not a directory.
845: if os.path.isdir(os.path.join(self.vlp_basis,self.resourceID,'pageimg')):
846: path= os.path.join(self.vlp_basis,self.resourceID,'pageimg')
847: elif os.path.isdir(os.path.join(self.vlp_basis,self.resourceID,'pages')):
848: path = os.path.join(self.vlp_basis,self.resourceID,'pages')
849: # workaround in some cases there seem to be no pictures in pages
850:
851: if os.path.isdir(os.path.join(self.vlp_basis,self.resourceID,'pagesHi')):
852:
853:
854: pagesHi = os.listdir(os.path.join(self.vlp_basis,self.resourceID,'pagesHi'))
# With no directory chosen so far, 'pagesHi' is returned right away.
855: if path is None:
856: return os.path.join(self.vlp_basis,self.resourceID,'pagesHi')
857:
858: pages = os.listdir(path)
859:
# Only when 'pagesHi' has more entries than the chosen directory are the
# image files (.tiff, .tif, .jpg; case-insensitive) of both counted.
860: if len (pagesHi) > len(pages):
861:
862: countHi=0
863: for p in pagesHi:
864: dat,ext = os.path.splitext(p)
865: if ext.lower() in [".tiff",".tif",".jpg"]:
866: countHi+=1
867: count=0
868: for p in pages:
869: dat,ext = os.path.splitext(p)
870: if ext.lower() in [".tiff",".tif",".jpg"]:
871: count+=1
872:
# 'pagesHi' replaces the chosen directory if it holds more image files.
873: if countHi > count:
874: path=os.path.join(self.vlp_basis,self.resourceID,'pagesHi')
875:
876: logging.error("pages < pagesHi: %s"%self.resourceID)
# NOTE(review): the statement guarded by this test calls os.listdir(path)
# while path is None, which would presumably fail if it were ever reached;
# this looks like a leftover of an earlier version -- confirm.
877: if path is None:
878:
879:
880: if len (os.listdir(os.path.join(self.vlp_basis,self.resourceID,'pagesHi'))) > len(os.listdir(path)):
881:
882:
883:
884: path=os.path.join(self.vlp_basis,self.resourceID,'pagesHi')
885: logging.error("pages < pagesHi: %s"%self.resourceID)
886: else:
887:
888: logging.error("no images: %s"%self.resourceID)
889: return None
890:
891: return path
892:
893:
def transcription(self):
    """Show the rendered transcription.

    Uses the object 'libraryTranscriptionTemplate.html' if it exists,
    otherwise the transcription template from the file system.
    """
    customId = 'libraryTranscriptionTemplate.html'
    if not hasattr(self, customId):
        zptPath = os.path.join(package_home(globals()), 'vlp', 'library_transcriptionTemplate.zpt')
        template = PageTemplateFile(zptPath).__of__(self)
        template.content_type = "text/html"
        return template()
    return getattr(self, customId)()
903:
904:
905:
def identifyMediaType(self):
    """Determine the media type from the VLP database and store it in ``self.mediaType``.

    Returns "generic" if the resource has no vl_literature entry, "audio"
    or "video" for the reference types "Audio" and "Film", and "image" for
    every other entry (books and photographs are assumed).
    """
    query = 'select * from vl_literature where reference=\'' + self.resourceID + '\' order by id'
    founds = self.ZSQLSimpleSearch(query)

    if (not founds) or (len(founds) == 0):
        # not in the database: assume generic
        mediaType = "generic"
    else:
        byReferenceType = {"Audio": "audio", "Film": "video"}
        mediaType = byReferenceType.get(founds[0].referencetype, "image")

    self.mediaType = mediaType
    return self.mediaType
922:
def getMediaType(self, cached=False):
    """Return the media type.

    The stored value is used only if ``cached`` is true and a non-empty
    ``mediaType`` exists; in every other case it is read from the database
    again through identifyMediaType.
    """
    haveStored = hasattr(self, 'mediaType') and not (self.mediaType == "")
    if not (cached and haveStored):
        self.identifyMediaType()

    return self.mediaType
930:
931:
932:
933:
def copyTranscriptionFromDB(self):
    """Copy the transcription of this resource from the database into a full text object.

    All vl_transcript rows whose source is this ``resourceID`` are joined
    into one ``<text>`` document with one ``<page><pb/>...</page>`` element
    per row (empty for rows without transcript).  The document is written
    to the first contained ECHO_fullText object, or to a newly created one
    with the id 'fulltext'.

    :returns: "FT: <id>" if rows were found, otherwise "no: <id>".
    """
    founds = self.ZSQLSimpleSearch('select * from vl_transcript where source=\'' + self.resourceID + '\' order by id')

    if not founds:
        return "no: %s" % self.getId()

    parts = ["""<?xml version="1.0" encoding="utf-8"?>
<text>"""]
    for found in founds:
        parts.append("<page><pb/>" + (found.transcript or "") + "</page>")
    parts.append("</text>")
    fullText = self.unicodify("".join(parts))

    existing = self.ZopeFind(self, obj_metatypes=['ECHO_fullText'])
    if existing:
        existing[0][1].pt_edit(fullText, 'text/xml')
    else:
        # The object id has to be the string 'fulltext'; the bare name
        # ``id`` used here before refers to the builtin function.
        self._setObject('fulltext', ECHO_fullText('fulltext', ''))

        try:
            getattr(self, 'fulltext').pt_edit(fullText.encode('utf-8', 'ignore'), 'text/xml')
        except Exception:
            # Fallback kept from the original for text that was decoded as
            # latin-1 although it is UTF-8.
            getattr(self, 'fulltext').pt_edit(fullText.encode('latin-1').decode('utf-8'), 'text/xml')

    return "FT: %s" % self.getId()
972:
def hasTranscription(self):
    """Tell whether a 'fulltext' object is available.

    If there is none yet, the transcription is first copied from the
    database and the check is repeated.
    """
    if hasattr(self, 'fulltext'):
        return True

    self.copyTranscriptionFromDB()
    # still missing after the copy means there is no transcription
    return hasattr(self, 'fulltext')
982:
def resetMetaLink(self, all="no", RESPONSE=None):
    """Reset the metalink to the standard value '<absolute_url>/index_meta'.

    With ``all="yes"`` the link is always reset.  Otherwise it is reset only
    if it looks like a generated one, i.e. its last two path segments are
    this object's id and 'index_meta' (useful after a server change).
    Returns "done" when ``RESPONSE`` is given.
    """
    if all == "yes":
        reset = True
    else:
        segments = self.metalink.split("/")
        # heuristic: only change generic metadata links
        reset = (len(segments) > 1
                 and segments[-1] == "index_meta"
                 and segments[-2] == self.getId())

    if reset:
        self.metalink = self.absolute_url() + "/index_meta"

    if RESPONSE:
        return "done"
994:
def show(self):
    """Render this resource with the template matching its media type.

    Video and audio use 'libraryMovieTemplate'; everything else uses
    'libraryTemplate'.  If the request carries a file name in 'p', a
    redirect to the corresponding page number (plus 'mk' if present) is
    issued before the template is rendered.
    """
    if self.getMediaType() in ('video', 'audio'):
        return self.getVLPTemplate('libraryMovieTemplate')()

    # for now all other media types are mapped onto the libraryTemplate
    request = self.REQUEST
    fileName = request.get('p', None)
    if fileName:  # only when parameter p is present
        query = "pn=%s" % self.file2page(fileName)
        marker = request.get('mk', None)
        if marker:
            query = query + "&mk=%s" % marker
        request.RESPONSE.redirect(request['URL'] + '?' + query)

    return self.getVLPTemplate('libraryTemplate')()
1015:
def getVLPTemplate(self, name):
    # Return the template called *name*: an attribute "<name>.html" of this
    # object takes precedence; otherwise vlp/<name>.zpt from the package
    # directory is loaded, wrapped in this object's context and served as
    # text/html.
    # NOTE: documented with comments instead of a docstring so the method
    # stays docstring-less as in the original (Zope 2 only publishes
    # objects that have a docstring).
    localName = name + ".html"
    if not hasattr(self, localName):
        templateFile = os.path.join(package_home(globals()), 'vlp', name + '.zpt')
        template = PageTemplateFile(templateFile).__of__(self)
        template.content_type = "text/html"
        return template

    return getattr(self, localName)
1024:
def index_html(self):
    """Default view: make sure request parameter 'ws' is set, then show the resource."""
    request = self.REQUEST
    if not request.has_key("ws"):
        # default value used when the caller did not pass one
        request.form["ws"] = "1.5"

    return self.show()
1032:
def generateLibraryTemplateHTML(self, RESPONSE=None):
    """Create the standard 'libraryTemplate.html' page template in this object.

    The template text is read from 'vlp/library_template.zpt' in the
    package directory.  Returns "already exists!" when the object already
    has such an attribute; otherwise redirects to 'manage_main' if RESPONSE
    is given.
    """
    if hasattr(self, 'libraryTemplate.html'):
        return "already exists!"

    default_content_fn = os.path.join(package_home(globals()),
                                      'vlp/library_template.zpt')
    # Read the default content first and close the file explicitly, so no
    # handle is left open and no empty template is added when reading fails.
    fh = open(default_content_fn)
    try:
        text = fh.read()
    finally:
        fh.close()

    zt = ZopePageTemplate('libraryTemplate.html')
    self._setObject('libraryTemplate.html', zt)
    zt.pt_edit(text, 'text/html')

    if RESPONSE is not None:
        RESPONSE.redirect('manage_main')
1049:
1050:
def index_meta(self, RESPONSE=None):
    """Render the packaged 'index_meta.zpt' template in the context of this object.

    The rendered text is returned; when RESPONSE is given, its
    Content-Type header is set to text/xml.
    """
    templateFile = os.path.join(package_home(globals()), 'vlp', 'index_meta.zpt')
    template = PageTemplateFile(templateFile).__of__(self)
    template.content_type = "text/xml"
    rendered = template.pt_render()

    if RESPONSE:
        RESPONSE.setHeader("Content-Type", "text/xml")
    return rendered
def file2page(self, p):
    """Translate the file name *p* into its page number.

    The rendered 'index.xml' of this object is searched for a <page> whose
    'file' attribute equals *p*, optionally followed by "lo" or "hi".
    Returns that page's 'nr' attribute, or 0 when no page matches.
    """
    rendered = getattr(self, 'index.xml').pt_render()
    dom = xml.dom.minidom.parseString(rendered)

    for page in dom.getElementsByTagName('page'):
        fileName = page.getAttribute('file')
        # file names with the suffix lo or hi are equivalent
        if p in (fileName, "%slo" % fileName, "%shi" % fileName):
            return page.getAttribute('nr')

    return 0
1078:
def getPageSizeSum(self):
    """Sum up the file sizes of the high and low resolution page directories.

    Looks at <vlp_basis>/<resourceID>/pages and .../pagesLo and returns the
    tuple (bytes in pages, bytes in pagesLo, number of files).  The file
    count is taken from 'pagesLo' when that directory can be listed,
    otherwise from 'pages', otherwise it is 0.  Any error while reading a
    directory makes its byte sum 0.
    """

    def _dirSize(subdir):
        # Return (total bytes, file names); names is None when the
        # directory could not be listed at all.
        names = None
        try:
            path = os.path.join(self.vlp_basis, self.resourceID, subdir)
            names = os.listdir(path)
            total = 0
            for name in names:
                total += os.stat(os.path.join(path, name)).st_size
        except Exception:
            # best effort: a missing or unreadable directory counts as empty
            total = 0
        return total, names

    hi, hiNames = _dirSize('pages')      # size of hi resolution
    lo, loNames = _dirSize('pagesLo')    # size of lo resolution

    if loNames is not None:
        files = loNames
    elif hiNames is not None:
        files = hiNames
    else:
        files = []

    return (hi, lo, len(files))
1107:
1108:
def getPageWeights(self):
    """Return the average page sizes in kBytes as a tuple (hi, lo).

    Reads the attribute ``pageSizeSum`` -- a tuple (hi bytes, lo bytes,
    page count); (0, 0, 1) is used when the attribute is missing.  A page
    count of 0 yields (0, 0) instead of a ZeroDivisionError.
    """
    res = getattr(self, 'pageSizeSum', (0, 0, 1))
    count = res[2]
    if not count:
        # no pages were counted: there is no meaningful average
        return (0, 0)

    # explicit floor division keeps the integer result
    return (res[0] // (1024 * count), res[1] // (1024 * count))
1114:
1115:
1116:
def dir2index(self):
    """List the image directory as (label, file name without extension) pairs.

    Stores the result of getImagePath() in ``imagePathFull`` and its last
    path component in ``imagePath``.  Entries starting with '.' or ':' and
    entries whose first four characters are 'Icon' are skipped; the rest
    is returned sorted by file name.  The label is
    "<first character>: <rest of the name without extension>".

    Returns None when no image path is available.
    """
    excludeNames = ['Icon']

    def calculateName(fileName):
        # e.g. "p0001.jpg" -> "p: 0001"
        return "%s: %s" % (fileName[0], os.path.splitext(fileName[1:])[0])

    self.imagePathFull = self.getImagePath()
    if self.imagePathFull is None:
        # Check before splitting: the former test on the split result could
        # never be true and a missing path raised AttributeError instead.
        self.imagePath = None
        return None
    self.imagePath = self.imagePathFull.split("/")[-1]

    names = os.listdir(self.imagePathFull)
    names.sort()
    return [(calculateName(name), os.path.splitext(name)[0])
            for name in names
            if name[0] not in ('.', ':') and name[0:4] not in excludeNames]
1141:
1142:
def firstPage(self, url=None):
    """Return the HTML for the "first page" navigation element.

    When request parameter 'pn' is "1" (or missing) only the image is
    returned; otherwise the image is wrapped in a link to page 1 that keeps
    the current 'ws' value (default '1').  *url* is not used.
    """
    from xml.sax.saxutils import quoteattr

    if self.REQUEST.get('pn', '1') == "1":  # first page already: no a tag
        return """<img src="/images/first.gif" alt="first" width="14" height="14" border="0"><br>first"""

    ws = self.REQUEST.get('ws', '1')
    target = self.REQUEST['URL'] + "?pn=1&ws=%s" % ws
    # 'ws' comes from the request: quote and escape the attribute value so
    # it cannot break out of the href.
    return """<a href=%s>
<img src="/images/first.gif" alt="first" width="14" height="14" border="0"><br>first
</a>
""" % quoteattr(target)
1154:
def lastPage(self, url=None):
    """Return the HTML for the "last page" navigation element.

    The number of pages is taken from readIndexFile(url).  On the last
    page, or when there is at most one page, only the image is returned;
    otherwise the image is wrapped in a link to the last page that keeps
    the current 'ws' value (default '1').
    """
    from xml.sax.saxutils import quoteattr

    pages = self.readIndexFile(url)
    # an empty index counts as zero pages (formerly 'ln' stayed unbound)
    ln = len(pages or [])

    if ln <= 1 or self.REQUEST.get('pn') == str(ln):  # last or only page: no a tag
        return """<img src="/images/last.gif" alt="last" width="14" height="14" border="0"><br>last"""

    ws = self.REQUEST.get('ws', '1')
    target = self.REQUEST['URL'] + "?pn=%s&ws=%s" % (ln, ws)
    # 'ws' comes from the request: quote and escape the attribute value so
    # it cannot break out of the href.
    return """<a href=%s>
<img src="/images/last.gif" alt="last" width="14" height="14" border="0"><br>last
</a>
""" % quoteattr(target)
1170:
def prevPage(self, url=None):
    """Return the HTML for the "previous page" navigation element.

    The current page is request parameter 'pn' (1 when missing or not a
    number).  On the first page only the image is returned; otherwise the
    image is wrapped in a link to the preceding page that keeps the
    current 'ws' value (default '1').  *url* is not used.
    """
    from xml.sax.saxutils import quoteattr

    try:
        current = int(self.REQUEST.get('pn', '1'))
    except (TypeError, ValueError):
        # same fallback as getFileName uses for an unusable 'pn'
        current = 1

    nn = current - 1
    if nn < 1:  # first page: no a tag
        return """<img src="/images/lisePrev.gif" alt="prev" width="14" height="14" border="0"><br>prev"""

    ws = self.REQUEST.get('ws', '1')
    target = self.REQUEST['URL'] + "?pn=%s&ws=%s" % (nn, ws)
    # 'ws' comes from the request: quote and escape the attribute value so
    # it cannot break out of the href.
    return """<a href=%s>
<img src="/images/lisePrev.gif" alt="prev" width="14" height="14" border="0"><br>prev
</a>
""" % quoteattr(target)
1185:
def nextPage(self, url=None):
    """Return the HTML for the "next page" navigation element.

    The number of pages is taken from readIndexFile(url), the current page
    from request parameter 'pn' (1 when missing or not a number).  When
    there is no following page only the image is returned; otherwise the
    image is wrapped in a link to the following page that keeps the
    current 'ws' value (default '1').
    """
    from xml.sax.saxutils import quoteattr

    pages = self.readIndexFile(url)
    # an empty index counts as zero pages (formerly 'ln' stayed unbound)
    ln = len(pages or [])

    try:
        current = int(self.REQUEST.get('pn', '1'))
    except (TypeError, ValueError):
        # same fallback as getFileName uses for an unusable 'pn'
        current = 1

    nn = current + 1
    if (nn > ln) or (ln == 1):  # last page: no a tag
        return """<img src="/images/liseNext.gif" alt="next" width="14" height="14" border="0"><br>next"""

    ws = self.REQUEST.get('ws', '1')
    target = self.REQUEST['URL'] + "?pn=%s&ws=%s" % (nn, ws)
    # 'ws' comes from the request: quote and escape the attribute value so
    # it cannot break out of the href.
    return """<a href=%s>
<img src="/images/liseNext.gif" alt="next" width="14" height="14" border="0"><br>next
</a>
""" % quoteattr(target)
1202:
1203:
def readIndexFile(self, url=None):
    """Return the page list described by the index file.

    Without *url* this object's own 'index.xml' is rendered and parsed;
    with *url* the XML is fetched from that address through
    ECHO_helpers.urlopen.  Every <page> element yields one tuple
    (value of 'nr', text of the element, value of 'file').

    When caching is enabled and a list is cached under the index URL, the
    cached list is returned; a freshly built list is stored in the cache.
    """
    # The cache key is the URL of the index.  It used to be bound only for
    # the default case, so any call with an explicit url raised a NameError.
    if url:
        indexUrl = url
    else:
        indexUrl = self.absolute_url() + "/index.xml"

    if self.ZCacheable_isCachingEnabled():
        result = self.ZCacheable_get(view_name=indexUrl)
        if result is not None:
            # Got a cached value.
            return result

    if url:
        fh = ECHO_helpers.urlopen(indexUrl)
        dom = xml.dom.minidom.parse(fh)
    else:
        xmlTxt = getattr(self, 'index.xml')()
        dom = xml.dom.minidom.parseString(xmlTxt)

    pagelist = []
    for page in dom.getElementsByTagName('page'):
        text = getText(page.childNodes)
        pagelist.append((page.getAttribute('nr'), text, page.getAttribute('file')))

    self.ZCacheable_set(pagelist, view_name=indexUrl)
    return pagelist
1235:
def getFileName(self):
    """Return the file name of the page selected by request parameter 'pn'.

    'pn' is a 1-based page number; a missing or non-numeric value and
    values below 1 select the first page.  The name is the third field of
    the matching readIndexFile() entry.  Raises IndexError when 'pn' is
    larger than the number of pages.
    """
    try:
        pn = int(self.REQUEST.get('pn', '1'))
    except (TypeError, ValueError):
        pn = 1

    if pn < 1:
        # a negative index would silently pick a page counted from the end
        pn = 1

    return self.readIndexFile()[pn - 1][2]
1244:
def createIndexFile(self, forceUpdate=False, RESPONSE=None):
    """Create the 'index.xml' page template or refresh an existing one.

    An existing index is only rewritten when forceUpdate is set or the
    image directory is not older than the index.  In the other cases
    "index is up to date" is returned, or "CREATE INDEX FILE NOT POSSIBLE"
    when no image path is available.  After writing, the transaction is
    committed and, if RESPONSE is given, a redirect to 'manage_main' is
    issued.
    """
    logging.debug("createindexfile of %s"%self.id)

    if not hasattr(self, 'index.xml'):
        # no index yet: add an empty template that is filled below
        zt = ZopePageTemplate('index.xml')
        self._setObject('index.xml', zt)
    else:
        zt = getattr(self, 'index.xml')
        if not forceUpdate:
            # find out whether the directory is newer than the index
            path = self.getImagePath()
            if path is None:
                return "CREATE INDEX FILE NOT POSSIBLE"
            imgdir = os.path.join(path)
            dirtime = os.path.getmtime(imgdir)
            zttime = zt.bobobase_modification_time()
            logging.debug("createindexfile: dir %s of %s index of %s"%(imgdir,dirtime,zttime))
            if dirtime < zttime:
                # nothing to do
                logging.debug("createindexfile: dir %s older than index"%(imgdir))
                return "index is up to date"

    # render the packaged index template and store the result as index text
    templateFile = os.path.join(package_home(globals()), 'vlp', 'index_template.zpt')
    rendered = PageTemplateFile(templateFile).__of__(self)()
    zt.pt_edit(rendered, 'text/xml')
    transaction.get().commit()

    if RESPONSE is not None:
        RESPONSE.redirect('manage_main')
1279:
1280:
def manage_addVLP_resourceForm(self):
    """Render the form for adding a VLP resource."""
    formFile = os.path.join(package_home(globals()), 'vlp', 'AddVLP_resourceForm.zpt')
    form = PageTemplateFile(formFile).__of__(self)
    return form()
1285:
1286:
1287:
def manage_addVLP_resource(self,id,title,label,description,responsible,link,metalink,weight,resourceID=None,contentType=None,renderingType=None,credits=None,coords=None,RESPONSE=None):
    """Create a VLP_resource from the given values and add it to this container.

    An empty *metalink* is replaced by "<container url>/<id>/index_meta".
    If RESPONSE is given, a redirect to 'manage_main' is issued afterwards.
    """
    if metalink == '':
        # no link given: point to the new object's own index_meta
        metalink = "/".join((self.absolute_url(), id, "index_meta"))

    resource = VLP_resource(id, link, metalink, resourceID, title, label,
                            description, contentType, renderingType,
                            responsible, credits, weight, coords)
    self._setObject(id, resource)

    if RESPONSE is not None:
        RESPONSE.redirect('manage_main')
1301:
# FreeBSD-CVSweb <freebsd-cvsweb@FreeBSD.org>