File:  [Repository] / cdli / cdli_files.py
Revision 1.87: download - view: text, annotated - select for diffs - revision graph
Wed Oct 1 15:58:11 2008 UTC (15 years, 9 months ago) by dwinter
Branches: MAIN
CVS tags: HEAD
Incomplete - # 17: Erstellen großer Baskets
https://itgroup.mpiwg-berlin.mpg.de:8080/tracs/cdli/ticket/17

    1: """CDLI extensions of the filearchive"""    
    2: from Products.versionedFile.extVersionedFile import *
    3: from Products.ZCatalog.CatalogPathAwareness import CatalogAware
    4: from tempfile import mkstemp,mkdtemp    
    5: import os.path
    6: import os
    7: from types import *
    8: import urlparse
    9: import urllib
   10: import cgi
   11: from OFS.OrderedFolder import OrderedFolder
   12: from OFS.SimpleItem import SimpleItem
   13: import time
   14: from OFS.Folder import manage_addFolder
   15: import re
   16: from AccessControl import ClassSecurityInfo
   17: from Acquisition import Implicit
   18: from Globals import Persistent
   19: from threading import Thread
   20: from ZPublisher.HTTPRequest import HTTPRequest
   21: from ZPublisher.HTTPResponse import HTTPResponse
   22: from ZPublisher.BaseRequest import RequestContainer
   23: import threading
   24: from BTrees.OOBTree import OOBTree, OOTreeSet
   25: import logging
   26: import transaction
   27: import copy
   28: import codecs
   29: import sys
   30: from BTrees.IOBTree import IOBTree 
   31: import cdliSplitter
   32: from sets import Set
   33: import md5
   34: from DownloadBasket import DownloadBasketFinallyThread
   35:                                        
   36: def makelist(mySet):
   37:         x = list(mySet)
   38:         x.sort()
   39:         return x
   40:     
   41: def unicodify(s):
   42:     """decode str (utf-8 or latin-1 representation) into unicode object"""
   43:     if not s:
   44:         return u""
   45:     if isinstance(s, str):
   46:         try:
   47:             return s.decode('utf-8')
   48:         except:
   49:             return s.decode('latin-1')
   50:     else:
   51:         return s
   52: 
   53: def utf8ify(s):
   54:     """encode unicode object or string into byte string in utf-8 representation.
   55:        assumes string objects to be utf-8"""
   56:     if not s:
   57:         return ""
   58:     if isinstance(s, str):
   59:         return s
   60:     else:
   61:         return s.encode('utf-8')
   62: 
   63: def formatAtfHtml(l):
   64:     """escape special ATF characters for HTML"""
   65:     if not l:
   66:         return ""
   67: 
   68:     # replace &
   69:     l = l.replace('&','&')
   70:     # replace angular brackets
   71:     l = l.replace('<','&lt;')
   72:     l = l.replace('>','&gt;')
   73:     return l
   74: 
   75: def formatAtfLineHtml(l, nolemma=True):
   76:     """format ATF line for HTML"""
   77:     if not l:
   78:         return ""
   79: 
   80:     if nolemma:
   81:         # ignore lemma lines
   82:         if l.lstrip().startswith('#lem:'):
   83:             return ""
   84:     
   85:     return formatAtfHtml(l)
   86: 
   87: 
   88: 
   89: def formatAtfFullLineNum(txt, nolemma=True):
   90:     """format full line numbers in ATF text"""
   91:     # surface codes
   92:     surfaces = {'@obverse':'obv',
   93:                 '@reverse':'rev',
   94:                 '@surface':'surface',
   95:                 '@edge':'edge',
   96:                 '@left':'left',
   97:                 '@right':'right',
   98:                 '@top':'top',
   99:                 '@bottom':'bottom',
  100:                 '@face':'face',
  101:                 '@seal':'seal'}
  102: 
  103:     if not txt:
  104:         return ""
  105:     
  106:     ret = []
  107:     surf = ""
  108:     col = ""
  109:     for line in txt.splitlines():
  110:         line = unicodify(line)
  111:         if line and line[0] == '@':
  112:             # surface or column
  113:             words = line.split(' ')
  114:             if words[0] in surfaces:
  115:                 surf = line.replace(words[0],surfaces[words[0]]).strip()
  116:             
  117:             elif words[0] == '@column':
  118:                 col = ' '.join(words[1:])
  119:             
  120:         elif line and line[0] in '123456789':
  121:             # ordinary line -> add line number
  122:             line = "%s:%s:%s"%(surf,col,line)
  123:             
  124:         ret.append(line)
  125:     
  126:     return '\n'.join(ret)
  127:             
  128:             
  129: def generateXMLReturn(hash):
  130:     """erzeugt das xml file als returnwert fuer uploadATFRPC"""
  131: 
  132:     ret="<return>"
  133:     
  134:     ret+="<errors>"
  135:     for error in hash['errors']:
  136:         ret+="""<error atf="%s">%s</error>"""%error
  137:     
  138:     ret+="</errors>"
  139:     
  140:     ret+="<changes>"
  141:     for changed in hash['changed']:
  142:         ret+="""<change atf="%s">%s</change>"""%changed
  143:     ret+="</changes>"
  144:     
  145:     ret+="<newPs>"
  146:     for new in hash['newPs']:
  147:         ret+="""<new atf="%s"/>"""%new
  148:     ret+="</newPs>"
  149:     
  150:     ret+="</return>"
  151:     return ret
  152:     
  153:     
  154: def unique(s):
  155:     """Return a list of the elements in s, but without duplicates.
  156: 
  157:     For example, unique([1,2,3,1,2,3]) is some permutation of [1,2,3],
  158:     unique("abcabc") some permutation of ["a", "b", "c"], and
  159:     unique(([1, 2], [2, 3], [1, 2])) some permutation of
  160:     [[2, 3], [1, 2]].
  161: 
  162:     For best speed, all sequence elements should be hashable.  Then
  163:     unique() will usually work in linear time.
  164: 
  165:     If not possible, the sequence elements should enjoy a total
  166:     ordering, and if list(s).sort() doesn't raise TypeError it's
  167:     assumed that they do enjoy a total ordering.  Then unique() will
  168:     usually work in O(N*log2(N)) time.
  169: 
  170:     If that's not possible either, the sequence elements must support
  171:     equality-testing.  Then unique() will usually work in quadratic
  172:     time.
  173:     (from the python cookbook)
  174:     """
  175: 
  176:     n = len(s)
  177:     if n == 0:
  178:         return []
  179: 
  180:     # Try using a dict first, as that's the fastest and will usually
  181:     # work.  If it doesn't work, it will usually fail quickly, so it
  182:     # usually doesn't cost much to *try* it.  It requires that all the
  183:     # sequence elements be hashable, and support equality comparison.
  184:     u = {}
  185:     try:
  186:         for x in s:
  187:             u[x] = 1
  188:     except TypeError:
  189:         del u  # move on to the next method
  190:     else:
  191:         return u.keys()
  192: 
  193:     # We can't hash all the elements.  Second fastest is to sort,
  194:     # which brings the equal elements together; then duplicates are
  195:     # easy to weed out in a single pass.
  196:     # NOTE:  Python's list.sort() was designed to be efficient in the
  197:     # presence of many duplicate elements.  This isn't true of all
  198:     # sort functions in all languages or libraries, so this approach
  199:     # is more effective in Python than it may be elsewhere.
  200:     try:
  201:         t = list(s)
  202:         t.sort()
  203:     except TypeError:
  204:         del t  # move on to the next method
  205:     else:
  206:         assert n > 0
  207:         last = t[0]
  208:         lasti = i = 1
  209:         while i < n:
  210:             if t[i] != last:
  211:                 t[lasti] = last = t[i]
  212:                 lasti += 1
  213:             i += 1
  214:         return t[:lasti]
  215: 
  216:     # Brute force is all that's left.
  217:     u = []
  218:     for x in s:
  219:         if x not in u:
  220:             u.append(x)
  221:     return u
  222: 
  223: 
  224: class BasketContent(SimpleItem):
  225:     """classe fuer den Inhalt eines Baskets"""
  226:    
  227:     def __init__(self,content=[]):
  228:         """content"""
  229:         self.contentList=content[0:]
  230:     
  231:     def getContent(self):
  232:         """get content"""
  233:         
  234:         return self.contentList
  235:     
  236:     def setContent(self,content):
  237:         self.contentList=content[0:]
  238:     
  239:     def numberOfItems(self):
  240:         """number"""
  241:         
  242:         return len(self.getContent())
  243:         
  244:     
class uploadATFfinallyThread(Thread):
    """Thread that adds the uploaded files (temporarily stored in a staging
    directory) to the archive.

    Usage as visible in this class: create the thread, call set() with the
    start values, then start it (or call the instance directly).  Progress
    text is collected in self.result, self.end is set to True at the end of
    a successful run().
    """
    
    def __init__(self):
        """init for uploadATFfinallyThread"""
        self.continueVar=True
        self.returnValue=None
        # becomes True at the very end of run()
        self.end=False
        Thread.__init__(self)
           
    def set(self,procedure,comment="",basketname='',unlock=None,SESSION=None,username=None,serverport="8080"):
        """Store the start values for the thread.

        The values are only stored here; they are handed on to
        uploadATFfinallyThread() by run().
        """
        self.procedure=procedure
        self.comment=comment
        self.basketname=basketname
        self.unlock=unlock
        self.SESSION=SESSION
        self.username=username
        self.serverport=serverport
       
        
    def __call__(self):
        """call of the thread (equals run), always returns True"""
        self.run()
        return True
    
    def getContext(self, app,serverport="8080"):
        """Wrap app in a request container with a minimal GET request for
        localhost:serverport and return the wrapped object."""
        
        resp = HTTPResponse(stdout=None)
        env = {
            'SERVER_NAME':'localhost',
            'SERVER_PORT':serverport,
            'REQUEST_METHOD':'GET'
            }
        req = HTTPRequest(None, env, resp)
        return app.__of__(RequestContainer(REQUEST = req))
          
        
    def run(self):
        """Open a ZODB connection, do the upload, commit and close.

        NOTE(review): if the upload raises, the connection is not closed
        and self.end stays False - confirm that callers can cope with that.
        """
        
        self.result=""
        #find context within ZODB
        from Zope import DB
        conn = DB.open()
        root = conn.root()
        app  = root['Application']
        ctx = self.getContext(app,serverport=self.serverport)

        #add the files
        self.uploadATFfinallyThread(ctx,self.procedure,comment=self.comment,basketname=self.basketname,unlock=self.unlock,SESSION=self.SESSION,username=self.username)
        #commit the transactions
        transaction.get().commit()
        conn.close()
        #set flag for end of this method
        self.end=True
        logging.info("ended")
        return True
    
    def __del__(self):
        """delete (does nothing)"""
        
        
    
    def getResult(self):
        """method for accessing result (the HTML progress text)"""
        
        return self.result
     
    def uploadATFfinallyThread(self,ctx,procedure,comment="",basketname='',unlock=None,RESPONSE=None,SESSION=None,username=None):
        """Upload the staged files.

        @param ctx: application context; ctx.cdliRoot is used as root folder
        @param procedure: "uploadchanged" (changed and new files from the
                          session), "uploadAll" (every file of the staging
                          directory not listed in SESSION['lockerrors']),
                          "noupload" (return at once); any other value
                          uploads no changed files
        @param comment: comment stored with the new versions
        @param basketname: if not empty, the staged files are put into the
                           basket with this name (created if missing)
        @param unlock: if true, the lock of the staged files is removed
        @param RESPONSE: if given, a redirect is sent at the end
        @param SESSION: mapping with the keys read below ('changed',
                        'newPs', 'tmpdir', 'lockerrors', 'errors')
        @param username: stored as author of the changes
        @return: True
        """
        #TODO: make this configurable, at the moment, rootFolder for cdli has to be cdliRoot
        ctx2=ctx.cdliRoot
   
        self.result+="<h2>Start processing</h2>"
        
        #shall I only upload the changed files?
        logging.debug("uploadATFfinally procedure: %s"%procedure)
        if procedure=="uploadchanged":
            changed=[x[0] for x in SESSION.get('changed',[])]
            uploadFns=changed+SESSION.get('newPs',[])
        
        #or all
        elif procedure=="uploadAll":
            uploadFns=[]
            for x in os.listdir(SESSION['tmpdir']):
                # NOTE(review): uploadATFThread in this file stores lockerrors
                # as (filename, lockedBy) tuples; if the session holds the same
                # shape, a plain filename never matches here - confirm
                if not x in SESSION['lockerrors']:
                    uploadFns.append(x)
                    
        #or maybe nothing
        elif procedure=="noupload":
            return True
        else:
            uploadFns=[]
            
        #do first the changed files    
        i=0
        for fn in uploadFns:
            logging.debug("uploadATFfinally uploadFn=%s"%fn)
            i+=1
            founds=ctx2.CDLICatalog.search({'title':fn})
            if len(founds)>0:
                SESSION['author']=str(username)
                # newest message first: new text is put in front of the result
                self.result="<p>Changing : %s"%fn+self.result
                logging.debug("uploadatffinallythread changing:%s"%fn+self.result)
                founds[0].getObject().manage_addCDLIFileObject('',comment,SESSION['author'],file=os.path.join(SESSION['tmpdir'],fn),from_tmp=True)
            # intermediate commit after every 200 files
            if i%200==0:
                transaction.get().commit()
                logging.debug("uploadatffinallythread changing: do commit")
        
        transaction.get().commit()
        logging.debug("uploadatffinallythread changing: last commit")

        #now add the new files        
        newPs=SESSION['newPs']
        if len(newPs)>0:
            tmpDir=SESSION['tmpdir']
            logging.debug("uploadatffinallythread adding start")
            self.result="<p>Adding files</p>"+self.result
            #TODO: make this configurable, at the moment base folder for the files has to be cdli_main
            ctx2.importFiles(comment=comment,author=str(username) ,folderName=tmpDir, files=newPs,ext=self)
            logging.debug("uploadatffinallythread adding finished")
        
        #unlock locked files?
        if unlock:
            logging.debug("uploadatffinallythread unlocking start")
            self.result="<p>Unlock files</p>"+self.result
            unlockFns=[]
            for x in os.listdir(SESSION['tmpdir']):
                    # NOTE(review): same question as for 'lockerrors' above,
                    # uploadATFThread stores errors as (filename, message) tuples
                    if not x in SESSION['errors']:
                        unlockFns.append(x)
                        
            logging.debug("unlocking have now what to unlock")
                        
            for fn in unlockFns:
                #logging.info("will unlock: %s"%fn)
                founds=ctx2.CDLICatalog.search({'title':fn})
                #logging.info("found it: %s"%repr(founds))
                if len(founds)>0:
                    #logging.info("unlock: %s"%founds[0].getObject().getId())
                    SESSION['author']=str(username)
                    # an empty lockedBy marks the file as not locked
                    founds[0].getObject().lockedBy=""

            logging.debug("uploadatffinallythread unlocking done")
                    
        #if a basketname is given, add files to the basket
        if not (basketname ==''):
            logging.debug("uploadatffinallythread add to basket %s"%basketname)
            self.result="<p>Add to basket</p>"+self.result
            basketId=ctx2.basketContainer.getBasketIdfromName(basketname)
            
            if not basketId: # create new basket
                logging.debug("uploadatffinallythread create basket %s"%basketname)
                self.result="<p>Create a new basket</p>"+self.result
                ob=ctx2.basketContainer.addBasket(basketname)
                basketId=ob.getId()
            basket=getattr(ctx2.basketContainer,str(basketId))
            # every file name of the staging directory goes into the basket
            ids=os.listdir(SESSION['tmpdir'])
            logging.debug("should add:"+repr(ids))
            basket.addObjects(ids,deleteOld=True,username=str(username))    
               
        logging.debug("uploadatffinallythread uploadfinally done")

        # NOTE(review): nothing in this class sets aq_parent; run() never
        # passes RESPONSE, so this branch is not reached from there - confirm
        if RESPONSE is not None:
            RESPONSE.redirect(self.aq_parent.absolute_url())
        
        return True
  413: 
  414: class tmpStore(SimpleItem):
  415:     """simple item"""
  416:     meta_type="cdli_upload"
  417:     
  418:     def __init__(self,id):
  419:         """init tmp"""
  420:         self.id=id
  421:         
class uploadATFThread(Thread):
    """Thread that checks the files of an uploaded ATF file before they are
    added to the archive.

    The uploaded file is split into single files in a fresh temporary
    directory, each file is checked and compared with the catalog, and the
    outcome is stored as returnValue on a tmpStore object in temp_folder.
    """
    
    def __init__(self):
        """initialise"""
        
        self.continueVar=True
        self.returnValue=None
        
        Thread.__init__(self)
        
        
    def set(self,upload,basketId,username,idTmp,serverport="8080"):
        """Store the start values for the thread.

        idTmp is the id under which run() creates the tmpStore object that
        receives the results.
        """
        self.result=""
        self.upload=upload
        self.basketId=basketId
        self.username=username
        self.serverport=serverport
        self.idTmp=idTmp
        
    def __call__(self):
        """call method, runs run() and returns True"""
        self.run()
        return True
    
    def getContext(self, app,serverport="8080"):
        """Wrap app in a request container with a minimal GET request for
        localhost:serverport and return the wrapped object."""
        resp = HTTPResponse(stdout=None)
        env = {
            'SERVER_NAME':'localhost',
            'SERVER_PORT':serverport,
            'REQUEST_METHOD':'GET'
            }
        req = HTTPRequest(None, env, resp)
        return app.__of__(RequestContainer(REQUEST = req))
        
    def run(self):
        # Opens a ZODB connection, creates the tmpStore object for the
        # results, runs the check, commits and closes the connection.
        # Returns the tmpStore object.
        idTmp=self.idTmp
        self.result=""
        #find context within ZODB
        from Zope import DB
        conn = DB.open()
        root = conn.root()
        app  = root['Application']
        ctx = self.getContext(app,serverport=self.serverport)
        logging.info("run intern")
        try:
            logging.info("created: %s"%idTmp)
            ctx.temp_folder._setObject(idTmp,tmpStore(idTmp))
        except:
            # any failure is only logged, the check below runs nevertheless
            logging.error("thread upload: %s %s"%sys.exc_info()[0:2])
            
        logging.info("call thread intern")
        self.uploadATFThread(ctx,self.upload,idTmp,self.basketId)
     
        #ctx.cdliRoot.cdli_main.tmpStore2[self.getName()[0:]]=self.returnValue
        
        
        transaction.get().commit()
       
        conn.close()
        
        # NOTE(review): the object is looked up after the connection has been
        # closed - confirm that this is safe
        return getattr(ctx.temp_folder,idTmp)
        
    def getResult(self):
        """method for accessing result (the HTML progress text)"""
        return self.result
    
    def uploadATFThread(self,ctx,upload,idTmp,basketId=0):
        """Split an uploaded ATF file and check the resulting files.

        @param ctx: application context; ctx.cdliRoot is used as root folder
        @param upload: the uploaded file, handed on to splitatf
        @param idTmp: id of the tmpStore object in ctx.temp_folder which
                      gets the results as attribute returnValue
        @param basketId: id of a basket; 0 means "use the active basket, if
                         there is one"

        Keys of the returnValue dictionary: errors, newPs, tmpdir, basketLen,
        numberOfFiles, basketNameFromId, basketNameFromFile, basketId, dir,
        changed, lockerrors.
        """
        #TODO: add comments
        #TODO: finish uploadATF
        
        stObj=getattr(ctx.temp_folder,idTmp)
        logging.info("start, upload thread")
        self.result="<html><body><h2>I got your file, start now to split it into single atf-files!</h2><p>"
    
        #make sure that id is a string and not an integer
        basketId=str(basketId)
        
        #TODO: make this configurable, at the moment, rootFolder for cdli has to be cdliRoot
        ctx2=ctx.cdliRoot
        
        #get temporary directory for staging the downloaded and split files
        dir=mkdtemp()
        
        
        changed=[] # changed files, (object, diffs)
        errors=[]  # files with errors, (filename, message)
        lockerrors=[]  # files locked by somebody else, (filename, lockedBy)

        newPs=[]   # new p files
        psNotInCatalog=[] # files not in the catalog
        
        #split the uploaded atf file
        basketNameFromFile, numberOfFiles=splitatf(upload,dir,ext=self)
        
        #find basketId if not set
        
        #get active basket
        if basketId == '0':
            basketObj=ctx2.basketContainer.getActiveBasket()
            if basketObj:
                basketId=basketObj.getId()
                
        #if there is no active basket and no basketid given, id is empty, else get basketname and length
        if basketId == '0':
            basketNameFromId=""
            basketLen=0
        else:
            basketNameFromId=getattr(ctx2.basketContainer,basketId).title
            basketLen=getattr(ctx2.basketContainer,basketId).getLastVersion().numberOfItems()
            
        logging.info("got the file, upload thread")
        # NOTE(review): the line break inside the "<p>" tag below ends up in
        # the generated HTML - probably not intended, confirm
        self.result+="""<html><body><h2>I got the files</h2><
                        p>I am computing the differences to the exisiting files</p>"""
                                   
        #start to check the files
        for fn in os.listdir(dir):
            
            self.result="<p>process:%s</p>"%fn+self.result
            
            # check if file is in the catalog
            #TODO: checkCatalog is not implemented yet
            # (psNotInCatalog is filled here but not used afterwards)
            if ctx2.cdli_main.checkCatalog(fn):
                psNotInCatalog.append(fn)
                
            #check if p-file already at the server  
            founds=ctx2.CDLICatalog.search({'title':fn})    
      
            #if not then add filename to the list of new files
            
            # NOTE(review): the file object is never closed explicitly
            data=file(os.path.join(dir,fn)).read()
            status,msg=checkFile(fn,data,dir)
            #status=True
            
            
            if not status: # error
                errors.append((fn,msg))
            
            else:
                if len(founds)==0:
                    newPs.append(fn)

                #if p file already at the server    
                for found in founds:
                    #analyse the differences to the actual file
                    obj=found.getObject()

                    # locked by somebody other than the uploading user?
                    if (not (str(obj.lockedBy))=='') and (not (str(obj.lockedBy)==str(self.username))):
                                lockerrors.append((fn,str(obj.lockedBy)))
                    else:
                
                        diffs=obj.diff(data)
                        if diffs[0]>0:
                            changed.append((obj,diffs)) # to be uploaded

        #ready, set the returnValues
        self.result+="<h3>Done</h3></body></html>"
        
        stObj.returnValue={}
        
        stObj.returnValue['errors']=errors
        
        stObj.returnValue['newPs']=newPs
        stObj.returnValue['tmpdir']=dir
        stObj.returnValue['basketLen']=basketLen
        stObj.returnValue['numberOfFiles']=numberOfFiles
        stObj.returnValue['basketNameFromId']=basketNameFromId
        stObj.returnValue['basketNameFromFile']=basketNameFromFile
        stObj.returnValue['basketId']=basketId
        stObj.returnValue['dir']=dir
        #stObj.returnValue['changed']=copy.copy(changed)
        # only the object id and the first element of the diff result are kept
        stObj.returnValue['changed']=[(x[0].getId(),x[1][0]) for x in changed]
        #stObj.returnValue['lockerrors']=[x[0].getId() for x in lockerrors]
        stObj.returnValue['lockerrors']=[x for x in lockerrors]
        self.returnValue=True
        #ctx2.cdli_main.setTemp('v_uploadATF_returnValue',True)
  601:     
  602:  
  603: class CDLIBasketContainer(OrderedFolder):
  604:     """contains the baskets"""
  605:     
  606: 
  607:     security=ClassSecurityInfo()
  608:     meta_type="CDLIBasketContainer"
  609:     
  610:     def getPNumbersOfBasket(self,basketName):
  611:         """get all pnumbers of a basket as a list, returns an empty list if basket not found
  612:         @param basketName: name of the basket
  613:         """
  614:         ret=[]
  615:         basketId=self.getBasketIdfromName(basketName)
  616:         if not basketId:
  617:             return []
  618:         
  619:         ob=getattr(self,basketId).getContent()
  620:         
  621:         ret=[x[0].split(".")[0] for x in ob]
  622:         
  623:         return ret
  624:     
  625:     security.declareProtected('manage','getBasketAsOneFile')       
  626:     def getBasketAsOneFile(self,basketName,current="no"):
  627:         """returns all files of the basket combined in one file
  628:         @param basketName: Name of the basket
  629:         @param current: (optional) if current is set to "yes" then the most current version of 
  630:                         all files are downloaded and not the versions of the files as stored in the basket
  631:         """
  632:         ret=""
  633:         basketId=self.getBasketIdfromName(basketName)
  634:         if not basketId:
  635:             return ""
  636:         
  637:         ob=getattr(self,basketId).getLastVersion()
  638:         for object in ob.getContent():
  639:             if current=="no": #version as they are in the basket
  640:                             ret+=str(object[0].getData())+"\n"
  641:             elif current=="yes":
  642:                             #search current object
  643:                             logging.debug("current: %s"%object[1].getId().split(".")[0])
  644:                             founds=self.CDLICatalog.search({'title':object[1].getId().split(".")[0]})
  645:                             if len(founds)>0:      
  646:                                 ret+=str(founds[0].getObject().getLastVersion().getData())+"\n"
  647:         return ret
  648:     
  649:     security.declareProtected('manage','upDateBaskets') 
  650:     def upDateBaskets(self):
  651:         """update content in to objects"""
  652:         
  653:         founds=self.ZopeFind(self,obj_metatypes=['CDLIBasketVersion'],search_sub=1)
  654: 
  655:         for found in founds:
  656:             found[1].updateBasket()
  657:         
  658:     security.declareProtected('manage','deleteBaskets')        
  659:     def deleteBaskets(self,ids=None):
  660:         """delete baskets, i.e. move them into trash folder"""
  661:         
  662:         
  663:         found=self.ZopeFind(self,obj_ids=['trash'])
  664:         
  665:         if len(found)<1:
  666:             manage_addFolder(self, 'trash')
  667:             trash=self._getOb('trash')
  668:         else:
  669:             trash=found[0][1]
  670:         
  671:         if type(ids) is not ListType:
  672:             ids=[ids]
  673:         cut=self.manage_cutObjects(ids)
  674:         trash.manage_pasteObjects(cut)
  675:         
  676:     security.declareProtected('manage','manageBaskets')       
  677:     def manageBaskets(self,submit,ids=None,basket1="",basket2="",joinBasket="",subtractBasket="",REQUEST=None,RESPONSE=None):
  678:         """manage baskets, delete or copy"""
  679:         if submit=="delete":
  680:             self.deleteBaskets(ids)
  681:         
  682:         elif submit=="join":
  683:             flag,msg=self.joinBasket(joinBasket, ids)
  684:             logging.info("joining %s %s"%(flag,msg))
  685:             
  686:         elif submit=="subtract":
  687:             logging.info("BBBb %s %s"%(basket1,basket2))
  688:             flag,msg=self.subtractBasket(subtractBasket, basket1,basket2)
  689:             logging.info("subtract %s %s"%(flag,msg))
  690:             
  691:         if RESPONSE:
  692:             RESPONSE.redirect(self.absolute_url())
  693:     
  694:     security.declareProtected('View','getBasketIdfromName')       
  695:     def getBasketIdfromName(self,basketname):
  696:         """get id from name"""
  697: 
  698:         for basket in self.ZopeFind(self,obj_metatypes=["CDLIBasket"]):
  699:             if basket[1].title==basketname:
  700:                 return basket[0]
  701:         else:
  702:             None
  703:     
  704:     security.declareProtected('manage','uploadBasket_html')        
  705:             
  706:     def uploadBasket_html(self,basketId='0'):
  707:         """upload an atf file, html form"""
  708:         
  709: 
  710:         basketId=str(basketId)
  711:         if not basketId=='0':
  712:             basketName=getattr(self.basketContainer,basketId).title
  713:         else:
  714:             basketName=""
  715:             
  716:         pt=PageTemplateFile(os.path.join(package_home(globals()),'zpt','uploadBasket_html.zpt')).__of__(self)
  717:         return pt(basketId=basketId,basketName=basketName)
  718:    
  719: 
  720:     security.declareProtected('manage','index_html')    
  721:     def index_html(self):
  722:         """stanadard ansicht"""
  723:         
  724: 
  725: 
  726:         ext=self.ZopeFind(self,obj_ids=["index.html"])
  727:         if ext:
  728:             return ext[0][1]()
  729:         
  730:         pt=PageTemplateFile(os.path.join(package_home(globals()),'zpt','BasketContainerMain')).__of__(self)
  731:         return pt()
  732:     
  733:     def getStorageFolderRoot(self):
  734:         """root des storage folders"""
  735:         return self.cdli_main
  736:     
  737:     def __init__(self,id,title):
  738:         """ init basket container"""
  739:         self.id=id
  740:         self.title=title
  741:      
  742:  
  743:     def getBasketsId(self):
  744:         """get all baskets als klartext"""
  745:         
  746:         ret=""
  747:         baskets=self.ZopeFind(self,obj_metatypes=['CDLIBasket'])
  748:         for basket in baskets:
  749:             com,user,time,values = basket[1].getContentIds()
  750:             ret+= "BASKET:"+com+"\t"+user+"\t"+time+"\n"
  751:             for x in values:
  752:                 ret+= x[0]+"\t"+x[1]+"\n"
  753:                 return ret
  754: 
  755:     def getBaskets(self,sortField='title'):
  756:         """get all baskets files"""
  757: 
  758:         def sortName(x,y):
  759:             return cmp(x[1].title.lower(),y[1].title.lower())
  760: 
  761:         def sortDate(x,y):
  762:             return cmp(y[1].getLastVersion().getTime(),x[1].getLastVersion().getTime())
  763: 
  764:         
  765:         def sortComment(x,y):
  766: 
  767:         
  768:             
  769:              try:
  770:                 xc=getattr(x[1],'comment','ZZZZZZZZZZZZZ').lower()
  771:              except:
  772:                 xc='ZZZZZZZZZZZZZ'.lower()
  773:              try:
  774:                 yc=getattr(y[1],'comment','ZZZZZZZZZZZZZ').lower()
  775:              except:
  776:                 yc='ZZZZZZZZZZZZZ'.lower()
  777:     
  778:     
  779:              if (xc=='') or (xc=='ZZZZZZZZZZZZZ'.lower()):
  780:                  
  781:                  try:
  782:                      xc=x[1].getLastVersion().getComment().lower()
  783:                  except:
  784:                      xc='ZZZZZZZZZZZZZ'.lower()
  785:                      
  786:              if (yc=='') or (yc=='ZZZZZZZZZZZZZ'.lower()):
  787:                  try:
  788:                      yc=y[1].getLastVersion().getComment().lower()
  789:                  except:
  790:                      yc='ZZZZZZZZZZZZZ'.lower()
  791:     
  792:              
  793:                  return cmp(xc,yc)
  794:         
  795:         def sortAuthor(x,y):
  796:             
  797:             return cmp(x[1].getLastVersion().getUser().lower(),y[1].getLastVersion().getUser().lower())
  798:         
  799:         baskets=self.ZopeFind(self,obj_metatypes=['CDLIBasket'])
  800:         
  801:         
  802:         if sortField=='title':
  803:             baskets.sort(sortName)
  804:         elif sortField=='date':
  805:             baskets.sort(sortDate)
  806:         elif sortField=='author':
  807:             baskets.sort(sortAuthor)
  808:         elif sortField=='comment':
  809:             baskets.sort(sortComment)
  810: 
  811:         return baskets
  812:     
  813:         
  814:     def subtractBasket(self,newBasket,basket1,basket2):
  815:         """subtract basket2 from basket1 
  816:         (i.e. newbasket will contain alle elements of basket1 which are not in basket2), 
  817:         if basket2 contains files which are not in basket1, then theses files fill be ignored
  818:                
  819:         @param newbasket: name of the new basket
  820:         @param basket1: basket where basket2 will be subtracted from
  821:         @param basket2: see above
  822:       
  823:         """
  824:         logging.info("CCCCC %s %s"%(basket1,basket2))
  825:    
  826:         try:
  827:             newB=self.addBasket(newBasket)
  828:         except:
  829:             return False, "cannot create the new basket"
  830:         
  831:         
  832: 
  833:        
  834:      
  835:         bas2= getattr(self,basket2)            
  836:         bas2content=bas2.getContent()
  837:         bas2ids=[x[0] for x in bas2content]
  838:         
  839:        
  840:             
  841:         bas1= getattr(self,basket1)   
  842:         bas1content=bas1.getContent()
  843:         
  844:         
  845:         newBasketContent={}
  846:         
  847:         for id,version in bas1content:
  848:             if not (id in bas2ids):
  849:                 newBasketContent[id]=version
  850:         
  851:         username=self.getActualUserName()
  852:         
  853:         logging.info("sbc %s"%newBasketContent)
  854:         newB.addObjectsWithVersion(newBasketContent,username=username,catalog=self.CDLICatalog)
  855:         
  856:         return True, ""
  857:     
  858:             
  859:     def joinBasket(self,newBasket,oldBaskets):
  860:         """join two baskets
  861:         @param newbasket: name of the new basket
  862:         @param oldbaskets: list of baskets to be joined
  863:         """
  864:         try:
  865:             newB=self.addBasket(newBasket)
  866:         except:
  867:             return False, "cannot create the new basket"
  868:         
  869:         newBasketContent={}
  870:         for ob in oldBaskets:
  871:             x= getattr(self,ob,None)
  872:             if x is None:
  873:                 return False, "cannot find basket: %s"%ob
  874:             
  875:             ids=x.getContent() # hole den Inhalt
  876:             
  877:             for id,version in ids:
  878:                 if newBasketContent.has_key(id): # p number gibt's schon
  879:                     newBasketContent[id]=max(newBasketContent[id],version) # speichere die groessere Versionsnumber
  880:                 else:
  881:                     newBasketContent[id]=version
  882:         username=self.getActualUserName()
  883:         
  884:         logging.info("nbc %s"%newBasketContent)
  885:         newB.addObjectsWithVersion(newBasketContent,username=username,catalog=self.CDLICatalog)
  886:         
  887:         return True, ""
  888:     
  889:     def getNewId(self):
  890:         """createIds"""
  891:         last=getattr(self,'last',0)
  892:         last +=1
  893:         while len(self.ZopeFind(self,obj_ids=[str(last)]))>0:
  894:             last+=1
  895:     
  896:         self.last=last
  897:         return last
  898:     
  899:     def setActiveBasket(self,basketId,REQUEST=None):
  900:         """store active basketId in a cookie"""
  901:         self.REQUEST.RESPONSE.setCookie("CDLIActiveBasket",basketId,path="/")
  902:         try:
  903:             qs=cgi.parse_qs(REQUEST['QUERY_STRING'])
  904:             del(qs['basketId'])
  905:         except:
  906:             qs={}
  907:         if REQUEST:
  908:             REQUEST.RESPONSE.redirect(REQUEST['URL1']+'?'+urllib.urlencode(qs))
  909:             
  910:     def getActiveBasket(self):
  911:         """get active basket from cookie"""
  912:         
  913:         id= self.REQUEST.cookies.get('CDLIActiveBasket',None)
  914:         if id:
  915:             obj=getattr(self,str(id),None)
  916:         else:
  917:             obj=None
  918:         return obj
  919:     
  920:     def getActualUserName(self):
  921:         """get name of the actualuser"""
  922:         return str(self.REQUEST['AUTHENTICATED_USER'])
  923:     
  924:     security.declareProtected('manage','addBasket') 
  925:     def addBasket(self,newBasketName):
  926:         """add a new basket"""
  927:         
  928:         ob=manage_addCDLIBasket(self,newBasketName)
  929:         return ob
  930: 
  931:     def storeInBasket(self,submit,ids=None,newBasketName=None,fromFileList=None,RESPONSE=None,REQUEST=None):
  932:         """store it"""
  933:         if not ids:
  934:             ids=self.REQUEST.SESSION['fileIds']
  935:            
  936:         if (type(ids) is not ListType) and (not isinstance(ids,Set)):
  937:             ids=[ids]
  938:         
  939:         if isinstance(ids,Set):
  940:             ids=list(ids)
  941:             
  942:         if (submit.lower()=="store in new basket") or (submit.lower()=="new basket"):
  943:             basketRet=self.addBasket(newBasketName)
  944:             self.setActiveBasket(basketRet.getId())
  945:             basket=getattr(self,basketRet.getId())
  946:         elif (submit.lower()=="store in active basket") or (submit.lower()=="active basket"):
  947:             basket=self.getActiveBasket()
  948:         
  949:         added=basket.addObjects(ids)
  950:         back=self.REQUEST['HTTP_REFERER'].split("?")[0]+"?basketName="+basket.title+"&numberOfObjects="+str(added)
  951:         
  952:         
  953:         if fromFileList:
  954: 
  955:             return self.cdli_main.findObjectsFromList(list=ids,basketName=basket.title,numberOfObjects=added)
  956:        
  957:         if RESPONSE:
  958:             
  959:             RESPONSE.redirect(back)
  960:             
  961:         return True
  962:     
  963: def manage_addCDLIBasketContainerForm(self):
  964:     """add the CDLIBasketContainer form"""
  965:     pt=PageTemplateFile(os.path.join(package_home(globals()),'zpt','addCDLIBasketContainer.zpt')).__of__(self)
  966:     return pt()
  967: 
  968: def manage_addCDLIBasketContainer(self,id,title,RESPONSE=None):
  969:     """add the basket"""
  970:     ob=CDLIBasketContainer(id,title)
  971:     
  972:     self._setObject(id, ob)
  973:     
  974:     if RESPONSE is not None:
  975:         RESPONSE.redirect('manage_main')
  976: 
  977: class CDLIBasket(Folder,CatalogAware):
  978:     """basket"""
  979:     
  980:     meta_type="CDLIBasket"
  981:     default_catalog="CDLIBasketCatalog"
  982:     
  983:     def searchInBasket(self,indexName,searchStr,regExp=False):
  984:         """searchInBasket"""
  985: 
  986:         lst=self.searchInLineIndexDocs(indexName,searchStr,uniq=True,regExp=regExp) #TODO: fix this
  987:         ret={}
  988:         
  989:         lv=self.getLastVersion()
  990: 
  991: 
  992:         for obj in lv.content.getContent():
  993:             id=obj[1].getId().split(".")[0]
  994:             if id in lst:
  995:         
  996:                 ret[id]=self.showWordInFile(id,searchStr,lineList=self.getLinesFromIndex(indexName,searchStr,id,regExp=regExp),regExp=regExp,indexName=indexName)
  997:         
  998:         
  999:         pt=PageTemplateFile(os.path.join(package_home(globals()),'zpt','searchResultsInBasket')).__of__(self)
 1000:         return pt(result=ret,indexName=indexName,regExp=regExp,word=searchStr)
 1001:         
 1002:          
 1003:  
 1004:         
 1005:     def searchInBasket_v1(self,searchStr):
 1006:         """search occurences of searchStr in files im basket"""
 1007:         ret=[]
 1008:         lv=self.getLastVersion()
 1009:         logging.info("searching")
 1010:         for obj in lv.content.getContent():
 1011:             txt=obj[0].getData()
 1012:             for x in txt.split("\n"):
 1013:                 logging.info("search %s"%x)
 1014:                 if re.match(searchStr,x):
 1015:                     ret.append(x)
 1016:         
 1017:         return "\n".join(ret)
 1018:                 
 1019:             
 1020:     def getFile(self,obj):
 1021:         return obj[1]
 1022:     
 1023:     def getFileLastVersion(self,obj):
 1024:         return obj[0]
 1025:     
 1026:     def getFileNamesInLastVersion(self):
 1027:         """get content of the last version as list"""
 1028:         
 1029:         return [x[1].getId() for x in self.getLastVersion().getContent()]
 1030:     
 1031: 
 1032:     def isActual(self,obj):
 1033:         """teste ob im basket die aktuelle version ist"""
 1034:         try:
 1035:             logging.debug("isActual:"+repr(obj))
 1036:             actualNo=obj[1].getLastVersion().getVersionNumber()
 1037:             storedNo=obj[0].getVersionNumber()
 1038:             
 1039:            
 1040:             actualNo=self.getFileObjectLastVersion(obj.getId()).getVersionNumber()
 1041:                 
 1042:             #if len(founds)>0 and founds[0].getObject().aq_parent.getId()==".trash":
 1043:             #    return False, -1
 1044:             
 1045:             if actualNo==storedNo:
 1046:                 return True , 0
 1047:             else:
 1048:                 return False, actualNo
 1049:         except:
 1050:             return False, -1
 1051:             
 1052:     def history(self):
 1053:         """history"""  
 1054: 
 1055:         ext=self.ZopeFind(self.aq_parent,obj_ids=["history_template.html"])
 1056:         if ext:
 1057:             return getattr(self,ext[0][1].getId())()
 1058:         
 1059:         pt=PageTemplateFile(os.path.join(package_home(globals()),'zpt','BasketHistory')).__of__(self)
 1060:         return pt()
 1061:     
 1062:     def getStorageFolderRoot(self):
 1063:         """root des storage folders"""
 1064:         return self.aq_parent.cdli_main
 1065:     
 1066:     def __init__(self,id,title,shortDescription="",comment=""):
 1067:         """init a CDLIBasket"""
 1068:         
 1069:         self.id=id
 1070:         self.title=title
 1071:         self.shortDescription=shortDescription
 1072:         self.comment=comment
 1073:  
 1074:     def getActualUserName(self):
 1075:         """get name of the actualuser"""
 1076:        
 1077:         return str(self.REQUEST['AUTHENTICATED_USER'])
 1078:   
 1079:            
 1080:     def getLastVersion(self):
 1081:         """hole letzte version"""
 1082: 
 1083:         ids=[]
 1084:         idsTmp= self.objectIds()
 1085:         for x in idsTmp:
 1086:             try:
 1087:                 ids.append(int(x))
 1088:             except:
 1089:                 pass
 1090:         ids.sort()
 1091:       
 1092:         if len(ids)==0:
 1093:             return None
 1094:         else:    
 1095:             ob=getattr(self,str(ids[-1]))
 1096: 
 1097:             
 1098:             return ob
 1099:    
 1100:     def getVersions(self):
 1101:         """get versions"""
 1102:         versions=self.ZopeFind(self,obj_metatypes=["CDLIBasketVersion"])
 1103:         return versions
 1104: 
 1105:    
 1106:     def updateObjects(self,ids,RESPONSE=None,REQUEST=None):
 1107:         """update ids, ids not in the basket the add"""
 1108:         if type(ids) is not ListType:
 1109:             ids=[ids]
 1110:        
 1111:         lastVersion=self.getLastVersion() 
 1112:         oldContent=lastVersion.content.getContent()
 1113:         newContent=[]
 1114:         
 1115:         #first copy the old
 1116:         for obj in oldContent:
 1117:             if obj[1].getId() not in ids:
 1118:                 newContent.append(obj)
 1119:         #now add the new
 1120:                
 1121:         for id in ids:
 1122:             founds=self.CDLICatalog.search({'title':id})
 1123: 
 1124:             for found in founds:
 1125:                 if found.getObject() not in oldContent:
 1126:                     #TODO: was passiert wenn, man eine Object dazufŸgt, das schon da ist aber eine neuere version
 1127:                     newContent.append((found.getObject().getLastVersion(),found.getObject()))
 1128:         
 1129: 
 1130:         content=newContent 
 1131:         user=self.getActualUserName()
 1132:         
 1133:         ob=manage_addCDLIBasketVersion(self,user,comment="",basketContent=newContent)
 1134:         
 1135:         obj=self._getOb(ob.getId())
 1136:         if RESPONSE:
 1137:            
 1138:             RESPONSE.redirect(obj.absolute_url())
 1139:         
 1140:         return obj
 1141:     
 1142:     def addObjectsWithVersion(self,ids,deleteOld=None,username=None,catalog=None):
 1143:         """generate a new version of the basket with objects added, 
 1144:         hier wird jedoch nicht die letzte Version jedes Files hinzugefuegt, s
 1145:         ondern ids is ein Tupel mit der Id (d.h. der p-number) und der Versionsnummer.
 1146:         """
 1147:         logging.info("add to basket (%s)"%(self.getId()))
 1148:         lastVersion=self.getLastVersion()
 1149:         
 1150:         if not catalog:
 1151:             catalog=self.CDLICatalog
 1152:             
 1153:         if lastVersion is None:
 1154:             oldContent=[]
 1155:         else:
 1156:             oldContent=lastVersion.content.getContent()
 1157: 
 1158:         if deleteOld:
 1159:             oldContent=[]
 1160: 
 1161:         newContent=[]
 1162:         added=0
 1163:        
 1164:         for id,version in ids.iteritems():
 1165:             logging.info("adding %s %s"%(id,version))
 1166:             id=id.split(".")[0] # title nur die pnumber ohne atf
 1167:            
 1168:             try:
 1169:                 founds=catalog.search({'title':id})
 1170:             except:
 1171:                 founds=[]
 1172:             logging.info(" found %s "%(founds))
 1173:             for found in founds:
 1174:                 if found.getObject() not in oldContent:
 1175:                  
 1176:                     #TODO: was passiert wenn, man eine Object dazufŸgt, das schon da ist aber eine neuere version
 1177:                     newContent.append((found.getObject().getVersions()[version-1][1],found.getObject()))
 1178:                     added+=1
 1179: 
 1180:         content=oldContent+newContent
 1181:         if not username:
 1182:             logging.error("XXXXXXXXXXX %s"%repr(self))
 1183:             user=self.getActualUserName()
 1184:         else:
 1185:             user = username
 1186:             
 1187:         ob=manage_addCDLIBasketVersion(self,user,comment="",basketContent=content)
 1188:         logging.info("add to basket (%s) done"%(self.getId()))
 1189:         return added
 1190:     
 1191:     
 1192:     def addObjects(self,ids,deleteOld=None,username=None):
 1193:         """generate a new version of the basket with objects added"""
 1194:         
 1195:         def swap(x):
 1196:             return (x[1],x[0])
 1197:             
 1198:         logging.info("add to basket (%s)"%(self.getId()))
 1199:         lastVersion=self.getLastVersion()
 1200:         
 1201:         if lastVersion is None:
 1202:             oldContent=[]
 1203:         else:
 1204:             oldContent=lastVersion.content.getContent()
 1205: 
 1206:         if deleteOld:
 1207:             oldContent=[]
 1208: 
 1209:         added=0
 1210: #        for id in ids:
 1211: #            logging.debug("adding:"+id)
 1212: #            try:
 1213: #                founds=self.CDLICatalog.search({'title':id})
 1214: #            except:
 1215: #                founds=[]
 1216: #           
 1217: #            for found in founds:
 1218: #                if found.getObject() not in oldContent:
 1219: #                    #TODO: was passiert wenn, man eine Object dazufŸgt, das schon da ist aber eine neuere version
 1220: #                    newContent.append((found.getObject().getLastVersion(),found.getObject()))
 1221: #                    added+=1
 1222: 
 1223:         hash = md5.new(repr(makelist(ids))).hexdigest() # erzeuge hash als identification
 1224:         #logging.debug("JJJJJJJ:"+repr(self.makelist(ids)))
 1225:         logging.debug("JJJJJJJ:"+repr(hash))
 1226:                       
 1227:         if hasattr(self.cdliRoot,'v_tmpStore') and self.cdliRoot.v_tmpStore.has_key(hash): 
 1228:             logging.debug("from store!")
 1229:             newContent=Set(map(swap,self.cdliRoot.v_tmpStore[hash]))
 1230:          
 1231:         else:
 1232:             logging.debug("not from store!")
 1233:             newContent=Set([(self.getFileObjectLastVersion(x),self.getFileObject(x)) for x in ids])
 1234:         
 1235:         
 1236:         content=Set(oldContent).union(newContent)
 1237:         added = len(content)-len(oldContent)
 1238:         if not username:
 1239:             user=self.getActualUserName()
 1240:         else:
 1241:             user = username
 1242:         
 1243:         #logging.debug("content:"+repr(list(content)))
 1244:         ob=manage_addCDLIBasketVersion(self,user,comment="",basketContent=list(content))
 1245:         logging.info("add to basket (%s) done"%(self.getId()))
 1246:         return added
 1247:     
 1248:     
 1249:                 
 1250:     def getContent(self):
 1251:         """print content"""
 1252:         ret=[]
 1253:         
 1254:         lv=self.getLastVersion()
 1255:         for obj in lv.content.getContent():
 1256:             logging.info("XXXXXXXXXX %s"%repr(obj))
 1257:             ret.append((obj[1].getId(),obj[0].versionNumber))
 1258:             
 1259:         return ret
 1260:         
 1261:     def getContentIds(self):
 1262:         """print basket content"""
 1263:         ret=[]
 1264:         lv=self.getLastVersion()
 1265:         for obj in lv.content.getContent():
 1266:             ret.append((obj[0].getId(),obj[1].getId()))
 1267:         
 1268:         
 1269:         return lv.getComment(),lv.getUser(),lv.getTime(),ret
 1270: 
 1271:     def changeBasket(self,ids,submit,RESPONSE=None,REQUEST=None):
 1272:         """change a basket"""
 1273:         if submit=="update":
 1274:             return self.updateObjects(ids,RESPONSE=RESPONSE,REQUEST=REQUEST)
 1275:         elif submit=="delete":
 1276:             return self.deleteObjects(ids,RESPONSE=RESPONSE,REQUEST=REQUEST)
 1277:             
 1278:     def deleteObjects(self,ids,RESPONSE=None,REQUEST=None):
 1279:         """delete objects"""
 1280:         
 1281:         if type(ids) is not ListType:
 1282:             ids=[ids]
 1283:        
 1284:         lastVersion=self.getLastVersion() 
 1285:         oldContent=lastVersion.content.getContent()
 1286:         newContent=[]
 1287:         for obj in oldContent:
 1288:             if obj[1].getId() not in ids:
 1289:                 newContent.append(obj)
 1290:         
 1291:                 
 1292:         user=self.getActualUserName()
 1293:         
 1294:         ob=manage_addCDLIBasketVersion(self,user,comment="",basketContent=newContent)
 1295:         
 1296:         if RESPONSE:
 1297:             obj=self._getOb(ob.getId())
 1298:             RESPONSE.redirect(obj.absolute_url())
 1299:         
 1300: def manage_addCDLIBasketForm(self):
 1301:     """add the CDLIBasketContainer form"""
 1302:     pt=PageTemplateFile(os.path.join(package_home(globals()),'zpt','addCDLIBasket.zpt')).__of__(self)
 1303:     return pt()
 1304: 
 1305: def manage_addCDLIBasket(self,title,shortDescription="",comment="",RESPONSE=None):
 1306:     """add the basket"""
 1307:     
 1308:     id=str(self.getNewId())
 1309:     
 1310:     ob=CDLIBasket(id,title,shortDescription,comment)
 1311:     
 1312:     self._setObject(id, ob)
 1313:     
 1314:     if RESPONSE is not None:
 1315:         RESPONSE.redirect('manage_main')
 1316:     else:
 1317:         return ob
 1318: 
 1319: class CDLIBasketVersion(Implicit,Persistent,Folder):
 1320:     """version of a basket"""
 1321:     
 1322:     meta_type="CDLIBasketVersion"
 1323:     security=ClassSecurityInfo()
 1324:     
 1325:     def updateBasket(self):
 1326:         """update"""
 1327:         try:
 1328:             self._setObject('content',BasketContent(self.basketContent))
 1329:         except:
 1330:             try:
 1331:                 if len(self.basketContent)>0:
 1332:                     self.content.setContent(self.basketContent)
 1333:             except:
 1334:                 print "error",self.getId(),self.aq_parent.getId()
 1335:         self.basketContent=[]
 1336: 
 1337:         
 1338:     def containsNonActualFiles(self):
 1339:         """returns True if basket contains one or more non current files"""
 1340:         
 1341:         objs=self.getContent()
 1342:         for obj in objs:
 1343:             if not self.isActual(obj)[0]:
 1344:                 return True
 1345:         return False
 1346:     
 1347:     def downloadListOfPnumbers(self):
 1348:         """download pnumbers of the basket as list"""
 1349:         
 1350:         basket_name=self.aq_parent.title
 1351:         
 1352:         ids=self.getContent() # get the list of objects
 1353:         logging.error(ids)
 1354:         ret="\n".join([x[1].getId().split(".")[0] for x in ids])
 1355:         
 1356:         self.REQUEST.RESPONSE.setHeader("Content-Disposition","""attachement; filename="%s.txt" """%basket_name)
 1357:         self.REQUEST.RESPONSE.setHeader("Content-Type","application/octet-stream")
 1358:         length=len(ret)
 1359:         self.REQUEST.RESPONSE.setHeader("Content-Length",length)
 1360:         self.REQUEST.RESPONSE.write(ret)    
 1361:         
 1362:     security.declareProtected('manage','downloadObjectsAsOneFile')
 1363:     def downloadObjectsAsOneFile(self,lock=None,procedure=None,REQUEST=None,check="yes",current="no"):
 1364:         """download all selected files in one file"""
 1365:         logging.debug("doasof")
 1366:         if self.temp_folder.downloadCounterBaskets > 10000:
 1367:             return """I am sorry, currently the server has to many requests for downloads, please come back later!"""
 1368: 
 1369: 
 1370:         if (check=="yes") and self.containsNonActualFiles():
 1371:             pt=PageTemplateFile(os.path.join(package_home(globals()),'zpt','downloadObjectAsOneFile_check.zpt')).__of__(self)
 1372:             
 1373:             return pt(lock=lock)
 1374:             
 1375:         else:
 1376:             
 1377:             return self.downloadObjectsAsOneFileFinally(lock=lock,procedure=procedure,REQUEST=REQUEST,current="no")
 1378:         
    def downloadObjectsAsOneFileFinally(self,lock=None,procedure=None,REQUEST=None,current="no",repeat=None):
        """Do the download of the basket as one file.

        The method is called several times for one download:
        without repeat it checks the locks (if lock is set), starts a
        DownloadBasketFinallyThread and returns a wait page that is given
        the URL of this method and the name of the thread; with repeat (the
        name of the thread) it returns the wait page again as long as the
        thread is known and its end attribute is false, and otherwise
        writes the files listed in basketContainer.resultHash[repeat] to
        the response.

        @param lock: if true, the user has to be logged in and files locked
            by other users are reported (page lockedObjects.zpt) unless
            procedure is given
        @param procedure: handed to the thread; set to "downloadAll" if
            lock is true and no procedure was given
        @param REQUEST: handed to the thread
        @param current: handed to the thread
        @param repeat: name of an already started download thread
        """
 
        logging.debug("HIHHHH")
        ret=""
        lockedObjects={}

           
        logging.debug("lock:"+repr(lock))
        if lock:
            logging.debug("------lock:"+repr(lock))
            if str(self.REQUEST['AUTHENTICATED_USER'])=='Anonymous User':
                
                return "please login first"

            #check if a locked object exist in the basket.
            lockedObjects={}
            for object in self.content.getContent():

                # collect the files that are locked by somebody else
                if (not str(object[1].lockedBy)=="") and (not (str(object[1].lockedBy)==str(self.REQUEST['AUTHENTICATED_USER']))):
                    lockedObjects[object[1].title]=repr(object[1].lockedBy)
                   
                    
            keys=lockedObjects.keys()
            
            
            if len(keys)>0 and (not procedure):
                # the locked files are handed over in the session
                self.REQUEST.SESSION['lockedObjects']=lockedObjects
                pt=PageTemplateFile(os.path.join(package_home(globals()),'zpt','lockedObjects.zpt')).__of__(self)
                
               
                return pt()
         
            elif not procedure: #no files are locked, so download all of them
                procedure="downloadAll" 
        
        
       
       
        threadName=repeat
        if not threadName or threadName=="":
            # first call: start a new download thread
            thread=DownloadBasketFinallyThread()
            threadName=thread.getName()[0:]

            # the running threads are kept in a _v_ attribute of this object
            if (not hasattr(self,'_v_downloadBasket')):
                                self._v_downloadBasket={}


            self._v_downloadBasket[threadName]=thread
            logging.debug("dwonloadfinally:"+repr(self))
            # NOTE(review): these ids are taken from the parent and its parent,
            # while the file name below uses self.getId() as version - confirm
            # in which context (self) this method is expected to run
            basketID=self.aq_parent.aq_parent.getId()
            versionNumber=self.aq_parent.getId()
            self._v_downloadBasket[threadName].set(lock,procedure,REQUEST,current,basketID,versionNumber)

            self._v_downloadBasket[threadName].start()

            
            
            # a 'wait_template' found via the parent replaces the built-in wait page
            wait_template=self.aq_parent.ZopeFind(self.aq_parent,obj_ids=['wait_template'])

            if wait_template:
                return wait_template[0][1]()
            pt=PageTemplateFile(os.path.join(package_home(globals()),'zpt','downloadBasketWait.zpt')).__of__(self)

            return pt(txt=self.absolute_url()+'/downloadObjectsAsOneFileFinally',threadName=threadName)
            #_v_xmltrans.run()
        
        else:
            #recover thread, if lost
            if not hasattr(self,'_v_downloadBasket'):
               self._v_downloadBasket={}
            if not self._v_downloadBasket.get(threadName,None):
                 # look the thread up by name among the running threads
                 for thread in threading.enumerate():
                         if threadName == thread.getName():
                                       self._v_downloadBasket[threadName]=thread
                                       
            # thread is known and its end attribute is not set: show the wait page again
            if self._v_downloadBasket.get(threadName,None) and (self._v_downloadBasket[threadName] is not None) and (not self._v_downloadBasket[threadName].end) :

                wait_template=self.aq_parent.ZopeFind(self.aq_parent,obj_ids=['wait_template'])
                if wait_template:
                        return wait_template[0][1]()
                
                pt=PageTemplateFile(os.path.join(package_home(globals()),'zpt','downloadBasketWait.zpt')).__of__(self)
                return pt(txt=self.absolute_url()+'/downloadObjectsAsOneFileFinally',threadName=threadName)
            else:
              
             
              logging.debug("FINISHED")
              if not self._v_downloadBasket.get(threadName,None):
                 for thread in threading.enumerate():
                         if threadName == thread.getName():
                                       self._v_downloadBasket[threadName]=thread
                                       
              #files = self._v_downloadBasket[threadName].result
              # names of the files to send, stored under the name of the thread
              # NOTE(review): raises KeyError if there is no entry for threadName
              files=self.basketContainer.resultHash[threadName]
             # fh=file("/var/tmp/test")
              #ret =fh.read()
         
              if (not isinstance(self.aq_parent,CDLIBasket)):
                  basket_name=self.aq_parent.aq_parent.title+"_V"+self.getId()
              else:
                  basket_name=self.aq_parent.title+"_V"+self.getId()
        
        
    
                  #write basketname to header of atf file
              

              # NOTE(review): "attachement" is misspelled, the disposition type is "attachment"
              self.REQUEST.RESPONSE.setHeader("Content-Disposition","""attachement; filename="%s.atf" """%basket_name)
              self.REQUEST.RESPONSE.setHeader("Content-Type","application/octet-stream")
              #length=len(ret)
              #self.REQUEST.RESPONSE.setHeader("Content-Length",length)
              ret="#basket: %s\n"%basket_name
              self.REQUEST.RESPONSE.write(ret)    
              for fileName in files:
                  # NOTE(review): the opened file is never closed explicitly
                  self.REQUEST.RESPONSE.write(file(fileName).read())
 
              # the result has been delivered, forget it
              del self.basketContainer.resultHash[threadName]
 1497:              
 1498:     def numberOfItems(self):
 1499:         """return anzahl der elemente im basket"""
 1500:         return self.content.numberOfItems()
 1501:     
 1502:     def getTime(self):
 1503:         """getTime"""
 1504:         #return self.bobobase_modification_time().ISO()
 1505:       
 1506:         if hasattr(self,'time'):
 1507:             return time.strftime("%Y-%m-%d %H:%M:%S",self.time)
 1508:         elif hasattr(self,'timefixed'):
 1509:             return self.timefixed
 1510:         else:
 1511:             setattr(self,'timefixed',self.bobobase_modification_time().ISO())
 1512:             return self.bobobase_modification_time().ISO()
 1513:     
 1514:     def getContent(self):
 1515:         """get Basket Content"""
 1516:         return self.content.getContent()
 1517: 
 1518:     
 1519:     def __init__(self,id,user,comment="",basketContent=[]):
 1520:         """ init a basket version"""
 1521:         self.id=id
 1522:         self.comment=comment
 1523:         self._setObject('content',BasketContent(basketContent))
 1524:         #self.basketContent=basketContent[0:]a
 1525:         self.user=user
 1526:         self.time=time.localtime()
 1527:         
 1528:     def getUser(self):
 1529:         """get user"""
 1530:         return self.user
 1531:     
 1532:     def getComment(self):
 1533:         """get Comment"""
 1534:         return self.comment
 1535:  
 1536:     security.declareProtected('manage','index_html')
 1537:     def index_html(self):
 1538:             """view the basket"""
 1539: 
 1540:             if self.REQUEST.get('change',False):
 1541:                     ob=self.aq_parent.updateObjects(self.REQUEST['change'])
 1542:                    
 1543:                     self.REQUEST.RESPONSE.redirect(ob.absolute_url())#go to new basket, because changing generates a new basket
 1544:                                         
 1545:             pt=PageTemplateFile(os.path.join(package_home(globals()),'zpt','BasketVersionMain.zpt')).__of__(self)
 1546:             return pt()
 1547:      
 1548:     def getObjUrl(self,result):
 1549:         """getUrl of the version of the object"""
 1550:         objId=result[1].getTitle()
 1551:         founds=self.CDLICatalog.search({'title':objId})
 1552:         if len(founds)>0:
 1553:              return founds[0].getObject().getLastVersion().absolute_url()
 1554:          
 1555:         else: #assume version number
 1556:             splitted=objId.split("_")
 1557:             founds=self.CDLICatalog.search({'title':splitted[1]})        
 1558:             return founds[0].getObject().getLastVersion().absolute_url()+'/'+objId
 1559:    
 1560: def manage_addCDLIBasketVersion(self,user,comment="",basketContent=[],RESPONSE=None):
 1561:     """add a version"""
 1562:     
 1563:     #check for already existing versions
 1564:  
 1565:     lastVersion=self.getLastVersion()
 1566:     if lastVersion is None:
 1567:         newId=str(1)
 1568:     else:
 1569:         newId=str(int(lastVersion.getId())+1)
 1570:     
 1571:     ob=CDLIBasketVersion(newId,user,comment,basketContent)
 1572:     
 1573:     self._setObject(newId, ob)
 1574:     
 1575:     if RESPONSE is not None:
 1576:         RESPONSE.redirect('manage_main')
 1577:     else:
 1578:         return ob
 1579:     
 1580: class CDLIFileObject(CatalogAware,extVersionedFileObject):
 1581:     """CDLI file object"""
 1582:     
 1583:     meta_type="CDLI File Object"
 1584:     default_catalog='CDLIObjectsCatalog'
 1585:     
 1586:     security=ClassSecurityInfo()
 1587:     
 1588:     security.declareProtected('manage','index_html')
 1589: 
 1590:     security.declarePublic('view')
 1591:     view = PageTemplateFile('zpt/viewCDLIFile.zpt', globals())
 1592: 
 1593:     security.declarePublic('editATF')
 1594:     editATF = PageTemplateFile('zpt/editATFFile.zpt', globals())
 1595: 
 1596:     def PrincipiaSearchSource(self):
 1597:            """Return cataloguable key for ourselves."""
 1598:            return str(self)
 1599:        
 1600:     def makeThisVersionCurrent_html(self):
 1601:         """form for mthis version current"""
 1602:         
 1603:         pt=PageTemplateFile(os.path.join(package_home(globals()),'zpt','makeThisVersionCurrent.zpt')).__of__(self)
 1604:         return pt()                 
 1605: 
 1606:     security.declarePublic('makeThisVersionCurrent')
 1607:     def makeThisVersionCurrent(self,comment,author,RESPONSE=None):
 1608:         """copy this version to current"""
 1609:         parent=self.aq_parent
 1610:         parent.manage_addVersionedFileObject(id=None,vC=comment,author=author,file=self.getData(),RESPONSE=RESPONSE)
 1611:         #newversion=parent.manage_addCDLIFileObject('',comment,author)
 1612:         #newversion.manage_upload(self.getData())
 1613:                                         
 1614:         #if RESPONSE is not None:
 1615:         #    RESPONSE.redirect(self.aq_parent.absolute_url()+'/history')
 1616: 
 1617:         return True
 1618:     
 1619:     def getFormattedData(self):
 1620:         """fromat text"""
 1621:         data=self.getData()
 1622: #        return re.sub("\s\#lem"," #lem",data) #remove return vor #lem
 1623:         return re.sub("#lem","       #lem",data) #remove return vor #lem
 1624:         
 1625:     
 1626:     security.declarePublic('getPNumber')
 1627:     def getPNumber(self):
 1628:         """get the pnumber"""
 1629:         try:
 1630:                 txt=re.match("&[Pp](\d*)\s*=([^\r\n]*)",self.getData()[0:])
 1631:         except:
 1632:                 txt=self.getData()[0:]
 1633:                 
 1634:                 return "ERROR"
 1635:         try:
 1636:             return "P"+txt.group(1)
 1637:         except:
 1638:             return "ERROR"
 1639: 
 1640:     security.declarePublic('getDesignation')
 1641:     def getDesignation(self):
 1642:         """get the designation out of the file"""
 1643:         try:
 1644:                 txt=re.match("&[Pp](\d*)\s*=([^\r\n]*)",self.getData()[0:])
 1645:         except:
 1646:                 txt=self.getData()[0:]
 1647:                 
 1648:                 return "ERROR"
 1649:         try:
 1650:             return txt.group(2)
 1651:         except:
 1652:             return "ERROR"
 1653: 
 1654:         
# Add form for CDLI file objects: the 'dtml/fileAdd' template with both
# Kind and kind set to 'CDLIFileObject' and version preset to '1'.
manage_addCDLIFileObjectForm=DTMLFile('dtml/fileAdd', globals(),Kind='CDLIFileObject',kind='CDLIFileObject', version='1')
 1656: 
 1657: def manage_addCDLIFileObject(self,id,vC='',author='', file='',title='',versionNumber=0,
 1658:                              precondition='', content_type='',
 1659:                              from_tmp=False,REQUEST=None):
 1660:     """Add a new File object.
 1661:     Creates a new File object 'id' with the contents of 'file'"""
 1662:  
 1663:     id=str(id)
 1664:     title=str(title)
 1665:     content_type=str(content_type)
 1666:     precondition=str(precondition)
 1667:     
 1668:     id, title = cookId(id, title, file)
 1669: 
 1670:     self=self.this()
 1671: 
 1672:     # First, we create the file without data:
 1673:     self._setObject(id, CDLIFileObject(id,title,versionNumber=versionNumber,versionComment=vC,time=time.localtime(),author=author))
 1674:     fob = self._getOb(id)
 1675:     
 1676:     # Now we "upload" the data.  By doing this in two steps, we
 1677:     # can use a database trick to make the upload more efficient.
 1678: 
 1679:     if file and not from_tmp:
 1680:         fob.manage_upload(file)
 1681:     elif file and from_tmp:
 1682:         fob.manage_file_upload(file) # manage_upload_from_tmp doesn't exist in ExtFile2
 1683:     #    fob.manage_upload_from_tmp(file) # manage_upload_from_tmp doesn't exist in ExtFile2
 1684:     if content_type:
 1685:         fob.content_type=content_type
 1686: 
 1687:     #logging.debug("manage_add: lastversion=%s"%self.getData())
 1688:     logging.debug("reindex1: %s in %s"%(repr(self),repr(self.default_catalog)))
 1689:     self.reindex_object()
 1690:     #logging.debug("manage_add: fob_data=%s"%fob.getData())
 1691:     logging.debug("reindex2: %s in %s"%(repr(fob), repr(fob.default_catalog)))
 1692:     fob.index_object()
 1693: 
 1694:     self.CDLIRoot.updateOrAddToFileBTree(ob)
 1695:     if REQUEST is not None:
 1696:         REQUEST['RESPONSE'].redirect(self.absolute_url()+'/manage_main')
 1697:     
 1698: 
 1699: class CDLIFile(extVersionedFile,CatalogAware):
 1700:     """CDLI file"""
 1701:     
 1702:     security=ClassSecurityInfo()
 1703:     meta_type="CDLI file"
 1704:     content_meta_type = ["CDLI File Object"]
 1705:     
 1706:     default_catalog='CDLICatalog'
 1707:     
 1708:     security.declareProtected('manage','index_html')
 1709:     
 1710:     def getLastVersionData(self):
 1711:         """get last version data"""
 1712:         return self.getData()
 1713: 
 1714:     def getLastVersionFormattedData(self):
 1715:         """get last version data"""
 1716:         return self.getContentObject().getFormattedData()
 1717: 
 1718:     def getTextId(self):
 1719:         """returns P-number of text"""
 1720:         # assuming that its the beginning of the title
 1721:         return self.title[:7]
 1722: 
 1723:     #security.declarePublic('history')
 1724:     def history(self):
 1725:         """history"""  
 1726: 
 1727:         ext=self.ZopeFind(self.aq_parent,obj_ids=["history_template.html"])
 1728:         if ext:
 1729:             return getattr(self,ext[0][1].getId())()
 1730:         
 1731:         pt=PageTemplateFile(os.path.join(package_home(globals()),'zpt','versionHistory')).__of__(self)
 1732:         return pt()
 1733: 
 1734: 
 1735:     def getBasketFromId(self,basketid, context=None):
 1736:         """get basket from id"""
 1737: 
 1738:         if not context:
 1739:             context=self
 1740:             
 1741:         for basket in self.ZopeFind(context,obj_metatypes=["CDLIBasket"]):
 1742:             if basket[0]==basketid:
 1743:                 return basket[1]
 1744:         else:
 1745:             None
 1746: 
 1747:  
 1748:     def isContainedInBaskets(self,context=None):
 1749:         """check is this file is part of any basket
 1750:         @param context: (optional) necessessary if CDLIBasketCatalog is not an (inherited) attribute of self, context.CDLIBasketCatalog
 1751:                         has to exist.
 1752:         """
 1753: 
 1754:         if not context:
 1755:             context=self
 1756:         
 1757:         ret=[]
 1758:         for x in context.CDLIBasketCatalog.search({'getFileNamesInLastVersion':self.getId()}):
 1759:             #if the basket x is deleted it seemes to be that x is sometimes still in the Catalog, why?
 1760:             try:
 1761:                 ret.append(x.getObject())
 1762:             except:
 1763:                 pass
 1764:         return ret
 1765:         #return [x.getObject() for x in context.CDLIBasketCatalog.search({'getFileNamesInLastVersion':self.getId()})]
 1766:         
 1767:         
 1768:     def _newContentObject(self, id, title='', versionNumber=0, versionComment=None, time=None, author=None):
 1769:         """factory for content objects. to be overridden in derived classes."""
 1770:         logging.debug("_newContentObject(CDLI)")
 1771:         return CDLIFileObject(id,title,versionNumber=versionNumber,versionComment=versionComment,time=time,author=author)
 1772: 
 1773: 
 1774:     def addCDLIFileObjectForm(self):
 1775:         """add a new version"""
 1776:         
 1777:         if str(self.REQUEST['AUTHENTICATED_USER']) in ["Anonymous User"]:
 1778:             return "please login first"
 1779:         if (self.lockedBy==self.REQUEST['AUTHENTICATED_USER']) or (self.lockedBy==''):
 1780:             out=DTMLFile('dtml/fileAdd', globals(),Kind='CDLIFileObject',kind='CDLIFileObject',version=self.getVersion()).__of__(self)
 1781:             return out()
 1782:         else:
 1783:             return "Sorry file is locked by somebody else"
 1784:         
 1785:     def manage_addCDLIFileObject(self,id,vC,author,
 1786:                                  file='',title='',
 1787:                                  precondition='', 
 1788:                                  content_type='',
 1789:                                  changeName='no',newName='', 
 1790:                                  come_from=None,
 1791:                                  from_tmp=False,RESPONSE=None):
 1792:         """add"""
 1793:       
 1794:         try: #TODO: der ganze vC unsinn muss ueberarbeitet werden
 1795:             vC=self.REQUEST['vC']
 1796:         except:
 1797:             pass
 1798:         
 1799:         ob = self.addContentObject(id, vC, author, file, title, changeName=changeName, newName=newName, from_tmp=from_tmp,
 1800:                                    precondition=precondition, content_type=content_type)
 1801: 
 1802:         try:
 1803:             #FIXME: wozu ist das gut?
 1804:             self.REQUEST.SESSION['objID_parent']=self.getId()
 1805:         except:
 1806:             pass
 1807:   
 1808:         #self.cdliRoot.updateOrAddToFileBTree(self)# now update the object in the cache
 1809:       
 1810:         
 1811:         if RESPONSE:
 1812:             if ob.getSize()==0:
 1813:                 self.REQUEST.SESSION['objID']=ob.getId()
 1814:                 pt=PageTemplateFile(os.path.join(package_home(globals()),'zpt','errorUploadFile')).__of__(self)
 1815:                 return pt()
 1816:             else:
 1817:                 if come_from and (come_from!=""):
 1818:                     RESPONSE.redirect(come_from+"?change="+self.getId())
 1819:                 else:
 1820:                     RESPONSE.redirect(self.REQUEST['URL2']+'?uploaded=%s'%self.title)
 1821:         else:
 1822:             return ob
 1823:         
 1824:         
 1825: def manage_addCDLIFileForm(self):
 1826:     """interface for adding the OSAS_root"""
 1827:     pt=PageTemplateFile(os.path.join(package_home(globals()),'zpt','addCDLIFile.zpt')).__of__(self)
 1828:     return pt()
 1829: 
 1830: def manage_addCDLIFile(self,id,title,lockedBy, author=None, RESPONSE=None):
 1831:     """add the OSAS_root"""
 1832:     newObj=CDLIFile(id,title,lockedBy,author)
 1833:                                         
 1834:     tryToggle=True
 1835:     tryCount=0
 1836: 
 1837:     self._setObject(id,newObj)                  
 1838:     getattr(self,id).reindex_object()
 1839:         
 1840:     if RESPONSE is not None:
 1841:         RESPONSE.redirect('manage_main')
 1842: 
 1843: 
 1844: def checkUTF8(data):
 1845:     """check utf 8"""
 1846:     try:
 1847:         data.encode('utf-8')
 1848:         return True
 1849:     except:
 1850:         return False
 1851:     
 1852: 
 1853: def checkFile(filename,data,folder):
 1854:     """check the files"""
 1855:     # first check the file name
 1856:     fn=filename.split(".") # no extension
 1857: 
 1858:     if not fn[0][0]=="P":
 1859:         return False,"P missing in the filename"
 1860:     elif len(fn[0])!=7:
 1861:         return False,"P number has not the right length 6"
 1862:     elif not checkUTF8(data):
 1863:         return False,"not utf-8"
 1864:     else:
 1865:         return True,""
 1866:     
 1867:     
 1868: def splitatf(fh,dir=None,ext=None):
 1869:     """split it"""
 1870:     ret=None
 1871:     nf=None
 1872:     i=0
 1873: 
 1874:     #ROC: why split \n first and then \r???
 1875:     if (type(fh) is StringType) or (type(fh) is UnicodeType):
 1876:         iter=fh.split("\n")
 1877:     else:
 1878:         iter=fh.readlines()
 1879:         
 1880:     for lineTmp in iter:
 1881:         lineTmp=lineTmp.replace(codecs.BOM_UTF8,'') # make sure that all BOM are removed..
 1882:         for line in lineTmp.split("\r"):
 1883:             #logging.log("Deal with: %s"%line)
 1884:             if ext:
 1885:                 i+=1
 1886:                 if (i%100)==0:
 1887:                     ext.result+="."
 1888:                 if i==10000:
 1889:                     i=0
 1890:                     ext.result+="<br>"
 1891:             #check if basket name is in the first line
 1892:             if line.find("#atf basket")>=0: #old convention
 1893:                 ret=line.replace('#atf basket ','')
 1894:                 ret=ret.split('_')[0]
 1895:             elif line.find("#basket:")>=0: #new convention
 1896:                 ret=line.replace('#basket: ','')
 1897:                 ret=ret.split('_')[0]
 1898: 
 1899:             else:
 1900:                 if (len(line.lstrip())>0) and (line.lstrip()[0]=="&"): #newfile
 1901:                     if nf:
 1902:                         nf.close() #close last file
 1903: 
 1904: 
 1905:                     filename=line[1:].split("=")[0].rstrip()+".atf"
 1906:                     if dir:
 1907:                         filename=os.path.join(dir,filename)
 1908:                     nf=file(filename,"w")
 1909:                     logging.info("open %s"%filename)
 1910:                 if nf:    
 1911:                     nf.write(line.replace("\n","")+"\n")
 1912: 
 1913:     try:        
 1914:         nf.close()
 1915:     except:
 1916:         pass
 1917:     
 1918:     if not((type(fh) is StringType) or (type(fh) is UnicodeType)):
 1919:         fh.close()
 1920:     return ret,len(os.listdir(dir))
 1921: 
 1922: 
 1923: class CDLIFileFolder(extVersionedFileFolder):
 1924:     """CDLI File Folder"""
 1925:     
 1926:     security=ClassSecurityInfo()
 1927:     meta_type="CDLI Folder"
 1928:     file_meta_type=['CDLI file']
 1929:     folder_meta_type=['CDLI Folder']
 1930: 
 1931:     file_catalog='CDLICatalog'
 1932: 
 1933:     #downloadCounter=0 # counts how many download for all files currently run, be mehr als 5 wird verweigert.
 1934:     tmpStore2={}
 1935: 
 1936:     def _newVersionedFile(self, id, title='', lockedBy=None, author=None):
 1937:         """factory for versioned files. to be overridden in derived classes."""
 1938:         logging.debug("_newVersionedFile(CDLI)")
 1939:         return CDLIFile(id, title, lockedBy=lockedBy, author=author)
 1940: 
 1941:     def setTemp(self,name,value):
 1942:         """set tmp"""
 1943: 
 1944:         setattr(self,name,value)
 1945:                                         
 1946:     deleteFileForm = PageTemplateFile("zpt/doDeleteFile", globals())
 1947:                                        
 1948:     def delete(self,ids,REQUEST=None):
 1949:         """delete these files"""
 1950:         if type(ids) is not ListType:
 1951:             ids=[ids]
 1952: 
 1953:         self.manage_delObjects(ids)
 1954:         
 1955:         if REQUEST is not None:
 1956:             return self.index_html()
 1957: 
 1958: 
 1959:     def getVersionNumbersFromIds(self,ids):
 1960:         """get the numbers of the current versions of documents described by their ids"""
 1961:         
 1962:         ret=[]
 1963:         searchStr=" OR ".join(ids)
 1964:         
 1965:         founds=self.CDLICatalog.search({'title':searchStr})
 1966:         
 1967:         for found in founds:
 1968:             lastVersion=found.getObject().getContentObject()
 1969:             ret.append((found.getId,lastVersion))
 1970:         
 1971:         return ret
 1972:     
 1973:     def getFile(self,fn):
 1974:         """get the content of the file fn"""
 1975:         logging.debug("getFile: %s"%repr(fn))
 1976:         if not self.hasObject(fn):
 1977:             # search deeper
 1978:             founds=getattr(self, self.file_catalog).search({'textid':fn})
 1979:             if founds:
 1980:                 obj=founds[0].getObject().getContentObject()
 1981:             else:
 1982:                 return "" 
 1983:         else:
 1984:             obj = self[fn].getContentObject()
 1985: 
 1986:         return obj.getData()[0:] 
 1987:  
 1988:     
 1989:     def checkCatalog(self,fn):
 1990:         """check if fn is in the catalog"""
 1991:         #TODO add checkCatalog
 1992:         
 1993:                                    
 1994:     def findObjectsFromListWithVersion(self,list,author=None):
 1995:         """find objects from a list with versions
 1996:         @param list: list of tuples  (cdliFile,version)
 1997:         """
 1998:         #self.REQUEST.SESSION['fileIds']=list#store fieldIds in session for further usage
 1999:         #self.REQUEST.SESSION['searchList']=self.REQUEST.SESSION['fileIds']
 2000:         
 2001:         pt=getattr(self,'filelistVersioned.html')
 2002:             
 2003:         return pt(search=list,author=author)
 2004:     
 2005:     
 2006:     def getAllPNumbers(self):
 2007:         """get a list of all files (resp their p-numbers) stored"""
 2008:         
 2009:         ret=[x.getId for x in  self.CDLICatalog()]
 2010:      
 2011:         return ret
 2012:     
 2013:     def expandFile(self,fileId,fileTree):
 2014:         """wildcard in fileID suche alle Treffer"""
 2015:         founds=self.CDLICatalog({'title':fileId})
 2016:         for found in founds:
 2017:             fileTree.add(found.getId)
 2018:             logging.debug("ADDD:"+found.getId)
 2019:          
 2020:     def findObjectsFromList(self,enterList=None,display=False,start=None,upload=None,list=None,basketName=None,numberOfObjects=None,RESPONSE=None,REQUEST=None,returnHash=False,hash=None):
 2021:         """findObjectsFromList (, TAB oder LINE separated)"""
 2022:                                        
 2023:         logging.debug("start: findObjectsFromList")
 2024:         #logging.debug("start: findObjectsFromList"+repr(list))
 2025:         
 2026:             
 2027:         if upload: # list from file upload
 2028:             txt=upload.read()
 2029:                                        
 2030:         if enterList:
 2031:             txt=enterList
 2032:             
 2033:         if upload or enterList:
 2034:             txt=txt.replace(",","\n")
 2035:             txt=txt.replace("\t","\n")
 2036:             txt=txt.replace("\r","\n")
 2037:             idsTmp=txt.split("\n")
 2038:             ids=[]
 2039:             for id in idsTmp: # make sure that no empty lines
 2040:                 idTmp=id.lstrip().rstrip()
 2041:                 if len(idTmp)>0:
 2042:                     
 2043:                     ids.append(idTmp)
 2044:                     
 2045:             #self.REQUEST.SESSION['ids']=" OR ".join(ids)
 2046: 
 2047:             pt=getattr(self,'filelist.html')
 2048:             self.REQUEST.SESSION['searchList']=ids
 2049:             return pt(search=ids)
 2050:         
 2051:         if basketName:
 2052:             #TODO: get rid of one of these..
 2053:             
 2054:             pt=getattr(self,'filelist.html')
 2055:             return pt(basketName=basketName,numberOfObjects=numberOfObjects)
 2056:         
 2057:         if hash is not None and hasattr(self.cdliRoot,'v_tmpStore') and self.cdliRoot.v_tmpStore.has_key(hash): 
 2058:                
 2059:                logging.debug("asking for storage2")
 2060:                result =self.cdliRoot.v_tmpStore[hash]
 2061:                if result:
 2062:                    logging.debug("give result from storage2")
 2063:                    return hash,self.cdliRoot.v_tmpStore[hash]
 2064:           
 2065:         if list is not None: # got already a list
 2066:             
 2067:             logging.debug(" ----List version")
 2068:             ret=[]
 2069:             fileTree=Set()
 2070:             
 2071:             for fileId in list:
 2072:                
 2073:                 if fileId.find("*")>-1: #check for wildcards
 2074:                         self.expandFile(fileId,fileTree)
 2075:                         
 2076:                 elif len(fileId.split("."))==1:
 2077:                         fileId=fileId+".atf"
 2078:                         fileTree.add(fileId)
 2079:                 #logging.debug("   -----:"+fileId)
 2080:                 #ret+=self.CDLICatalog({'title':fileId})
 2081:                 #x =self.getFileObject(fileId)
 2082:                 #if x is not None:
 2083:                 #    ret.append(x)
 2084:                 
 2085:             
 2086:             
 2087:             ids = fileTree & self.v_file_ids
 2088:             #self.REQUEST.SESSION['fileIds']=ids#store fieldIds in session for further usage
 2089:             l=makelist(fileTree)[0:]
 2090:             logging.debug("l-list:"+repr(l))
 2091:             self.REQUEST.SESSION['fileIds']=l#store fieldIds in session for further usage
 2092:             self.REQUEST.SESSION['searchList']=l
 2093:             #self.REQUEST.SESSION['searchList']=['P000001.atf']
 2094:           
 2095:             
 2096:             hash = md5.new(repr(makelist(fileTree))).hexdigest() # erzeuge hash als identification
 2097:             self.REQUEST.SESSION['hash']=hash
 2098:             #TODO: do I need garbage collection for v_tmpStore ?
 2099:             
 2100:             #logging.debug("Hash:"+repr(hash))
 2101: #        
 2102: #            if hasattr(self.cdliRoot,'v_tmpStore') and self.cdliRoot.v_tmpStore.has_key(hash): 
 2103: #               logging.debug("asking for storage")
 2104: #               res=self.cdliRoot.v_tmpStore[hash]
 2105: #               if res:
 2106: #                   if returnHash == True:
 2107: #                       return hash,res
 2108: #                   return res
 2109:           
 2110:             #TODO: get rid of one of these..
 2111:             #ids=[x.getObject().getId() for x in ret]
 2112:             ret=[(self.getFileObject(x),self.getFileObjectLastVersion(x)) for x in ids]
 2113:             
 2114:             #self.REQUEST.SESSION['fileIds']=ids#store fieldIds in session for further usage
 2115:             #self.REQUEST.SESSION['searchList']=self.REQUEST.SESSION['fileIds']
 2116:            
 2117:             if display:
 2118:                 pt=getattr(self,'filelist.html')
 2119:                 
 2120:                 return pt(search=ids)
 2121:             else:     
 2122:                 #self.REQUEST.SESSION['hash'] = ret # store in session 
 2123:                 if not hasattr(self,'v_tmpStore'):
 2124:                     self.cdliRoot.v_tmpStore={}
 2125:                 #logging.debug("HHHHHHNEU:"+repr(self.makelist(ids)))
 2126:                 #logging.debug("HHHHHHNEU:"+repr(hash))
 2127:                 self.cdliRoot.v_tmpStore[hash] = ret # store in session 
 2128:                 if returnHash == True:
 2129:                     return hash,ret
 2130:                 return ret
 2131:         
 2132:         
 2133:         
 2134:         if start:
 2135:             RESPONSE.redirect("filelist.html?start:int="+str(start))
 2136: 
 2137:     security.declareProtected('Manage','createAllFilesAsSingleFile')
 2138:     def createAllFilesAsSingleFile(self,RESPONSE=None):
 2139:         """download all files"""
 2140:         
 2141:         def sortF(x,y):
 2142:             return cmp(x[0],y[0])
 2143:         
 2144:         catalog=getattr(self,self.file_catalog)
 2145:         #tf,tfilename=mkstemp()
 2146:         if not hasattr(self.temp_folder,'downloadCounter'):
 2147:             self.temp_folder.downloadCounter=0
 2148: 
 2149:         if getattr(self.temp_folder,'downloadCounter',0) > 5:
 2150:             return """I am sorry, currently the server has to many requests for downloads, please come back later!"""
 2151: 
 2152:         self.temp_folder.downloadCounter+=1
 2153:         self._p_changed=1
 2154:         transaction.get().commit()
 2155:        
 2156:         list=[(x.getId,x) for x in catalog()]
 2157:         list.sort(sortF)
 2158:         
 2159: 
 2160:         
 2161:         RESPONSE.setHeader("Content-Disposition","""attachement; filename=%s"""%"all.atf")
 2162:         RESPONSE.setHeader("Content-Type","application/octet-stream")
 2163:         tmp=""
 2164:         for l in list:
 2165:             obj=l[1].getObject()
 2166:             
 2167:             if obj.meta_type=="CDLI file":
 2168:                 
 2169:                 #os.write(tf,obj.getLastVersion().data)
 2170:                 if RESPONSE:
 2171:                     RESPONSE.write(obj.getData()[0:])
 2172:                     RESPONSE.write("\n")
 2173:                 self.temp_folder.downloadCounter-=1 
 2174:                 self._p_changed=1
 2175:         transaction.get().commit()
 2176:         #os.close(tf)
 2177:         #RESPONSE.redirect(self.absolute_url()+"/downloadFile?fn="%tfilename)
 2178:         return True
 2179:     
 2180:     def downloadFile(self,fn):
 2181:         """download fn - not used yet"""
 2182:         self.REQUEST.RESPONSE.setHeader("Content-Disposition","""attachement; filename=%s"""%self.getLastVersion().getId())
 2183:         self.REQUEST.RESPONSE.setHeader("Content-Type","application/octet-stream")
 2184:         self.REQUEST.RESPONSE.write(file(fn).read())
 2185:         
 2186:       
 2187:                 
 2188:     def hasParent(self):
 2189:         """returns true falls subfolder"""
 2190:       
 2191:         if self.aq_parent.meta_type in self.folder_meta_type:
 2192:             return True
 2193:         else:
 2194:             return False
 2195:         
 2196:     def getFolders(self):
 2197:         """get all subfolders"""
 2198:         ret=[]
 2199:         folders=self.ZopeFind(self,obj_metatypes=self.folder_meta_type)
 2200:         for folder in folders:
 2201:             ret.append((folder[1],
 2202:                         len(self.ZopeFind(folder[1],obj_metatypes=self.folder_meta_type)),
 2203:                         len(self.ZopeFind(folder[1],obj_metatypes=self.file_meta_type))
 2204:                         ))
 2205:         return ret
 2206:     
 2207:             
 2208:     security.declareProtected('manage','index_html')
 2209:     def index_html(self):
 2210:         """main"""
 2211:         ext=self.ZopeFind(self,obj_ids=["index.html"])
 2212:         if ext:
 2213:             return ext[0][1]()
 2214:         
 2215:         pt=PageTemplateFile(os.path.join(package_home(globals()),'zpt','CDLIFileFolderMain')).__of__(self)
 2216:         return pt()
 2217:     
 2218:     
# Add form for CDLI file folders, rendered from the 'dtml/folderAdd' template.
manage_addCDLIFileFolderForm=DTMLFile('dtml/folderAdd', globals())
 2220: 
 2221:     
 2222: def manage_addCDLIFileFolder(self, id, title='',
 2223:                      createPublic=0,
 2224:                      createUserF=0,
 2225:                      REQUEST=None):
 2226:     """Add a new Folder object with id *id*.
 2227: 
 2228:     If the 'createPublic' and 'createUserF' parameters are set to any true
 2229:     value, an 'index_html' and a 'UserFolder' objects are created respectively
 2230:     in the new folder.
 2231:     """
 2232:     ob=CDLIFileFolder()
 2233:     ob.id=str(id)
 2234:     ob.title=title
 2235:     self._setObject(id, ob)
 2236:     ob=self._getOb(id)
 2237: 
 2238:     checkPermission=getSecurityManager().checkPermission
 2239: 
 2240:     if createUserF:
 2241:         if not checkPermission('Add User Folders', ob):
 2242:             raise Unauthorized, (
 2243:                   'You are not authorized to add User Folders.'
 2244:                   )
 2245:         ob.manage_addUserFolder()
 2246: 
 2247:   
 2248:     if REQUEST is not None:
 2249:         return self.manage_main(self, REQUEST, update_menu=1)
 2250:     
class CDLIRoot(Folder):
    """main folder for cdli"""

    meta_type="CDLIRoot"
    downloadCounterBaskets=0 # counts the current basket downloads if counter > 10 no downloads are possible

    # name of a catalog, as a string
    # NOTE(review): presumably the catalog that holds the CDLI files - confirm
    file_catalog = 'CDLICatalog'

    # word splitter for search
    # Both splitters are created once when the class is defined and are
    # shared by all instances; they are keyed by index name.
    splitter = {'words':cdliSplitter.wordSplitter(),
                'graphemes':cdliSplitter.graphemeSplitter()}
 2262:     
 2263:     
 2264:     def viewATF(self,id,RESPONSE):
 2265:         """view an Object"""
 2266:         ob = self.CDLICatalog({'title':id})
 2267:         logging.debug(ob[0].getObject().getLastVersion().absolute_url()+"/view")
 2268:         if len(ob)>0:
 2269:             RESPONSE.redirect(ob[0].getObject().getLastVersion().absolute_url()+"/view")
 2270:         return "not found"
 2271:     
 2272:     def history(self,id,RESPONSE):
 2273:         """view an Object"""
 2274:         ob = self.CDLICatalog({'title':id})
 2275:         if len(ob)>0:
 2276:             RESPONSE.redirect(ob[0].absolute_url+"/history")
 2277:         return "not found"
 2278:     
 2279: 
 2280:     def downloadLocked(self,id,RESPONSE):
 2281:         """view an Object"""
 2282:         ob = self.CDLICatalog({'title':id})
 2283:         if len(ob)>0:
 2284:             RESPONSE.redirect(ob[0].absolute_url+"/downloadLocked")
 2285:         return "not found"
 2286:     
 2287:     def download(self,id,RESPONSE):
 2288:         """view an Object"""
 2289:         ob = self.CDLICatalog({'title':id})
 2290:         if len(ob)>0:
 2291:             RESPONSE.redirect(ob[0].getLastVersion().absolute_url())
 2292:         return "not found"
 2293:     def addCDLIFileObjectForm(self,id,RESPONSE):
 2294:         """view an Object"""
 2295:         ob = self.CDLICatalog({'title':id})
 2296:         if len(ob)>0:
 2297:             RESPONSE.redirect(ob[0].absolute_url+"/addCDLIFileObjectForm")
 2298:         return "not found"
 2299:     
 2300:     def addVersionedFileObjectForm(self,id,RESPONSE):
 2301:         """view an Object"""
 2302:         ob = self.CDLICatalog({'title':id})
 2303:         if len(ob)>0:
 2304:             RESPONSE.redirect(ob[0].absolute_url+"/addVersionedFileObjectForm")
 2305:         return "not found"
 2306:     
 2307:     def unlock(self,id,RESPONSE):
 2308:         """view an Object"""
 2309:         ob = self.CDLICatalog({'title':id})
 2310:         if len(ob)>0:
 2311:             RESPONSE.redirect(ob[0].absolute_url+"/unlock")
 2312:         return "not found"
 2313:     
 2314:     def getFileObject(self,fileId):
 2315:         """get an object"""
 2316:         x=self.v_files.get(fileId)
 2317:         #logging.debug(x)
 2318:         return x
 2319:     
 2320:     def getFileObjectLastVersion(self,fileId):
 2321:         """get an object"""
 2322:         x=self.v_files_lastVersion.get(fileId)
 2323:         #logging.debug(x)
 2324:         return x
 2325:     
 2326:     def showFileIds(self):
 2327:         """showIds"""
 2328:         return self.v_file_ids
 2329:     
 2330:     def generateFileBTree(self):
 2331:         """erzeuge einen Btree aus allen Files"""
 2332:         self.v_files = OOBTree()
 2333:         self.v_files_lastVersion = OOBTree()
 2334:         self.v_file_ids = Set()
 2335:         
 2336:         for x in self.CDLICatalog.searchResults():
 2337:             
 2338:             self.v_files.update({x.getId:x.getObject()})
 2339:             self.v_files_lastVersion.update({x.getId:x.getObject().getLastVersion()})
 2340:             self.v_file_ids.add(x.getId)
 2341:             logging.debug("add:"+x.getId+"XXX"+repr(x.getObject()))
 2342:         
 2343:         return True
 2344:     
 2345:     
 2346:     def updateOrAddToFileBTree(self,obj):
 2347:         """update a BTree"""
 2348:         self.v_files.update({obj.getId():obj})
 2349:         self.v_files_lastVersion.update({obj.getId():obj.getLastVersion()})
 2350:         
 2351:         self.v_file_ids.add(obj.getId())
 2352:         logging.debug("update:"+obj.getId()+"XXX"+repr(obj))
 2353:         
 2354:     def deleteFromBTree(self,objId):
 2355:         """delete an obj"""
 2356:         self.v_files.pop(objId)
 2357:         self.v_files_lastVersion.pop(objId)
 2358:         self.v_file_ids.remove(objId)
 2359:         
 2360: 
 2361:  
 2362:     def deleteFiles(self,ids):
 2363:         """delete files"""
 2364:         for id in ids:
 2365:             founds=self.CDLICatalog.search({'title':id.split(".")[0]})
 2366:             if founds:
 2367:                 logging.debug("deleting %s"%founds)
 2368:                 folder=founds[0].getObject().aq_parent #get the parent folder of the object
 2369:                 logging.debug("deleting from %s"%folder)
 2370:                 cut=folder.delete([founds[0].getId]) #cut it out
 2371: 
 2372: 
 2373: 
 2374:     def searchText(self, query, index='graphemes'):
 2375:         """searches query in the fulltext index and returns a list of file ids/P-numbers"""
 2376:         # see also: http://www.plope.com/Books/2_7Edition/SearchingZCatalog.stx#2-13
 2377:         logging.debug("searchtext for '%s' in index %s"%(query,index))
 2378:         #import Products.ZCTextIndex.QueryParser
 2379:         #qp = QueryParser.QueryParser()
 2380:         #logging.debug()
 2381:         idxQuery = {index:{'query':query}}
 2382:         idx = getattr(self, self.file_catalog)
 2383:         # do search
 2384:         resultset = idx.search(query_request=idxQuery,sort_index='textid')
 2385:         # put only the P-Number in the result 
 2386:         results = [res.getId[:7] for res in resultset]
 2387:         logging.debug("searchtext: found %d texts"%len(results))
 2388:         return results
 2389: 
 2390: 
 2391:     def getFile(self, pnum):
 2392:         """get the translit file with the given pnum"""
 2393:         f = getattr(self, self.file_catalog).search({'textid':pnum})
 2394:         if not f:
 2395:             return ""
 2396:         
 2397:         return f[0].getObject().getData()
 2398:          
 2399: 
 2400:     def showFile(self,fileId,wholePage=False):
 2401:         """show a file
 2402:         @param fileId: P-Number of the document to be displayed
 2403:         """
 2404:         f=getattr(self, self.file_catalog).search({'textid':fileId})
 2405:         if not f:
 2406:             return ""
 2407:         
 2408:         if wholePage:
 2409:             logging.debug("show whole page")
 2410:             return f[0].getObject().getContentObject().view()
 2411:         else:
 2412:             return f[0].getObject().getLastVersionFormattedData()
 2413:     
 2414: 
 2415:     def showWordInFile(self,fileId,word,indexName='graphemes',regExp=False,):
 2416:         """get lines with word from FileId"""
 2417:         logging.debug("showwordinfile word='%s' index=%s file=%s"%(word,indexName,fileId)) 
 2418:         
 2419:         file = formatAtfFullLineNum(self.getFile(fileId))
 2420:         ret=[]
 2421:         
 2422:         # add whitespace before and whitespace and line-end to splitter bounds expressions
 2423:         bounds = self.splitter[indexName].bounds
 2424:         splitexp = "(%s|\s)(%%s)(%s|\s|\Z)"%(bounds,bounds)
 2425:         # clean word expression 
 2426:         # TODO: this should use QueryParser itself
 2427:         # take out double quotes
 2428:         word = word.replace('"','')
 2429:         # take out ignorable signs
 2430:         ignorable = self.splitter[indexName].ignorex
 2431:         word = ignorable.sub('', word)
 2432:         # compile into regexp objects and escape parens
 2433:         wordlist = [re.compile(splitexp%re.escape(w)) for w in word.split(' ')]
 2434:             
 2435:         for line in file.splitlines():
 2436:             for word in wordlist:
 2437:                 #logging.debug("showwordinfile: searching for %s in %s"%(word.pattern,ignoreable.sub('',line)))
 2438:                 if word.search(ignorable.sub('',line)):
 2439:                     line = formatAtfLineHtml(line)
 2440:                     ret.append(line)
 2441:                     break
 2442:                     
 2443:         return ret
 2444: 
 2445:     
 2446:     def showWordInFiles(self,fileIds,word,indexName='graphemes',regExp=False):
 2447:         """
 2448:         get lines with word from all ids in list FileIds.
 2449:         returns dict with id:lines pairs.
 2450:         """
 2451:         logging.debug("showwordinfiles word='%s' index=%s file=%s"%(word,indexName,fileIds))
 2452:         
 2453:         return dict([(id,self.showWordInFile(id, word, indexName, regExp)) for id in fileIds])
 2454:     
 2455: 
 2456:     def tagWordInFile(self,fileId,word,indexName='graphemes',regExp=False):
 2457:         """get text with word highlighted from FileId"""
 2458:         logging.debug("tagwordinfile word='%s' index=%s file=%s"%(word,indexName,fileId)) 
 2459:         
 2460:         file=self.getFile(fileId)
 2461:         tagStart=u'<span class="found">'
 2462:         tagEnd=u'</span>'
 2463:         tagStr=tagStart + u'%%s' + tagEnd
 2464:         ret=[]
 2465:         
 2466:         # add whitespace to splitter bounds expressions and compile into regexp object
 2467:         bounds = self.splitter[indexName].bounds
 2468:         wordsplit = re.compile("(%s|\s)"%bounds)
 2469:         # clean word expression 
 2470:         # TODO: this should use QueryParser itself
 2471:         word = word.replace('"','') # take out double quotes
 2472:         # take out ignoreable signs
 2473:         ignorable = self.splitter[indexName].ignorex
 2474:         word = ignorable.sub('', word)
 2475:         # split search terms by blanks
 2476:         words = word.split(' ')
 2477:         # split search terms again (for grapheme search with words)
 2478:         splitwords = dict(((w,self.splitter[indexName].process([w])) for w in words))
 2479:             
 2480:         for line in file.splitlines():
 2481:             line = unicodify(line)
 2482:             # ignore lemma and other lines
 2483:             if line.lstrip().startswith('#lem:'):
 2484:                 continue
 2485:             # ignore p-num line
 2486:             if line.startswith('&P'):
 2487:                 continue
 2488:             # ignore version lines
 2489:             if line.startswith('#version'):
 2490:                 continue
 2491:             # ignore atf type lines
 2492:             if line.startswith('#atf:'):
 2493:                 continue
 2494: 
 2495:             # first scan
 2496:             hitwords = []
 2497:             for w in words:
 2498:                 if ignorable.sub('',line).find(w) > -1:
 2499:                     # word is in line
 2500:                     # append split word for grapheme search with words
 2501:                     hitwords.extend(splitwords[w])
 2502:                     #hitwords.extend(wordsplit.split(w))
 2503:                    
 2504:             # examine hits closer
 2505:             if hitwords:
 2506:                 # split line into words
 2507:                 parts = wordsplit.split(line)
 2508:                 line = ""
 2509:                 for p in parts:
 2510:                     #logging.debug("tagwordinfile: searching for %s in %s"%(p,hitwords))
 2511:                     # reassemble line
 2512:                     if ignorable.sub('', p) in hitwords:
 2513:                         #logging.debug("tagwordinfile: found %s in %s"%(p,hitwords))
 2514:                         # this part was found
 2515:                         line += tagStart + formatAtfHtml(p) + tagEnd
 2516:                     else:
 2517:                         line += formatAtfHtml(p)
 2518:                 
 2519:             else:
 2520:                 # no hits
 2521:                 line = formatAtfHtml(line)
 2522:             
 2523:             ret.append(line)
 2524:                         
 2525:         return u'<br>\n'.join(ret)
 2526: 
 2527: 
 2528: 
 2529:     def tagWordInFiles(self,fileIds,word,indexName='graphemes',regExp=False):
 2530:         """
 2531:         get texts with highlighted word from all ids in list FileIds.
 2532:         returns dict with id:text pairs.
 2533:         """
 2534:         logging.debug("tagwordinfiles word='%s' index=%s file=%s"%(word,indexName,fileIds)) 
 2535:         return dict([(id,self.tagWordInFile(id, word, indexName, regExp)) for id in fileIds])
 2536:     
 2537: 
 2538:     def getFileVersionList(self, pnum):
 2539:         """get the version history as a list for the translit file with the given pnum"""
 2540:         f = getattr(self, self.file_catalog).search({'textid':pnum})
 2541:         if not f:
 2542:             return []
 2543:         
 2544:         return f[0].getObject().getVersionList()
 2545:          
 2546: 
 2547:     def URLquote(self,str):
 2548:         """quote url"""
 2549:         return urllib.quote(str)
 2550:     
 2551:     def URLunquote(self,str):
 2552:         """unquote url"""
 2553:         return urllib.unquote(str)
 2554:     
 2555:     def URLquote_plus(self,str):
 2556:         """quote url"""
 2557:         return urllib.quote_plus(str)
 2558:     
 2559:     def URLunquote_plus(self,str):
 2560:         """unquote url"""
 2561:         return urllib.unquote_plus(str)
 2562:     
 2563:     
 2564:     def forceunlock(self):
 2565:         "break all locks"
 2566:         ret=[]
 2567:         for f in self.ZopeFind(self,obj_metatypes="CDLI file",search_sub=1):
 2568:            un=f[1].forceunlock()
 2569: 
 2570:            if un and un !="":
 2571:                ret.append((f[0],un))
 2572: 
 2573:         return ret
 2574:                                         
 2575: 
 2576:     def getChangesByAuthor(self,author,n=100):
 2577:         """getChangesByAuthor"""
 2578:         zcat=self.CDLIObjectsCatalog
 2579:         res=zcat({'lastEditor':author,
 2580:                      'sort_on':'getTime',
 2581:                      'sort_order':'descending',
 2582:                      'sort_limit':n})[:n ]
 2583:                        
 2584:         return res
 2585:     
 2586:     def getChangesByAuthor_html(self,author,n=100):
 2587:         """html output for changes by author"""
 2588:         tmp={}
 2589:         list=[]                         
 2590:         for x in self.getChangesByAuthor(author):
 2591:            nr=x.getObject().getVersionNumber()
 2592:            id=x.getObject().aq_parent.getId()
 2593:            #hinzufuegen, wenn Version neuer als die 
 2594:            if tmp.get(id,(0,0))[1] < nr:
 2595:                 tmp[id]=(x.getObject().aq_parent,nr)
 2596: 
 2597:      
 2598:         return self.cdli_main.findObjectsFromListWithVersion(list=tmp.values(),author=author)           
 2599:         
 2600:     def getLastChanges(self,n=100):
 2601:         """get the last n changes""" 
 2602:         n=int(n)                   
 2603:         zcat=self.CDLICatalog
 2604:         return zcat({'sort_on':'getLastChangeDate',
 2605:                      'sort_order':'descending',
 2606:                      'sort_limit':n})[:n ]
 2607:      
 2608:     
 2609:     def getLastChanges_html(self,n=100):
 2610:         """get the last n changes"""
 2611:         list = [x.getId for x in self.getLastChanges(n)]
 2612:         return self.cdli_main.findObjectsFromList(list=list,display=True)
 2613:                                        
 2614:     def refreshTxt(self,txt="",threadName=None):
 2615:         """txt fuer refresh"""
 2616:   
 2617:         return """ 2;url=%s?repeat=%s """%(self.absolute_url()+txt,threadName)
 2618: 
 2619:     def refreshTxtBasket(self,txt="",threadName=None):
 2620:         """txt fuer refresh"""
 2621:   
 2622:         return """ 2;url=%s?repeat=%s """%(txt,threadName)
 2623: 
 2624:     
 2625:     def getResult(self,threadName=None):
 2626:        """result of thread"""
 2627:        try:
 2628:         return self._v_uploadATF[threadName].getResult()
 2629:        except:
 2630:         return "One moment, please"
 2631:     
 2632:         
 2633:     def checkThreads(self):
 2634:         """check threads"""
 2635:         ret="<html><body>"
 2636:         for thread in threading.enumerate():
 2637:            ret+="<p>%s (%s): %s</p>"%(repr(thread),thread.getName(),thread.isAlive())
 2638:        
 2639:         return ret
 2640:                                        
 2641:                                            
 2642:     def uploadATFRPC(self,data,username):
 2643:         """upload an atffile via xml-rpc"""
 2644:         uploader=uploadATFThread()
 2645:         
 2646:         #generate an random id for the upload object
 2647:         from random import randint
 2648:         if (not self.REQUEST.SESSION.get('idTmp',None)):
 2649: 
 2650:             idTmp=str(randint(0,1000000000))
 2651:             self.REQUEST.SESSION['idTmp']=idTmp
 2652:         else:
 2653:             idTmp=self.REQUEST.SESSION.get('idTmp',None)
 2654:             
 2655:         
 2656:         uploader.set(data,0,username,idTmp)
 2657:         
 2658:         stObj=uploader.run()
 2659:         
 2660:         processor=uploadATFfinallyThread()
 2661:         
 2662:         basketname=stObj.returnValue['basketNameFromFile']
 2663:         
 2664:         processor.set("uploadchanged",basketname=basketname,SESSION=stObj.returnValue,username=username,serverport=self.REQUEST['SERVER_PORT'])
 2665:         
 2666:         processor.run()
 2667:         
 2668:         
 2669:         return generateXMLReturn(stObj.returnValue)
 2670:         
    def uploadATF(self,repeat=None,upload=None,basketId=0,RESPONSE=None):
        """Upload an atf file / basket file in a background thread.

        Called without *repeat*, a new ``uploadATFThread`` is created,
        registered in ``self._v_uploadATF`` under its thread name, configured
        with *upload*, *basketId*, the authenticated user, the session's
        temporary id and the server port, and started.  A waiting page is
        returned (the parent's ``wait_template`` if one exists, otherwise
        ``zpt/uploadATFWait.zpt``).

        Called with *repeat* set to a thread name (as the waiting page does),
        the waiting page is returned again as long as that thread is known and
        has no ``returnValue`` yet.  Otherwise the ``returnValue`` stored on
        ``temp_folder`` under the session's temporary id is rendered with
        ``zpt/uploadCheck.zpt``.

        *RESPONSE* is not used in this method.
        """
        #self._v_uploadATF.returnValue=None

        # generate a random id for the upload thread, or reuse the one in the session
        from random import randint
        if (not self.REQUEST.SESSION.get('idTmp',None)):

            idTmp=str(randint(0,1000000000))
            self.REQUEST.SESSION['idTmp']=idTmp
        else:
            idTmp=self.REQUEST.SESSION.get('idTmp',None)


        threadName=repeat
        if not threadName or threadName=="":
            #new thread not called from the waiting page
            tmpVar=False  # NOTE(review): never read in this method

            thread=uploadATFThread()
            threadName=thread.getName()[0:]
            # the thread registry is created on first use
            if (not hasattr(self,'_v_uploadATF')):
                   self._v_uploadATF={}

            self._v_uploadATF[threadName]=thread
            #self._xmltrans.start()
            #thread=Thread(target=self._v_uploadATF)
            logging.info("set thread. extern")
            self._v_uploadATF[threadName].set(upload,basketId,self.REQUEST['AUTHENTICATED_USER'],idTmp,serverport=self.REQUEST['SERVER_PORT'])
            #thread.start()
            logging.info("start thread. extern")
            self._v_uploadATF[threadName].start()


            self.threadName=self._v_uploadATF[threadName].getName()[0:]
            # a 'wait_template' object in the parent takes precedence over the packaged page
            wait_template=self.aq_parent.ZopeFind(self.aq_parent,obj_ids=['wait_template'])

            if wait_template:
                return wait_template[0][1]()
            pt=PageTemplateFile(os.path.join(package_home(globals()),'zpt','uploadATFWait.zpt')).__of__(self)
            return pt(txt='/uploadATF',threadName=threadName)
            #_v_xmltrans.run()

        else:
            #recover thread, if lost
            if (not hasattr(self,'_v_uploadATF')):
               self._v_uploadATF={}
            if not self._v_uploadATF.get(threadName,None):
                 # look the thread up by name among the running threads
                 for thread in threading.enumerate():
                         if threadName == thread.getName():
                                       self._v_uploadATF[threadName]=thread

            # thread known but no returnValue yet: keep showing the waiting page
            if self._v_uploadATF.get(threadName,None) and (not self._v_uploadATF[threadName].returnValue):


                wait_template=self.aq_parent.ZopeFind(self.aq_parent,obj_ids=['wait_template'])
                if wait_template:
                        return wait_template[0][1]()

                pt=PageTemplateFile(os.path.join(package_home(globals()),'zpt','uploadATFWait.zpt')).__of__(self)

                return pt(txt='/uploadATF',threadName=threadName)

            else:
                # the result is read from the object stored in temp_folder under the session id
                tmp=getattr(self.temp_folder,idTmp).returnValue

                pt=PageTemplateFile(os.path.join(package_home(globals()),'zpt','uploadCheck.zpt')).__of__(self)

                return pt(changed=tmp['changed'],lockerrors=tmp['lockerrors'],errors=tmp['errors'],dir=tmp['dir'],newPs=tmp['newPs'],basketLen=tmp['basketLen'],numberOfFiles=tmp['numberOfFiles'],
                  basketNameFromId=tmp['basketNameFromId'],basketNameFromFile=tmp['basketNameFromFile'],basketId=tmp['basketId'])
 2741:                      
 2742:     def redoUpload(self,threadName):
 2743:        """redo the upload"""
 2744:        tmp=self.cdli_main.tmpStore2[threadName]
 2745:        pt=PageTemplateFile(os.path.join(package_home(globals()),'zpt','uploadCheck.zpt')).__of__(self)
 2746:        return pt(changed=tmp['changed'],lockerrors=tmp['lockerrors'],errors=tmp['errors'],dir=tmp['dir'],newPs=tmp['newPs'],basketLen=tmp['basketLen'],numberOfFiles=tmp['numberOfFiles'],
 2747:                   basketNameFromId=tmp['basketNameFromId'],basketNameFromFile=tmp['basketNameFromFile'],basketId=tmp['basketId'])
 2748:                  
    def uploadATFfinally(self,procedure='',comment="",basketname='',unlock=None,repeat=None,RESPONSE=None):
        """Perform the final step of the upload in a background thread.

        Called without *repeat*, a new ``uploadATFfinallyThread`` is created,
        registered in ``self._v_uploadATF`` under its thread name, configured
        with *procedure*, *comment*, *basketname*, *unlock*, the
        ``returnValue`` stored on ``temp_folder`` under the session's
        temporary id, the authenticated user and the server port, and
        started.  A waiting page is returned (the parent's ``wait_template``
        if one exists, otherwise ``zpt/uploadATFWait.zpt``).

        Called with *repeat* set to a thread name, the waiting page is
        returned again as long as that thread is known and its ``end``
        attribute is false.  Otherwise the session's 'idTmp' is reset to None,
        every entry of the stored result's 'changed' list is looked up in
        ``CDLICatalog`` and handed to ``cdliRoot.updateOrAddToFileBTree``, and
        the response is redirected to this object's URL if *RESPONSE* is
        given.
        """



        threadName=repeat
        if not threadName or threadName=="":
            # new thread: not called from the waiting page
            thread=uploadATFfinallyThread()
            threadName=thread.getName()[0:]

            # the thread registry is created on first use
            if (not hasattr(self,'_v_uploadATF')):
                                self._v_uploadATF={}


            self._v_uploadATF[threadName]=thread

            # the result of the preceding upload step is stored in temp_folder under the session id
            idTmp=self.REQUEST.SESSION['idTmp']
            stObj=getattr(self.temp_folder,idTmp)
            self._v_uploadATF[threadName].set(procedure,comment=comment,basketname=basketname,unlock=unlock,SESSION=stObj.returnValue,username=self.REQUEST['AUTHENTICATED_USER'],serverport=self.REQUEST['SERVER_PORT'])

            self._v_uploadATF[threadName].start()



            # a 'wait_template' object in the parent takes precedence over the packaged page
            wait_template=self.aq_parent.ZopeFind(self.aq_parent,obj_ids=['wait_template'])

            if wait_template:
                return wait_template[0][1]()
            pt=PageTemplateFile(os.path.join(package_home(globals()),'zpt','uploadATFWait.zpt')).__of__(self)

            return pt(txt='/uploadATFfinally',threadName=threadName)
            #_v_xmltrans.run()

        else:
            #recover thread, if lost
            if not hasattr(self,'_v_uploadATF'):
               self._v_uploadATF={}
            if not self._v_uploadATF.get(threadName,None):
                 # look the thread up by name among the running threads
                 for thread in threading.enumerate():
                         if threadName == thread.getName():
                                       self._v_uploadATF[threadName]=thread

            # thread known and not finished: keep showing the waiting page
            if self._v_uploadATF.get(threadName,None) and (self._v_uploadATF[threadName] is not None) and (not self._v_uploadATF[threadName].end) :

                wait_template=self.aq_parent.ZopeFind(self.aq_parent,obj_ids=['wait_template'])
                if wait_template:
                        return wait_template[0][1]()

                pt=PageTemplateFile(os.path.join(package_home(globals()),'zpt','uploadATFWait.zpt')).__of__(self)
                return pt(txt='/uploadATFfinally',threadName=threadName)
            else:


              idTmp=self.REQUEST.SESSION['idTmp']
              stObj=getattr(self.temp_folder,idTmp)
              # the temporary id is cleared so the next upload gets a fresh one
              self.REQUEST.SESSION['idTmp']=None

              #update changed
              logging.debug("dir:"+repr(stObj.returnValue['changed']))
              for x in stObj.returnValue['changed']:
                    # x[0] is used as the catalog title of the changed file
                    ob=self.CDLICatalog.search({'title':x[0]})

                    # NOTE(review): ob[0] raises IndexError if the catalog has no entry for x[0]
                    self.cdliRoot.updateOrAddToFileBTree(ob[0].getObject())
              if RESPONSE is not None:
                  RESPONSE.redirect(self.absolute_url())
 2814: 
 2815:     def importFiles(self,comment="",author="" ,folderName="/Users/dwinter/atf", files=None,ext=None):
 2816:         """import files"""
 2817:         logging.debug("importFiles folderName=%s files=%s ext=%s"%(folderName,files,ext))
 2818:         root=self.cdli_main
 2819:         count=0
 2820:         if not files:
 2821:             files=os.listdir(folderName)
 2822:             
 2823:         for f in files:
 2824:             folder=f[0:3]
 2825:             f2=f[0:5]
 2826:             
 2827:             #check if main folder PXX already exists
 2828:             obj=self.ZopeFind(root,obj_ids=[folder])
 2829:             logging.debug("importFiles: folder=%s f2=%s obj=%s"%(folder,f2,obj)) 
 2830:             if ext:
 2831:                 ext.result="<p>adding: %s </p>"%f+ext.result
 2832: 
 2833:             
 2834:             if not obj: # if not create it
 2835:                 manage_addCDLIFileFolder(root,folder,folder)
 2836:                 fobj=getattr(root,folder)
 2837:                 #transaction.get().commit()                           
 2838: 
 2839:             else:
 2840:                 fobj=obj[0][1]
 2841:             
 2842:             #check IF PYYYYY already exist
 2843:             obj2=fobj.ZopeFind(fobj,obj_ids=[f2])
 2844:             logging.debug("importFiles: fobj=%s obj2=%s"%(fobj,obj2)) 
 2845:         
 2846:             if not obj2:# if not create it
 2847:                 manage_addCDLIFileFolder(fobj,f2,f2)
 2848:                 fobj2=getattr(fobj,f2)
 2849:         
 2850:             else:
 2851:                 fobj2=obj2[0][1]
 2852:               
 2853:             # not add the file
 2854:             file2=os.path.join(folderName,f)  
 2855:             id=f
 2856:             logging.debug("importFiles: addCDLIFile fobj2=%s, f=%s file2=%s"%(fobj2,repr(f),repr(file2)))
 2857:             fobj2.addFile(vC='',file=file(file2),author=author,newName=f)
 2858:             count+=1
 2859:             
 2860:             #now add the file to the storage
 2861:             ob = getattr(fobj2,f)
 2862:             self.cdliRoot.updateOrAddToFileBTree(ob)
 2863:             
 2864:             if count%100==0:
 2865:                 logging.debug("importfiles: committing")
 2866:                 transaction.get().commit()
 2867: 
 2868:         transaction.get().commit()
 2869:         return "ok"
 2870:          
 2871: 
# Form object loaded from the DTML file 'dtml/rootAdd'.
# NOTE(review): presumably the add form whose submission is handled by
# manage_addCDLIRoot -- confirm against the product registration.
manage_addCDLIRootForm=DTMLFile('dtml/rootAdd', globals())
 2873: 
 2874:     
 2875: def manage_addCDLIRoot(self, id, title='',
 2876:                      createPublic=0,
 2877:                      createUserF=0,
 2878:                      REQUEST=None):
 2879:     """Add a new Folder object with id *id*.
 2880: 
 2881:     If the 'createPublic' and 'createUserF' parameters are set to any true
 2882:     value, an 'index_html' and a 'UserFolder' objects are created respectively
 2883:     in the new folder.
 2884:     """
 2885:     ob=CDLIRoot()
 2886:     ob.id=str(id)
 2887:     ob.title=title
 2888:     try:
 2889:         self._setObject(id, ob)
 2890:     except:
 2891:         pass
 2892:     ob=self._getOb(id)
 2893: 
 2894:     checkPermission=getSecurityManager().checkPermission
 2895: 
 2896:     if createUserF:
 2897:         if not checkPermission('Add User Folders', ob):
 2898:             raise Unauthorized, (
 2899:                   'You are not authorized to add User Folders.'
 2900:                   )
 2901:         ob.manage_addUserFolder()
 2902: 
 2903:   
 2904:     if REQUEST is not None:
 2905:         return self.manage_main(self, REQUEST, update_menu=1)    
 2906:  

FreeBSD-CVSweb <freebsd-cvsweb@FreeBSD.org>