cdli/cdli_files.py - diff

Return to cdli_files.py CVS log

Up to [Repository] / cdli

Diff for /cdli/cdli_files.py between versions 1.79 and 1.86

-version 1.79, 2007/08/31 14:22:52
+version 1.86, 2008/09/29 12:37:37
  Line 21  from ZPublisher.HTTPRequest import HTTPR
  from ZPublisher.HTTPResponse import HTTPResponse
  from ZPublisher.BaseRequest import RequestContainer
  import threading
- from BTrees.OOBTree import OOBTree
+ from BTrees.OOBTree import OOBTree, OOTreeSet
  import logging
  import transaction
  import copy
  import codecs
  import sys
+ from BTrees.IOBTree import IOBTree
+ import cdliSplitter
+ from sets import Set
+ import md5
+ def makelist(mySet):
+         x = list(mySet)
+         x.sort()
+         return x
  def unicodify(s):
      """decode str (utf-8 or latin-1 representation) into unicode object"""
- Line 50  def utf8ify(s):
+ Line 60  def utf8ify(s):
      else:
          return s.encode('utf-8')
+ def formatAtfHtml(l):
+     """escape special ATF characters for HTML"""
+     if not l:
+         return ""
+     # replace &
+     l = l.replace('&','&amp;')
+     # replace angular brackets
+     l = l.replace('<','&lt;')
+     l = l.replace('>','&gt;')
+     return l
+ def formatAtfLineHtml(l, nolemma=True):
+     """format ATF line for HTML"""
+     if not l:
+         return ""
+     if nolemma:
+         # ignore lemma lines
+         if l.lstrip().startswith('#lem:'):
+             return ""
+     return formatAtfHtml(l)
+ def formatAtfFullLineNum(txt, nolemma=True):
+     """format full line numbers in ATF text"""
+     # surface codes
+     surfaces = {'@obverse':'obv',
+                 '@reverse':'rev',
+                 '@surface':'surface',
+                 '@edge':'edge',
+                 '@left':'left',
+                 '@right':'right',
+                 '@top':'top',
+                 '@bottom':'bottom',
+                 '@face':'face',
+                 '@seal':'seal'}
+     if not txt:
+         return ""
+     ret = []
+     surf = ""
+     col = ""
+     for line in txt.splitlines():
+         line = unicodify(line)
+         if line and line[0] == '@':
+             # surface or column
+             words = line.split(' ')
+             if words[0] in surfaces:
+                 surf = line.replace(words[0],surfaces[words[0]]).strip()
+             elif words[0] == '@column':
+                 col = ' '.join(words[1:])
+         elif line and line[0] in '123456789':
+             # ordinary line -> add line number
+             line = "%s:%s:%s"%(surf,col,line)
+         ret.append(line)
+     return '\n'.join(ret)
  def generateXMLReturn(hash):
      """erzeugt das xml file als returnwert fuer uploadATFRPC"""
- Line 76  def generateXMLReturn(hash):
+ Line 151  def generateXMLReturn(hash):
      return ret
  def unique(s):
      """Return a list of the elements in s, but without duplicates.
- Line 253  class uploadATFfinallyThread(Thread):
+ Line 320  class uploadATFfinallyThread(Thread):
          self.result+="<h2>Start processing</h2>"
          #shall I only upload the changed files?
-         logging.info("uploadATFfinally procedure: %s"%procedure)
+         logging.debug("uploadATFfinally procedure: %s"%procedure)
          if procedure=="uploadchanged":
              changed=[x[0] for x in SESSION.get('changed',[])]
              uploadFns=changed+SESSION.get('newPs',[])
- Line 274  class uploadATFfinallyThread(Thread):
+ Line 341  class uploadATFfinallyThread(Thread):
          #do first the changed files
          i=0
          for fn in uploadFns:
+             logging.debug("uploadATFfinally uploadFn=%s"%fn)
              i+=1
              founds=ctx2.CDLICatalog.search({'title':fn})
              if len(founds)>0:
                  SESSION['author']=str(username)
                  self.result="<p>Changing : %s"%fn+self.result
+                 logging.debug("uploadatffinallythread changing:%s"%fn+self.result)
                  founds[0].getObject().manage_addCDLIFileObject('',comment,SESSION['author'],file=os.path.join(SESSION['tmpdir'],fn),from_tmp=True)
-             if i==200:
+             if i%200==0:
-                         i=0
                          transaction.get().commit()
-                         logging.info("changing: do commit")
+                 logging.debug("uploadatffinallythread changing: do commit")
          transaction.get().commit()
-         logging.info("changing: last commit")
+         logging.debug("uploadatffinallythread changing: last commit")
          #now add the new files
          newPs=SESSION['newPs']
          if len(newPs)>0:
              tmpDir=SESSION['tmpdir']
-             logging.info("adding start")
+             logging.debug("uploadatffinallythread adding start")
              self.result="<p>Adding files</p>"+self.result
              #TODO: make this configurable, at the moment base folder for the files has to be cdli_main
              ctx2.importFiles(comment=comment,author=str(username) ,folderName=tmpDir, files=newPs,ext=self)
-             logging.info("adding finished")
+             logging.debug("uploadatffinallythread adding finished")
          #unlock locked files?
          if unlock:
-             logging.info("unlocking start")
+             logging.debug("uploadatffinallythread unlocking start")
              self.result="<p>Unlock files</p>"+self.result
              unlockFns=[]
              for x in os.listdir(SESSION['tmpdir']):
                      if not x in SESSION['errors']:
                          unlockFns.append(x)
-             logging.info("unlocking have now what to unlock")
+             logging.debug("unlocking have now what to unlock")
              for fn in unlockFns:
                  #logging.info("will unlock: %s"%fn)
- Line 317  class uploadATFfinallyThread(Thread):
+ Line 384  class uploadATFfinallyThread(Thread):
                  if len(founds)>0:
                      #logging.info("unlock: %s"%founds[0].getObject().getId())
                      SESSION['author']=str(username)
                      founds[0].getObject().lockedBy=""
-             logging.info("unlocking done")
+             logging.debug("uploadatffinallythread unlocking done")
          #if a basketname is given, add files to the basket
          if not (basketname ==''):
-             logging.info("add to basket %s"%basketname)
+             logging.debug("uploadatffinallythread add to basket %s"%basketname)
              self.result="<p>Add to basket</p>"+self.result
              basketId=ctx2.basketContainer.getBasketIdfromName(basketname)
              if not basketId: # create new basket
-                 logging.info("create basket %s"%basketname)
+                 logging.debug("uploadatffinallythread create basket %s"%basketname)
                  self.result="<p>Create a new basket</p>"+self.result
                  ob=ctx2.basketContainer.addBasket(basketname)
                  basketId=ob.getId()
              basket=getattr(ctx2.basketContainer,str(basketId))
              ids=os.listdir(SESSION['tmpdir'])
+             logging.debug("should add:"+repr(ids))
              basket.addObjects(ids,deleteOld=True,username=str(username))
+         logging.debug("uploadatffinallythread uploadfinally done")
          if RESPONSE is not None:
              RESPONSE.redirect(self.aq_parent.absolute_url())
-         logging.info("uploadfinally done")
          return True
  class tmpStore(SimpleItem):
- Line 572  class CDLIBasketContainer(OrderedFolder)
+ Line 640  class CDLIBasketContainer(OrderedFolder)
                              ret+=str(object[0].getData())+"\n"
              elif current=="yes":
                              #search current object
-                             logging.info("crrent: %s"%object[1].getId().split(".")[0])
+                             logging.debug("current: %s"%object[1].getId().split(".")[0])
                              founds=self.CDLICatalog.search({'title':object[1].getId().split(".")[0]})
                              if len(founds)>0:
                                  ret+=str(founds[0].getObject().getLastVersion().getData())+"\n"
- Line 865  class CDLIBasketContainer(OrderedFolder)
+ Line 933  class CDLIBasketContainer(OrderedFolder)
          if not ids:
              ids=self.REQUEST.SESSION['fileIds']
-         if type(ids) is not ListType:
+         if (type(ids) is not ListType) and (not isinstance(ids,Set)):
              ids=[ids]
+         if isinstance(ids,Set):
+             ids=list(ids)
          if (submit.lower()=="store in new basket") or (submit.lower()=="new basket"):
              basketRet=self.addBasket(newBasketName)
              self.setActiveBasket(basketRet.getId())
- Line 881  class CDLIBasketContainer(OrderedFolder)
+ Line 952  class CDLIBasketContainer(OrderedFolder)
          if fromFileList:
-             return self.cdli_main.findObjectsFromList(list=self.REQUEST.SESSION['fileIds'],basketName=basket.title,numberOfObjects=added)
+             return self.cdli_main.findObjectsFromList(list=ids,basketName=basket.title,numberOfObjects=added)
          if RESPONSE:
- Line 912  class CDLIBasket(Folder,CatalogAware):
+ Line 983  class CDLIBasket(Folder,CatalogAware):
      def searchInBasket(self,indexName,searchStr,regExp=False):
          """searchInBasket"""
-         lst=self.searchInLineIndexDocs(indexName,searchStr,uniq=True,regExp=regExp)
+         lst=self.searchInLineIndexDocs(indexName,searchStr,uniq=True,regExp=regExp) #TODO: fix this
          ret={}
          lv=self.getLastVersion()
- Line 960  class CDLIBasket(Folder,CatalogAware):
+ Line 1031  class CDLIBasket(Folder,CatalogAware):
      def isActual(self,obj):
          """teste ob im basket die aktuelle version ist"""
+         try:
+             logging.debug("isActual:"+repr(obj))
          actualNo=obj[1].getLastVersion().getVersionNumber()
          storedNo=obj[0].getVersionNumber()
- Line 974  class CDLIBasket(Folder,CatalogAware):
+ Line 1047  class CDLIBasket(Folder,CatalogAware):
              return True , 0
          else:
              return False, actualNo
+         except:
+             return False, -1
      def history(self):
          """history"""
- Line 1117  class CDLIBasket(Folder,CatalogAware):
+ Line 1192  class CDLIBasket(Folder,CatalogAware):
      def addObjects(self,ids,deleteOld=None,username=None):
          """generate a new version of the basket with objects added"""
+         def swap(x):
+             return (x[1],x[0])
          logging.info("add to basket (%s)"%(self.getId()))
          lastVersion=self.getLastVersion()
- Line 1128  class CDLIBasket(Folder,CatalogAware):
+ Line 1207  class CDLIBasket(Folder,CatalogAware):
          if deleteOld:
              oldContent=[]
-         newContent=[]
          added=0
-         for id in ids:
+ #        for id in ids:
-             try:
+ #            logging.debug("adding:"+id)
-                 founds=self.CDLICatalog.search({'title':id})
+ #            try:
-             except:
+ #                founds=self.CDLICatalog.search({'title':id})
-                 founds=[]
+ #            except:
+ #                founds=[]
+ #
+ #            for found in founds:
+ #                if found.getObject() not in oldContent:
+ #                    #TODO: was passiert wenn, man eine Object dazufügt, das schon da ist aber eine neuere version
+ #                    newContent.append((found.getObject().getLastVersion(),found.getObject()))
+ #                    added+=1
+         hash = md5.new(repr(makelist(ids))).hexdigest() # erzeuge hash als identification
+         #logging.debug("JJJJJJJ:"+repr(self.makelist(ids)))
+         logging.debug("JJJJJJJ:"+repr(hash))
+         if hasattr(self.cdliRoot,'v_tmpStore') and self.cdliRoot.v_tmpStore.has_key(hash):
+             logging.debug("from store!")
+             newContent=Set(map(swap,self.cdliRoot.v_tmpStore[hash]))
-             for found in founds:
+         else:
-                 if found.getObject() not in oldContent:
+             logging.debug("not from store!")
-                     #TODO: was passiert wenn, man eine Object dazufügt, das schon da ist aber eine neuere version
+             newContent=Set([(self.getFileObjectLastVersion(x),self.getFileObject(x)) for x in ids])
-                     newContent.append((found.getObject().getLastVersion(),found.getObject()))
-                     added+=1
-         content=oldContent+newContent
+         content=Set(oldContent).union(newContent)
+         added = len(content)-len(oldContent)
          if not username:
              user=self.getActualUserName()
          else:
              user = username
-         ob=manage_addCDLIBasketVersion(self,user,comment="",basketContent=content)
+         #logging.debug("content:"+repr(list(content)))
+         ob=manage_addCDLIBasketVersion(self,user,comment="",basketContent=list(content))
          logging.info("add to basket (%s) done"%(self.getId()))
          return added
- Line 1285  class CDLIBasketVersion(Implicit,Persist
+ Line 1379  class CDLIBasketVersion(Implicit,Persist
      def downloadObjectsAsOneFileFinally(self,lock=None,procedure=None,REQUEST=None,current="no"):
          """print do the download"""
+         logging.debug("HIHHHH")
          ret=""
          lockedObjects={}
- Line 1332  class CDLIBasketVersion(Implicit,Persist
+ Line 1426  class CDLIBasketVersion(Implicit,Persist
          for object in self.content.getContent():
+                 logging.error("ret:"+repr(object[0]))
+                 logging.error("    -"+repr(procedure))
+                 logging.error("    -"+repr(object[1].lockedBy))
                  if (procedure=="downloadAll") or (object[1].lockedBy=='') or (object[1].lockedBy==self.REQUEST['AUTHENTICATED_USER']):
+                     logging.error("ret1")
                      if current=="no": #version as they are in the basket
+                         logging.error("ret2")
                          ret+=str(object[0].getData())+"\n"
                      elif current=="yes":
+                         logging.error("ret3")
                          #search current object
                          founds=self.CDLICatalog.search({'title':object[1].getId().split(".")[0]})
                          if len(founds)>0:
- Line 1344  class CDLIBasketVersion(Implicit,Persist
+ Line 1444  class CDLIBasketVersion(Implicit,Persist
                  if lock and object[1].lockedBy=='':
                      object[1].lockedBy=self.REQUEST['AUTHENTICATED_USER']
+         if (not isinstance(self.aq_parent,CDLIBasket)):
+             basket_name=self.aq_parent.aq_parent.title+"_V"+self.getId()
+         else:
          basket_name=self.aq_parent.title+"_V"+self.getId()
          #write basketname to header of atf file
          ret="#basket: %s\n"%basket_name+ret
- Line 1450  class CDLIFileObject(CatalogAware,extVer
+ Line 1556  class CDLIFileObject(CatalogAware,extVer
      security=ClassSecurityInfo()
+     security.declareProtected('manage','index_html')
-     security.declarePublic('makeThisVersionCurrent')
+     security.declarePublic('view')
+     view = PageTemplateFile('zpt/viewCDLIFile.zpt', globals())
+     security.declarePublic('editATF')
+     editATF = PageTemplateFile('zpt/editATFFile.zpt', globals())
-     security.declareProtected('manage','index_html')
      def PrincipiaSearchSource(self):
             """Return cataloguable key for ourselves."""
             return str(self)
      def makeThisVersionCurrent_html(self):
-         """form for making this version current"""
+         """form for mthis version current"""
          pt=PageTemplateFile(os.path.join(package_home(globals()),'zpt','makeThisVersionCurrent.zpt')).__of__(self)
          return pt()
+     security.declarePublic('makeThisVersionCurrent')
      def makeThisVersionCurrent(self,comment,author,RESPONSE=None):
          """copy this version to current"""
          parent=self.aq_parent
+         parent.manage_addVersionedFileObject(id=None,vC=comment,author=author,file=self.getData(),RESPONSE=RESPONSE)
+         #newversion=parent.manage_addCDLIFileObject('',comment,author)
+         #newversion.manage_upload(self.getData())
+         #if RESPONSE is not None:
-         newversion=parent.manage_addCDLIFileObject('',comment,author)
+         #    RESPONSE.redirect(self.aq_parent.absolute_url()+'/history')
-         newversion.manage_upload(self.getData())
-         if RESPONSE is not None:
-             RESPONSE.redirect(self.aq_parent.absolute_url()+'/history')
          return True
-     security.declarePublic('view')
      def getFormattedData(self):
          """fromat text"""
          data=self.getData()
  #        return re.sub("\s\#lem"," #lem",data) #remove return vor #lem
          return re.sub("#lem","       #lem",data) #remove return vor #lem
-     def view(self):
-         """view file"""
-         pt=PageTemplateFile(os.path.join(package_home(globals()),'zpt','viewCDLIFile.zpt')).__of__(self)
-         return pt()
      security.declarePublic('getPNumber')
      def getPNumber(self):
- Line 1518  class CDLIFileObject(CatalogAware,extVer
+ Line 1622  class CDLIFileObject(CatalogAware,extVer
          except:
              return "ERROR"
  manage_addCDLIFileObjectForm=DTMLFile('dtml/fileAdd', globals(),Kind='CDLIFileObject',kind='CDLIFileObject', version='1')
- def manage_addCDLIFileObject(self,id,vC='',author='', file='',title='',precondition='', content_type='',
+ def manage_addCDLIFileObject(self,id,vC='',author='', file='',title='',versionNumber=0,
+                              precondition='', content_type='',
                               from_tmp=False,REQUEST=None):
      """Add a new File object.
      Creates a new File object 'id' with the contents of 'file'"""
      id=str(id)
- Line 1536  def manage_addCDLIFileObject(self,id,vC=
+ Line 1641  def manage_addCDLIFileObject(self,id,vC=
      self=self.this()
      # First, we create the file without data:
-     self._setObject(id, CDLIFileObject(id,title,'',content_type, precondition))
+     self._setObject(id, CDLIFileObject(id,title,versionNumber=versionNumber,versionComment=vC,time=time.localtime(),author=author))
-     self._getOb(id).versionComment=str(vC)
+     fob = self._getOb(id)
-     self._getOb(id).time=time.localtime()
-     setattr(self._getOb(id),'author',author)
      # Now we "upload" the data.  By doing this in two steps, we
      # can use a database trick to make the upload more efficient.
      if file and not from_tmp:
-         self._getOb(id).manage_upload(file)
+         fob.manage_upload(file)
      elif file and from_tmp:
-         self._getOb(id).manage_upload_from_tmp(file)
+         fob.manage_file_upload(file) # manage_upload_from_tmp doesn't exist in ExtFile2
+     #    fob.manage_upload_from_tmp(file) # manage_upload_from_tmp doesn't exist in ExtFile2
      if content_type:
-         self._getOb(id).content_type=content_type
+         fob.content_type=content_type
+     #logging.debug("manage_add: lastversion=%s"%self.getData())
+     logging.debug("reindex1: %s in %s"%(repr(self),repr(self.default_catalog)))
      self.reindex_object()
-     self._getOb(id).reindex_object()
+     #logging.debug("manage_add: fob_data=%s"%fob.getData())
+     logging.debug("reindex2: %s in %s"%(repr(fob), repr(fob.default_catalog)))
+     fob.index_object()
+     self.CDLIRoot.updateOrAddToFileBTree(ob)
      if REQUEST is not None:
          REQUEST['RESPONSE'].redirect(self.absolute_url()+'/manage_main')
  class CDLIFile(extVersionedFile,CatalogAware):
      """CDLI file"""
      security=ClassSecurityInfo()
      meta_type="CDLI file"
+     content_meta_type = ["CDLI File Object"]
      default_catalog='CDLICatalog'
      security.declareProtected('manage','index_html')
-     #security.declarePublic('history')
      def getLastVersionData(self):
          """get last version data"""
-         return self.getLastVersion().getData()
+         return self.getData()
      def getLastVersionFormattedData(self):
          """get last version data"""
-         return self.getLastVersion().getFormattedData()
+         return self.getContentObject().getFormattedData()
-     #security.declarePublic('history')
+     def getTextId(self):
+         """returns P-number of text"""
+         # assuming that its the beginning of the title
+         return self.title[:7]
+     #security.declarePublic('history')
      def history(self):
          """history"""
- Line 1622  class CDLIFile(extVersionedFile,CatalogA
+ Line 1736  class CDLIFile(extVersionedFile,CatalogA
          #return [x.getObject() for x in context.CDLIBasketCatalog.search({'getFileNamesInLastVersion':self.getId()})]
+     def _newContentObject(self, id, title='', versionNumber=0, versionComment=None, time=None, author=None):
+         """factory for content objects. to be overridden in derived classes."""
+         logging.debug("_newContentObject(CDLI)")
+         return CDLIFileObject(id,title,versionNumber=versionNumber,versionComment=versionComment,time=time,author=author)
      def addCDLIFileObjectForm(self):
          """add a new version"""
- Line 1647  class CDLIFile(extVersionedFile,CatalogA
+ Line 1767  class CDLIFile(extVersionedFile,CatalogA
          except:
              pass
+         ob = self.addContentObject(id, vC, author, file, title, changeName=changeName, newName=newName, from_tmp=from_tmp,
+                                    precondition=precondition, content_type=content_type)
-         if changeName=="yes":
-             filename=file.filename
-             self.title=filename[max(filename.rfind('/'),
-                         filename.rfind('\\'),
-                         filename.rfind(':'),
-                         )+1:]
-         if not newName=='':
-             self.title=newName[0:]
-         positionVersionNum=getattr(self,'positionVersionNum','front')
-         if positionVersionNum=='front':
-             id="V%i"%self.getVersion()+"_"+self.title
-         else:
-             tmp=os.path.splitext(self.title)
-             if len(tmp)>1:
-                 id=tmp[0]+"_V%i"%self.getVersion()+tmp[1]
-             else:
-                 id=tmp[0]+"_V%i"%self.getVersion()
-         manage_addCDLIFileObject(self,id,vC,author,file,id,precondition, content_type,from_tmp=from_tmp)
-         #objs=self.ZopeFind(self,obj_ids=[id])[0][1].setVersionNumber(int(self.getVersion()))
-         objs=getattr(self,id).setVersionNumber(int(self.getVersion()))
          try:
            #FIXME: wozu ist das gut?
            self.REQUEST.SESSION['objID_parent']=self.getId()
          except:
            pass
-         if RESPONSE:
+         #self.cdliRoot.updateOrAddToFileBTree(self)# now update the object in the cache
-             obj=self.ZopeFind(self,obj_ids=[id])[0][1]
+         if RESPONSE:
-             if obj.getSize()==0:
+             if ob.getSize()==0:
-                 self.REQUEST.SESSION['objID']=obj.getId()
+                 self.REQUEST.SESSION['objID']=ob.getId()
                  pt=PageTemplateFile(os.path.join(package_home(globals()),'zpt','errorUploadFile')).__of__(self)
                  return pt()
              else:
                  if come_from and (come_from!=""):
                                          RESPONSE.redirect(come_from+"?change="+self.getId())
                  else:
                      RESPONSE.redirect(self.REQUEST['URL2']+'?uploaded=%s'%self.title)
          else:
-             return self.ZopeFind(self,obj_ids=[id])[0][1]
+             return ob
  def manage_addCDLIFileForm(self):
- Line 1713  def manage_addCDLIFile(self,id,title,loc
+ Line 1805  def manage_addCDLIFile(self,id,title,loc
      tryToggle=True
      tryCount=0
      self._setObject(id,newObj)
      getattr(self,id).reindex_object()
      if RESPONSE is not None:
          RESPONSE.redirect('manage_main')
  def checkUTF8(data):
      """check utf 8"""
      try:
- Line 1751  def splitatf(fh,dir=None,ext=None):
+ Line 1842  def splitatf(fh,dir=None,ext=None):
      nf=None
      i=0
+     #ROC: why split \n first and then \r???
      if (type(fh) is StringType) or (type(fh) is UnicodeType):
          iter=fh.split("\n")
      else:
- Line 1804  class CDLIFileFolder(extVersionedFileFol
+ Line 1896  class CDLIFileFolder(extVersionedFileFol
      security=ClassSecurityInfo()
      meta_type="CDLI Folder"
-     filesMetaType=['CDLI file']
+     file_meta_type=['CDLI file']
-     folderMetaType=['CDLI Folder']
+     folder_meta_type=['CDLI Folder']
-     default_catalog='CDLICatalog'
-     defaultFileCatalog=default_catalog #wenn dieses definiert ist, wird beim hinzufügen einer neuen version eines files dieser catalog neuiniziert
+     file_catalog='CDLICatalog'
      #downloadCounter=0 # counts how many download for all files currently run, be mehr als 5 wird verweigert.
      tmpStore2={}
+     def _newVersionedFile(self, id, title='', lockedBy=None, author=None):
+         """factory for versioned files. to be overridden in derived classes."""
+         logging.debug("_newVersionedFile(CDLI)")
+         return CDLIFile(id, title, lockedBy=lockedBy, author=author)
      def setTemp(self,name,value):
          """set tmp"""
          setattr(self,name,value)
+     deleteFileForm = PageTemplateFile("zpt/doDeleteFile", globals())
-     def delete(self,ids):
+     def delete(self,ids,REQUEST=None):
-         """delete this file, i.e. move into a trash folder"""
+         """delete these files"""
+         if type(ids) is not ListType:
+             ids=[ids]
-         found=self.ZopeFind(self,obj_ids=['.trash'])
+         self.manage_delObjects(ids)
-         if len(found)<1:
+         if REQUEST is not None:
-             manage_addCDLIFileFolder(self, '.trash',title="Trash")
+             return self.index_html()
-             trash=self._getOb('.trash')
-         else:
-             trash=found[0][1]
-         if type(ids) is not ListType:
-             ids=[ids]
-         cut=self.manage_cutObjects(ids)
-         trash.manage_pasteObjects(cut)
      def getVersionNumbersFromIds(self,ids):
          """get the numbers of the current versions of documents described by their ids"""
- Line 1841  class CDLIFileFolder(extVersionedFileFol
+ Line 1936  class CDLIFileFolder(extVersionedFileFol
          founds=self.CDLICatalog.search({'title':searchStr})
          for found in founds:
-             lastVersion=found.getObject().getLastVersion()
+             lastVersion=found.getObject().getContentObject()
              ret.append((found.getId,lastVersion))
          return ret
      def getFile(self,fn):
          """get the content of the file fn"""
-         founds=self.CDLICatalog.search({'title':fn})
+         logging.debug("getFile: %s"%repr(fn))
-         if not founds:
+         if not self.hasObject(fn):
+             # search deeper
+             founds=getattr(self, self.file_catalog).search({'textid':fn})
+             if founds:
+                 obj=founds[0].getObject().getContentObject()
+             else:
              return ""
          else:
-             obj=founds[0].getObject().getLastVersion()
+             obj = self[fn].getContentObject()
              return obj.getData()[0:]
      def checkCatalog(self,fn):
          """check if fn is in the catalog"""
          #TODO add checkCatalog
      def findObjectsFromListWithVersion(self,list,author=None):
          """find objects from a list with versions
          @param list: list of tuples  (cdliFile,version)
          """
          #self.REQUEST.SESSION['fileIds']=list#store fieldIds in session for further usage
          #self.REQUEST.SESSION['searchList']=self.REQUEST.SESSION['fileIds']
          pt=getattr(self,'filelistVersioned.html')
          return pt(search=list,author=author)
- Line 1885  class CDLIFileFolder(extVersionedFileFol
+ Line 1981  class CDLIFileFolder(extVersionedFileFol
          return ret
-     def findObjectsFromList(self,enterList=None,display=False,start=None,upload=None,list=None,basketName=None,numberOfObjects=None,RESPONSE=None):
+     def expandFile(self,fileId,fileTree):
+         """wildcard in fileID suche alle Treffer"""
+         founds=self.CDLICatalog({'title':fileId})
+         for found in founds:
+             fileTree.add(found.getId)
+             logging.debug("ADDD:"+found.getId)
+     def findObjectsFromList(self,enterList=None,display=False,start=None,upload=None,list=None,basketName=None,numberOfObjects=None,RESPONSE=None,REQUEST=None,returnHash=False,hash=None):
          """findObjectsFromList (, TAB oder LINE separated)"""
+         logging.debug("start: findObjectsFromList")
+         #logging.debug("start: findObjectsFromList"+repr(list))
          if upload: # list from file upload
              txt=upload.read()
- Line 1919  class CDLIFileFolder(extVersionedFileFol
+ Line 2025  class CDLIFileFolder(extVersionedFileFol
              pt=getattr(self,'filelist.html')
              return pt(basketName=basketName,numberOfObjects=numberOfObjects)
+         if hash is not None and hasattr(self.cdliRoot,'v_tmpStore') and self.cdliRoot.v_tmpStore.has_key(hash):
+                logging.debug("asking for storage2")
+                result =self.cdliRoot.v_tmpStore[hash]
+                if result:
+                    logging.debug("give result from storage2")
+                    return hash,self.cdliRoot.v_tmpStore[hash]
          if list is not None: # got already a list
+             logging.debug(" ----List version")
              ret=[]
+             fileTree=Set()
              for fileId in list:
-                 if fileId.find("*"): #check for wildcards
-                         fileId=fileId
+                 if fileId.find("*")>-1: #check for wildcards
+                         self.expandFile(fileId,fileTree)
                  elif len(fileId.split("."))==1:
                          fileId=fileId+".atf"
+                         fileTree.add(fileId)
+                 #logging.debug("   -----:"+fileId)
+                 #ret+=self.CDLICatalog({'title':fileId})
+                 #x =self.getFileObject(fileId)
+                 #if x is not None:
+                 #    ret.append(x)
+             ids = fileTree & self.v_file_ids
+             #self.REQUEST.SESSION['fileIds']=ids#store fieldIds in session for further usage
+             l=makelist(fileTree)[0:]
+             logging.debug("l-list:"+repr(l))
+             self.REQUEST.SESSION['fileIds']=l#store fieldIds in session for further usage
+             self.REQUEST.SESSION['searchList']=l
+             #self.REQUEST.SESSION['searchList']=['P000001.atf']
+             hash = md5.new(repr(makelist(fileTree))).hexdigest() # erzeuge hash als identification
+             self.REQUEST.SESSION['hash']=hash
+             #TODO: do I need garbage collection for v_tmpStore ?
+             #logging.debug("Hash:"+repr(hash))
+ #
+ #            if hasattr(self.cdliRoot,'v_tmpStore') and self.cdliRoot.v_tmpStore.has_key(hash):
+ #               logging.debug("asking for storage")
+ #               res=self.cdliRoot.v_tmpStore[hash]
+ #               if res:
+ #                   if returnHash == True:
+ #                       return hash,res
+ #                   return res
-                 ret+=self.CDLICatalog({'title':fileId})
              #TODO: get rid of one of these..
-             ids=[x.getObject().getId() for x in ret]
+             #ids=[x.getObject().getId() for x in ret]
-             self.REQUEST.SESSION['fileIds']=ids#store fieldIds in session for further usage
+             ret=[(self.getFileObject(x),self.getFileObjectLastVersion(x)) for x in ids]
-             self.REQUEST.SESSION['searchList']=self.REQUEST.SESSION['fileIds']
+             #self.REQUEST.SESSION['fileIds']=ids#store fieldIds in session for further usage
+             #self.REQUEST.SESSION['searchList']=self.REQUEST.SESSION['fileIds']
              if display:
                  pt=getattr(self,'filelist.html')
                  return pt(search=ids)
              else:
+                 #self.REQUEST.SESSION['hash'] = ret # store in session
+                 if not hasattr(self,'v_tmpStore'):
+                     self.cdliRoot.v_tmpStore={}
+                 #logging.debug("HHHHHHNEU:"+repr(self.makelist(ids)))
+                 #logging.debug("HHHHHHNEU:"+repr(hash))
+                 self.cdliRoot.v_tmpStore[hash] = ret # store in session
+                 if returnHash == True:
+                     return hash,ret
                  return ret
- Line 1945  class CDLIFileFolder(extVersionedFileFol
+ Line 2105  class CDLIFileFolder(extVersionedFileFol
          if start:
              RESPONSE.redirect("filelist.html?start:int="+str(start))
      security.declareProtected('Manage','createAllFilesAsSingleFile')
      def createAllFilesAsSingleFile(self,RESPONSE=None):
          """download all files"""
- Line 1953  class CDLIFileFolder(extVersionedFileFol
+ Line 2112  class CDLIFileFolder(extVersionedFileFol
          def sortF(x,y):
              return cmp(x[0],y[0])
-         catalog=getattr(self,self.default_catalog)
+         catalog=getattr(self,self.file_catalog)
          #tf,tfilename=mkstemp()
          if not hasattr(self.temp_folder,'downloadCounter'):
              self.temp_folder.downloadCounter=0
- Line 1980  class CDLIFileFolder(extVersionedFileFol
+ Line 2139  class CDLIFileFolder(extVersionedFileFol
                  #os.write(tf,obj.getLastVersion().data)
                  if RESPONSE:
-                     RESPONSE.write(obj.getLastVersion().getData()[0:])
+                     RESPONSE.write(obj.getData()[0:])
                      RESPONSE.write("\n")
                  self.temp_folder.downloadCounter-=1
                  self._p_changed=1
- Line 2000  class CDLIFileFolder(extVersionedFileFol
+ Line 2159  class CDLIFileFolder(extVersionedFileFol
      def hasParent(self):
          """returns true falls subfolder"""
-         if self.aq_parent.meta_type in self.folderMetaType:
+         if self.aq_parent.meta_type in self.folder_meta_type:
              return True
          else:
              return False
- Line 2008  class CDLIFileFolder(extVersionedFileFol
+ Line 2167  class CDLIFileFolder(extVersionedFileFol
      def getFolders(self):
          """get all subfolders"""
          ret=[]
-         folders=self.ZopeFind(self,obj_metatypes=self.folderMetaType)
+         folders=self.ZopeFind(self,obj_metatypes=self.folder_meta_type)
          for folder in folders:
              ret.append((folder[1],
-                         len(self.ZopeFind(folder[1],obj_metatypes=self.folderMetaType)),
+                         len(self.ZopeFind(folder[1],obj_metatypes=self.folder_meta_type)),
-                         len(self.ZopeFind(folder[1],obj_metatypes=self.filesMetaType))
+                         len(self.ZopeFind(folder[1],obj_metatypes=self.file_meta_type))
                          ))
          return ret
- Line 2066  class CDLIRoot(Folder):
+ Line 2225  class CDLIRoot(Folder):
      meta_type="CDLIRoot"
      downloadCounterBaskets=0# counts the current basket downloads if counter > 10 no downloads are possible
-     def deleteFiles(self,ids):
+     file_catalog = 'CDLICatalog'
-         """delete files (resp. move into .trash folder)"""
-         # find or generete trash folder
-         found=self.ZopeFind(self,obj_ids=['.trash'])
-         if len(found)<1:
-             manage_addCDLIFileFolder(self, '.trash',title="Trash")
-             trash=self._getOb('.trash')
-         else:
-             logging.info(found)
-             trash=found[0][1]
-         for id in ids:
-             founds=self.CDLICatalog.search({'title':id.split(".")[0]})
-             if founds:
-                 logging.info(founds)
-                 folder=founds[0].getObject().aq_parent #get the parent folder of the object
-                 logging.info(folder)
-                 cut=folder.manage_cutObjects([founds[0].getId]) #cut it out
-                 trash.manage_pasteObjects(cut)  #paste it in the trash
-     def findWordRegExp(self,indexName,searchTerm):
+     # word splitter for search
-         """find all words in index which match regexp in SearchTerm
+     splitter = {'words':cdliSplitter.wordSplitter(),
-         @param indexName: name of the index to be searched in
+                 'graphemes':cdliSplitter.graphemeSplitter()}
-         @param searchTerm: word to be searched"""
-         ret=[]
+     def viewATF(self,id,RESPONSE):
-         for x in self.lineIndexes[indexName].iterkeys():
+         """view an Object"""
-             if re.match(searchTerm,x):
+         ob = self.CDLICatalog({'title':id})
-                 ret.append(x)
+         logging.debug(ob[0].getObject().getLastVersion().absolute_url()+"/view")
-         return ret
+         if len(ob)>0:
+             RESPONSE.redirect(ob[0].getObject().getLastVersion().absolute_url()+"/view")
-     def searchRegExpInLineIndexDocs(self,indexName,searchTerm):
+         return "not found"
-         """search in inLineIndex with regexp
-         @param indexName: name of the index to be searched in
+     def history(self,id,RESPONSE):
-         @param searchTerm: term to be searched
+         """view an Object"""
-         """
+         ob = self.CDLICatalog({'title':id})
-         if not searchTerm:
+         if len(ob)>0:
-             return []
+             RESPONSE.redirect(ob[0].absolute_url+"/history")
-         ret=[]
+         return "not found"
-         words=self.findWordRegExp(indexName,searchTerm) # suche nach allen Treffern
-         logging.info("wd:%s"%words)
-         for word in words:
+     def downloadLocked(self,id,RESPONSE):
+         """view an Object"""
-             ret+=self.searchInLineIndexDocs(indexName,word)
+         ob = self.CDLICatalog({'title':id})
+         if len(ob)>0:
+             RESPONSE.redirect(ob[0].absolute_url+"/downloadLocked")
-         x= unique(ret)
+         return "not found"
-     logging.info("words_done")
+     def download(self,id,RESPONSE):
+         """view an Object"""
+         ob = self.CDLICatalog({'title':id})
+         if len(ob)>0:
+             RESPONSE.redirect(ob[0].getLastVersion().absolute_url())
+         return "not found"
+     def addCDLIFileObjectForm(self,id,RESPONSE):
+         """view an Object"""
+         ob = self.CDLICatalog({'title':id})
+         if len(ob)>0:
+             RESPONSE.redirect(ob[0].absolute_url+"/addCDLIFileObjectForm")
+         return "not found"
+     def addVersionedFileObjectForm(self,id,RESPONSE):
+         """view an Object"""
+         ob = self.CDLICatalog({'title':id})
+         if len(ob)>0:
+             RESPONSE.redirect(ob[0].absolute_url+"/addVersionedFileObjectForm")
+         return "not found"
+     def unlock(self,id,RESPONSE):
+         """view an Object"""
+         ob = self.CDLICatalog({'title':id})
+         if len(ob)>0:
+             RESPONSE.redirect(ob[0].absolute_url+"/unlock")
+         return "not found"
+     def getFileObject(self,fileId):
+         """get the file object stored under fileId in self.v_files
+         @param fileId: key to look up in self.v_files
+         @return: the stored object, or None if there is no entry for fileId
+         """
+         # NOTE(review): v_files is only created in generateFileBTree - presumably that has to run first; verify
+         x=self.v_files.get(fileId)
+         #logging.debug(x)
          return x
-     def showInLineIndex(self):
+     def getFileObjectLastVersion(self,fileId):
-         """get the index for debug purposes"""
+         """get an object"""
-         print "show"
+         x=self.v_files_lastVersion.get(fileId)
-         for key in self.lineIndexes.keys():
+         #logging.debug(x)
-             logging.info("index:%s"%key)
+         return x
-             for x in self.lineIndexes[key].iterkeys():
-                 logging.info("word:%s"%repr(x))
-                 #for y in self.lineIndex[x].iterkeys():
-                 #    print "doc",repr(y),repr(self.lineIndex[x][y])
-         return self.lineIndexes
-     def searchInLineIndexDocs(self,indexName,word,uniq=True,regExp=False):
-         """search occurences in an index
-         @param indexName: name of the index to be searched in
-         @param word: word to be searched
-         @param unique: (optional) unify the list of results
-         @param regExp: (optional) use regular expressions
-         """
-         if regExp:
-             return self.searchRegExpInLineIndexDocs(indexName,word)
-         try:
-                 lst=list(self.lineIndexes[indexName].get(word).keys())
-         except:
-             logging.error("error: searchInLineIndexDocs (%s %s)"%(sys.exc_info()[0:2]))
-             lst=[]
-         if uniq:
-             return unique(lst)
-         else:
-             return lst
-     def getLinesFromIndex(self,indexName,word,doc,regExp=False):
-         """return all lines from a document where word is found
-         @param indexName: Name of the index
-         @param word: word to be searched
-         @param doc: name of the document (usuallay the p-number)
-         @param regExp: (optional) use regExp
-         """
-         if not regExp:
-             return self.lineIndexes[indexName].get(word)[doc]
-         else: # wenn regexp, suche welches word
-             for w in self.findWordRegExp(indexName,word):
-                 if self.lineIndexes[indexName].get(w): # ein word in im dex gefunden
-                     try:
-                         dc=self.lineIndex[indexName].get(word)[doc]
-                         return dc # und ein document dann gib es zurueck
-                     except:
-                          pass #andernfalls weiter
-     def cleanInLineIndex(self,indexName):
-         """empty an InlineIndex
-         @param indexName: name of the index
-         """
-         for x in list(self.lineIndexes[indexName].keys()):
-             del(self.lineIndexes[indexName][x])
-         print [x for x in self.lineIndexes[indexName].keys()]
-         return "ok"
-     def storeInLineIndex(self,indexName,key,value):
+     def showFileIds(self):
-         """store in index, key is normally a word or grapheme
+         """showIds"""
-         and value is a tuple (documentname, line) where the word can be found
+         return self.v_file_ids
-         @param indexName: name of the index
-         @param key: key in index
+     def generateFileBTree(self):
-         @param value: value in index, value is a tuple (document name, line)
+         """erzeuge einen Btree aus allen Files"""
-         """
+         self.v_files = OOBTree()
-         logging.error("indexing: %s %s"%(indexName,key))
+         self.v_files_lastVersion = OOBTree()
-         if (not hasattr(self,'lineIndexes')):
+         self.v_file_ids = Set()
+         for x in self.CDLICatalog.searchResults():
+             self.v_files.update({x.getId:x.getObject()})
+             self.v_files_lastVersion.update({x.getId:x.getObject().getLastVersion()})
+             self.v_file_ids.add(x.getId)
+             logging.debug("add:"+x.getId+"XXX"+repr(x.getObject()))
-             self.lineIndexes={}
+         return True
-         if self.lineIndexes.get(indexName,None) is None:
-             #index exisitiert noch nicht dann anlegen
-             self.lineIndexes[indexName]=OOBTree()
+     def updateOrAddToFileBTree(self,obj):
-         lis=self.lineIndexes
+         """update a BTree"""
-         li=lis[indexName]
+         self.v_files.update({obj.getId():obj})
+         self.v_files_lastVersion.update({obj.getId():obj.getLastVersion()})
+         self.v_file_ids.add(obj.getId())
+         logging.debug("update:"+obj.getId()+"XXX"+repr(obj))
+     def deleteFromBTree(self,objId):
+         """remove the entries for objId from v_files, v_files_lastVersion and v_file_ids
+         @param objId: key of the entry to be removed
+         """
+         # NOTE(review): pop/remove are called without a default, so an unknown objId
+         # presumably raises KeyError - confirm that callers only pass known ids
+         self.v_files.pop(objId)
+         self.v_files_lastVersion.pop(objId)
+         self.v_file_ids.remove(objId)
-         if li.has_key(key):
- #            if li[key].has_key(value[0]) and (not (value[1] in li[key][value[0]])):
-             if li[key].has_key(value[0]):
-                 tmp=li[key][value[0]]
-                 tmp.append(value[1]) # add it if now in the array
-                 li[key][value[0]]=tmp[0:]
-             else:
-                 li[key][value[0]]=[value[1]] # new array for lines
-         else:
+     def deleteFiles(self,ids):
+         """delete files
+         @param ids: list of file ids; only the part before the first "." is used for the catalog lookup
+         """
+         for id in ids:
+             # ids without a hit in the catalog are skipped silently
+             founds=self.CDLICatalog.search({'title':id.split(".")[0]})
+             if founds:
+                 logging.debug("deleting %s"%founds)
+                 folder=founds[0].getObject().aq_parent #get the parent folder of the object
+                 logging.debug("deleting from %s"%folder)
+                 cut=folder.delete([founds[0].getId]) #delete the first hit from its folder (the result in cut is not used)
-             li[key]=OOBTree()# new btree for lines
-             li[key][value[0]]=[value[1]]
-         self.lineIndexes=lis
+     def searchText(self, query, index='graphemes'):
+         """searches query in the fulltext index and returns a list of file ids/P-numbers
+         @param query: query string handed to the index
+         @param index: (optional) name of the catalog index to be searched in
+         @return: list with the first 7 characters of the id of every hit
+         """
+         # see also: http://www.plope.com/Books/2_7Edition/SearchingZCatalog.stx#2-13
+         logging.debug("searchtext for '%s' in index %s"%(query,index))
+         #import Products.ZCTextIndex.QueryParser
+         #qp = QueryParser.QueryParser()
+         #logging.debug()
+         idxQuery = {index:{'query':query}}
+         # the catalog is looked up by the name stored in self.file_catalog
+         idx = getattr(self, self.file_catalog)
+         # do search
+         resultset = idx.search(query_request=idxQuery,sort_index='textid')
+         # put only the P-Number in the result
+         results = [res.getId[:7] for res in resultset]
+         logging.debug("searchtext: found %d texts"%len(results))
+         return results
+     def getFile(self, pnum):
+         """get the translit file with the given pnum"""
+         f = getattr(self, self.file_catalog).search({'textid':pnum})
+         if not f:
+             return ""
-         transaction.get().commit()
+         return f[0].getObject().getData()
      def showFile(self,fileId,wholePage=False):
          """show a file
          @param fileId: P-Number of the document to be displayed
          """
-         f=self.CDLICatalog({'title':fileId})
+         f=getattr(self, self.file_catalog).search({'textid':fileId})
          if not f:
              return ""
          if wholePage:
-             logging.info("whole")
+             logging.debug("show whole page")
-             return f[0].getObject().getLastVersion().view()
+             return f[0].getObject().getContentObject().view()
          else:
              return f[0].getObject().getLastVersionFormattedData()
-     def showWordInFile(self,fileId,word,lineList=None,regExp=True,indexName=""):
+     def showWordInFile(self,fileId,word,indexName='graphemes',regExp=False,):
          """get lines with word  fromFileId"""
+         logging.debug("showwordinfile word='%s' index=%s file=%s"%(word,indexName,fileId))
-         file=self.showFile(fileId)
+         file = formatAtfFullLineNum(self.getFile(fileId))
-     logging.info("regEXP %s"%regExp)
          ret=[]
-         if regExp: # wenn regexp dann generiere alle worte aus der list die der regexp entsprechen
-             wordlist=self.findWordRegExp(indexName,word)
-         else:
-             wordlist=[word]
-         for line in file.split("\n"):
+         # add whitespace before and whitespace and line-end to splitter bounds expressions
-             found=False
+         bounds = self.splitter[indexName].bounds
-             for word in wordlist:
+         splitexp = "(%s|\s)(%%s)(%s|\s|\Z)"%(bounds,bounds)
-         try: # just a hack because of possible unicode errors in line
+         # clean word expression
-                  if line.find(word)>-1:
+         # TODO: this should use QueryParser itself
-                         if lineList: #liste of moeglichen Zeilennummern
+         # take out double quotes
-                                 num=line.split(".")[0] #Zeilenummer ist alles vor dem . in der Zeile
+         word = word.replace('"','')
+         # take out ignorable signs
+         ignorable = self.splitter[indexName].ignorex
+         word = ignorable.sub('', word)
+         # compile into regexp objects and escape parens
+         wordlist = [re.compile(splitexp%re.escape(w)) for w in word.split(' ')]
-                                 if num in lineList:
+         for line in file.splitlines():
+             for word in wordlist:
-                                         ret.append(line)
+                 #logging.debug("showwordinfile: searching for %s in %s"%(word.pattern,ignoreable.sub('',line)))
-                         else: # nimm alles ohne line check
+                 if word.search(ignorable.sub('',line)):
+                     line = formatAtfLineHtml(line)
                                  ret.append(line)
+                     break
-                         break;
-         except:
-             pass
          return ret
-     def tagWordInFile(self,fileId,word,lineList=None,regExp=True,indexName=""):
-         """get lines with word  fromFileId"""
-         file=self.showFile(fileId)
+     def showWordInFiles(self,fileIds,word,indexName='graphemes',regExp=False):
-         tagStr=u'<span class="found">%s</span>'
+         """
+         get lines with word from all ids in list FileIds.
+         returns dict with id:lines pairs.
+         """
+         logging.debug("showwordinfiles word='%s' index=%s file=%s"%(word,indexName,fileIds))
+         return dict([(id,self.showWordInFile(id, word, indexName, regExp)) for id in fileIds])
+     def tagWordInFile(self,fileId,word,indexName='graphemes',regExp=False):
+         """get text with word highlighted from FileId"""
+         logging.debug("tagwordinfile word='%s' index=%s file=%s"%(word,indexName,fileId))
+         file=self.getFile(fileId)
+         tagStart=u'<span class="found">'
+         tagEnd=u'</span>'
+         tagStr=tagStart + u'%%s' + tagEnd
          ret=[]
-         if regExp: # wenn regexp dann generiere alle worte aus der list die der regexp entsprechen
+         # add whitespace to splitter bounds expressions and compile into regexp object
-             wordlist=self.findWordRegExp(indexName,word)
+         bounds = self.splitter[indexName].bounds
-         else:
+         wordsplit = re.compile("(%s|\s)"%bounds)
-             wordlist=[word]
+         # clean word expression
+         # TODO: this should use QueryParser itself
+         word = word.replace('"','') # take out double quotes
+         # take out ignoreable signs
+         ignorable = self.splitter[indexName].ignorex
+         word = ignorable.sub('', word)
+         # split search terms by blanks
+         words = word.split(' ')
+         # split search terms again (for grapheme search with words)
+         splitwords = dict(((w,self.splitter[indexName].process([w])) for w in words))
-         for line in file.split("\n"):
+         for line in file.splitlines():
              line = unicodify(line)
-             found=False
+             # ignore lemma and other lines
-             for word in wordlist:
+             if line.lstrip().startswith('#lem:'):
-                 if line.find(word)>-1: #word ist gefunden dann makiere und breche die Schleife ab
+                 continue
-                         if lineList: #liste of moeglichen Zeilennummern
+             # ignore p-num line
-                                 num=line.split(".")[0] #Zeilenummer ist alles vor dem . in der Zeile
+             if line.startswith('&P'):
+                 continue
-                                 if num in lineList:
+             # ignore version lines
+             if line.startswith('#version'):
+                 continue
+             # ignore atf type lines
+             if line.startswith('#atf:'):
+                 continue
+             # first scan
+             hitwords = []
+             for w in words:
+                 if ignorable.sub('',line).find(w) > -1:
+                     # word is in line
+                     # append split word for grapheme search with words
+                     hitwords.extend(splitwords[w])
+                     #hitwords.extend(wordsplit.split(w))
+             # examine hits closer
+             if hitwords:
+                 # split line into words
+                 parts = wordsplit.split(line)
+                 line = ""
+                 for p in parts:
+                     #logging.debug("tagwordinfile: searching for %s in %s"%(p,hitwords))
+                     # reassemble line
+                     if ignorable.sub('', p) in hitwords:
+                         #logging.debug("tagwordinfile: found %s in %s"%(p,hitwords))
+                         # this part was found
+                         line += tagStart + formatAtfHtml(p) + tagEnd
+                     else:
+                         line += formatAtfHtml(p)
-                                         ret.append(line.replace(word,tagStr%word))
+             else:
+                 # no hits
+                 line = formatAtfHtml(line)
-                         else: # nimm alles ohne line check
-                                 ret.append(line.replace(word,tagStr%word))
-                         found=True
-                         break
-             if not found: #word wurde nicht gefunden keine makierung
                          ret.append(line)
          return u'<br>\n'.join(ret)
+     def tagWordInFiles(self,fileIds,word,indexName='graphemes',regExp=False):
+         """
+         get texts with highlighted word from all ids in list FileIds.
+         returns dict with id:text pairs.
+         @param fileIds: list of file ids, each one is handed to tagWordInFile
+         @param word: search term(s) to be highlighted
+         @param indexName: (optional) passed through to tagWordInFile
+         @param regExp: (optional) passed through to tagWordInFile
+         """
+         logging.debug("tagwordinfiles word='%s' index=%s file=%s"%(word,indexName,fileIds))
+         return dict([(id,self.tagWordInFile(id, word, indexName, regExp)) for id in fileIds])
+     def getFileVersionList(self, pnum):
+         """get the version history as a list for the translit file with the given pnum
+         @param pnum: value looked up in the 'textid' index of the file catalog
+         @return: result of getVersionList() of the first hit, or [] if nothing was found
+         """
+         f = getattr(self, self.file_catalog).search({'textid':pnum})
+         if not f:
+             return []
+         # only the first hit is used
+         return f[0].getObject().getVersionList()
      def URLquote(self,str):
          """quote str for use in a URL (wrapper around urllib.quote)"""
          return urllib.quote(str)
- Line 2549  class CDLIRoot(Folder):
+ Line 2763  class CDLIRoot(Folder):
                  pt=PageTemplateFile(os.path.join(package_home(globals()),'zpt','uploadATFWait.zpt')).__of__(self)
                  return pt(txt='/uploadATFfinally',threadName=threadName)
              else:
+               idTmp=self.REQUEST.SESSION['idTmp']
+               stObj=getattr(self.temp_folder,idTmp)
                self.REQUEST.SESSION['idTmp']=None
+               #update changed
+               logging.debug("dir:"+repr(stObj.returnValue['changed']))
+               for x in stObj.returnValue['changed']:
+                     ob=self.CDLICatalog.search({'title':x[0]})
+                     self.cdliRoot.updateOrAddToFileBTree(ob[0].getObject())
                if RESPONSE is not None:
                    RESPONSE.redirect(self.absolute_url())
      def importFiles(self,comment="",author="" ,folderName="/Users/dwinter/atf", files=None,ext=None):
          """import files"""
+         logging.debug("importFiles folderName=%s files=%s ext=%s"%(folderName,files,ext))
          root=self.cdli_main
          count=0
          if not files:
- Line 2563  class CDLIRoot(Folder):
+ Line 2789  class CDLIRoot(Folder):
          for f in files:
              folder=f[0:3]
              f2=f[0:5]
+             #check if main folder PXX already exists
              obj=self.ZopeFind(root,obj_ids=[folder])
+             logging.debug("importFiles: folder=%s f2=%s obj=%s"%(folder,f2,obj))
              if ext:
                  ext.result="<p>adding: %s </p>"%f+ext.result
-             if not obj:
+             if not obj: # if not create it
                  manage_addCDLIFileFolder(root,folder,folder)
                  fobj=getattr(root,folder)
                  #transaction.get().commit()
              else:
                  fobj=obj[0][1]
+             #check if PYYYYY already exists
              obj2=fobj.ZopeFind(fobj,obj_ids=[f2])
+             logging.debug("importFiles: fobj=%s obj2=%s"%(fobj,obj2))
-             if not obj2:
+             if not obj2:# if not create it
                  manage_addCDLIFileFolder(fobj,f2,f2)
                  fobj2=getattr(fobj,f2)
              else:
                  fobj2=obj2[0][1]
+             # now add the file
              file2=os.path.join(folderName,f)
              id=f
-             manage_addCDLIFile(fobj2,f,'','')
+             logging.debug("importFiles: addCDLIFile fobj2=%s, f=%s file2=%s"%(fobj2,repr(f),repr(file2)))
-             id=f
+             fobj2.addFile(vC='',file=file(file2),author=author,newName=f)
-             ob=fobj2._getOb(f)
-             ob.title=id
-             manage_addCDLIFileObject(ob,id,comment,author,file2,content_type='',from_tmp=True)
-             self.CDLICatalog.catalog_object(ob)
-             #self.CDLICatalog.manage_catalogFoundItems(obj_ids=[id],search_sub=1)
-             #self.CDLICatalog.manage_catalogObject(self.REQUEST, self.REQUEST.RESPONSE, 'CDLICatalog', urlparse.urlparse(ob.absolute_url())[1])
              count+=1
-             if count > 1000:
+             #now add the file to the storage
-                 print "committing"
+             ob = getattr(fobj2,f)
+             self.cdliRoot.updateOrAddToFileBTree(ob)
+             if count%100==0:
+                 logging.debug("importfiles: committing")
                  transaction.get().commit()
-                 count=0
              transaction.get().commit()
          return "ok"

FreeBSD-CVSweb <freebsd-cvsweb@FreeBSD.org>

Removed from v.1.79
changed lines
	Added in v.1.86