--- cdli/cdli_files.py 2007/02/05 16:20:38 1.64
+++ cdli/cdli_files.py 2007/03/23 13:58:10 1.73
@@ -25,7 +25,41 @@ from BTrees.OOBTree import OOBTree
import logging
import transaction
import copy
+import codecs
+def generateXMLReturn(hash):
+ """generate the xml document that is returned by uploadATFRPC"""
+
+ ret=""
+
+ ret+=""
+ for error in hash['errors']:
+ ret+="""%s"""%error
+
+ ret+=""
+
+ ret+=""
+ for changed in hash['changed']:
+ ret+="""%s"""%changed
+ ret+=""
+
+ ret+=""
+ for new in hash['newPs']:
+ ret+=""""""%new
+ ret+=""
+
+ ret+=""
+ return ret
+
+
+
+
+
+
+
+
+
+
def unique(s):
"""Return a list of the elements in s, but without duplicates.
@@ -174,8 +208,8 @@ class uploadATFfinallyThread(Thread):
conn.close()
#set flag for end of this method
self.end=True
- logging.info("ended")
- return True
+ logging.info("ended")
+ return True
def __del__(self):
"""delete"""
@@ -195,8 +229,9 @@ class uploadATFfinallyThread(Thread):
self.result+="
Start processing
"
#shall I only upload the changed files?
+ logging.info("uploadATFfinally procedure: %s"%procedure)
if procedure=="uploadchanged":
- changed=[x[0] for x in SESSION.get('changed',[])]
+ changed=[x[0] for x in SESSION.get('changed',[])]
uploadFns=changed+SESSION.get('newPs',[])
#or all
@@ -213,53 +248,64 @@ class uploadATFfinallyThread(Thread):
uploadFns=[]
#do first the changed files
- i=0
+ i=0
for fn in uploadFns:
- i+=1
+ i+=1
founds=ctx2.CDLICatalog.search({'title':fn})
if len(founds)>0:
SESSION['author']=str(username)
self.result="Changing : %s"%fn+self.result
founds[0].getObject().manage_addCDLIFileObject('',comment,SESSION['author'],file=os.path.join(SESSION['tmpdir'],fn),from_tmp=True)
if i==200:
- i=0
- transaction.get().commit()
- logging.info("changing: do commit")
- transaction.get().commit()
- logging.info("changing: last commit")
+ i=0
+ transaction.get().commit()
+ logging.info("changing: do commit")
+
+ transaction.get().commit()
+ logging.info("changing: last commit")
#now add the new files
newPs=SESSION['newPs']
if len(newPs)>0:
tmpDir=SESSION['tmpdir']
+ logging.info("adding start")
self.result="
Adding files
"+self.result
#TODO: make this configurable, at the moment base folder for the files has to be cdli_main
ctx2.importFiles(comment=comment,author=str(username) ,folderName=tmpDir, files=newPs,ext=self)
-
+ logging.info("adding finished")
#unlock locked files?
if unlock:
+ logging.info("unlocking start")
self.result="Unlock files
"+self.result
unlockFns=[]
for x in os.listdir(SESSION['tmpdir']):
if not x in SESSION['errors']:
unlockFns.append(x)
-
+ logging.info("unlocking have now what to unlock")
+
for fn in unlockFns:
+ #logging.info("will unlock: %s"%fn)
founds=ctx2.CDLICatalog.search({'title':fn})
+ #logging.info("found it: %s"%repr(founds))
if len(founds)>0:
+ #logging.info("unlock: %s"%founds[0].getObject().getId())
SESSION['author']=str(username)
founds[0].getObject().lockedBy=""
+ logging.info("unlocking done")
- #if a basketname is give, add files to the basket
+ #if a basketname is given, add files to the basket
if not (basketname ==''):
- self.result="Add basket
"+self.result
+ logging.info("add to basket %s"%basketname)
+ self.result="Add to basket
"+self.result
basketId=ctx2.basketContainer.getBasketIdfromName(basketname)
if not basketId: # create new basket
+ logging.info("create basket %s"%basketname)
+ self.result="Create a new basket
"+self.result
ob=ctx2.basketContainer.addBasket(basketname)
basketId=ob.getId()
basket=getattr(ctx2.basketContainer,str(basketId))
@@ -270,7 +316,7 @@ class uploadATFfinallyThread(Thread):
RESPONSE.redirect(self.aq_parent.absolute_url())
-
+ logging.info("uploadfinally done")
return True
class tmpStore(SimpleItem):
@@ -329,6 +375,7 @@ class uploadATFThread(Thread):
ctx = self.getContext(app,serverport=self.serverport)
logging.info("run intern")
try:
+ logging.info("created: %s"%idTmp)
ctx.temp_folder._setObject(idTmp,tmpStore(idTmp))
except:
logging.error("thread upload: %s %s"%sys.exc_info()[0:2])
@@ -338,11 +385,12 @@ class uploadATFThread(Thread):
#ctx.cdliRoot.cdli_main.tmpStore2[self.getName()[0:]]=self.returnValue
-
+
transaction.get().commit()
conn.close()
+ return getattr(ctx.temp_folder,idTmp)
def getResult(self):
"""method for accessing result"""
@@ -413,11 +461,13 @@ class uploadATFThread(Thread):
#if not than add filename to the list of newfiles
data=file(os.path.join(dir,fn)).read()
- #status,msg=checkFile(fn,data,dir)
- status=True
- msg=""
+ status,msg=checkFile(fn,data,dir)
+ #status=True
+
+
if not status: # error
errors.append((fn,msg))
+
else:
if len(founds)==0:
newPs.append(fn)
@@ -441,7 +491,7 @@ class uploadATFThread(Thread):
stObj.returnValue={}
stObj.returnValue['errors']=errors
-
+
stObj.returnValue['newPs']=newPs
stObj.returnValue['tmpdir']=dir
stObj.returnValue['basketLen']=basketLen
@@ -465,6 +515,44 @@ class CDLIBasketContainer(OrderedFolder)
security=ClassSecurityInfo()
meta_type="CDLIBasketContainer"
+ def getPNumbersOfBasket(self,basketName):
+ """get all pnumbers of a basket as a list, returns an empty list if basket not found
+ @param basketName: name of the basket
+ """
+ ret=[]
+ basketId=self.getBasketIdfromName(basketName)
+ if not basketId:
+ return []
+
+ ob=getattr(self,basketId).getContent()
+
+ ret=[x[0].split(".")[0] for x in ob]
+
+ return ret
+
+ def getBasketAsOneFile(self,basketName,current="no"):
+ """returns all files of the basket combined in one file
+ @param basketName: Name of the basket
+ @param current: (optional) if current is set to "yes", the most recent version of
+ each file is returned instead of the version of the file as stored in the basket
+ """
+ ret=""
+ basketId=self.getBasketIdfromName(basketName)
+ if not basketId:
+ return ""
+
+ ob=getattr(self,basketId).getLastVersion()
+ for object in ob.getContent():
+ if current=="no": #version as they are in the basket
+ ret+=str(object[0].getData())+"\n"
+ elif current=="yes":
+ #search current object
+ logging.info("crrent: %s"%object[1].getId().split(".")[0])
+ founds=self.CDLICatalog.search({'title':object[1].getId().split(".")[0]})
+ if len(founds)>0:
+ ret+=str(founds[0].getObject().getLastVersion().getData())+"\n"
+ return ret
+
def upDateBaskets(self):
"""update content in to objects"""
@@ -492,12 +580,19 @@ class CDLIBasketContainer(OrderedFolder)
trash.manage_pasteObjects(cut)
security.declareProtected('manage','manageBaskets')
- def manageBaskets(self,ids,submit,REQUEST=None,RESPONSE=None):
+ def manageBaskets(self,submit,ids=None,basket1="",basket2="",joinBasket="",subtractBasket="",REQUEST=None,RESPONSE=None):
"""manage baskets, delete or copy"""
if submit=="delete":
self.deleteBaskets(ids)
-
+ elif submit=="join":
+ flag,msg=self.joinBasket(joinBasket, ids)
+ logging.info("joining %s %s"%(flag,msg))
+
+ elif submit=="subtract":
+ logging.info("BBBb %s %s"%(basket1,basket2))
+ flag,msg=self.subtractBasket(subtractBasket, basket1,basket2)
+ logging.info("subtract %s %s"%(flag,msg))
if RESPONSE:
RESPONSE.redirect(self.absolute_url())
@@ -561,7 +656,7 @@ class CDLIBasketContainer(OrderedFolder)
ret+= "BASKET:"+com+"\t"+user+"\t"+time+"\n"
for x in values:
ret+= x[0]+"\t"+x[1]+"\n"
- return ret
+ return ret
def getBaskets(self,sortField='title'):
"""get all baskets files"""
@@ -620,9 +715,83 @@ class CDLIBasketContainer(OrderedFolder)
baskets.sort(sortComment)
return baskets
+
+
+ def subtractBasket(self,newBasket,basket1,basket2):
+ """subtract basket2 from basket1
+ (i.e. newBasket will contain all elements of basket1 which are not in basket2),
+ if basket2 contains files which are not in basket1, then these files will be ignored
+
+ @param newBasket: name of the new basket
+ @param basket1: basket where basket2 will be subtracted from
+ @param basket2: see above
+
+ """
+ logging.info("CCCCC %s %s"%(basket1,basket2))
+
+ try:
+ newB=self.addBasket(newBasket)
+ except:
+ return False, "cannot create the new basket"
+
+
-
-
+
+
+ bas2= getattr(self,basket2)
+ bas2content=bas2.getContent()
+ bas2ids=[x[0] for x in bas2content]
+
+
+
+ bas1= getattr(self,basket1)
+ bas1content=bas1.getContent()
+
+
+ newBasketContent={}
+
+ for id,version in bas1content:
+ if not (id in bas2ids):
+ newBasketContent[id]=version
+
+ username=self.getActualUserName()
+
+ logging.info("sbc %s"%newBasketContent)
+ newB.addObjectsWithVersion(newBasketContent,username=username,catalog=self.CDLICatalog)
+
+ return True, ""
+
+
+ def joinBasket(self,newBasket,oldBaskets):
+ """join several baskets into a new basket; if an id occurs in more than one basket, the highest version number is kept
+ @param newBasket: name of the new basket
+ @param oldBaskets: list of baskets to be joined
+ """
+ try:
+ newB=self.addBasket(newBasket)
+ except:
+ return False, "cannot create the new basket"
+
+ newBasketContent={}
+ for ob in oldBaskets:
+ x= getattr(self,ob,None)
+ if x is None:
+ return False, "cannot find basket: %s"%ob
+
+ ids=x.getContent() # fetch the content
+
+ for id,version in ids:
+ if newBasketContent.has_key(id): # p-number is already present
+ newBasketContent[id]=max(newBasketContent[id],version) # keep the higher version number
+ else:
+ newBasketContent[id]=version
+ username=self.getActualUserName()
+
+ logging.info("nbc %s"%newBasketContent)
+ newB.addObjectsWithVersion(newBasketContent,username=username,catalog=self.CDLICatalog)
+
+ return True, ""
+
def getNewId(self):
"""createIds"""
last=getattr(self,'last',0)
@@ -636,11 +805,11 @@ class CDLIBasketContainer(OrderedFolder)
def setActiveBasket(self,basketId,REQUEST=None):
"""store active basketId in a cookie"""
self.REQUEST.RESPONSE.setCookie("CDLIActiveBasket",basketId,path="/")
- try:
- qs=cgi.parse_qs(REQUEST['QUERY_STRING'])
- del(qs['basketId'])
- except:
- qs={}
+ try:
+ qs=cgi.parse_qs(REQUEST['QUERY_STRING'])
+ del(qs['basketId'])
+ except:
+ qs={}
if REQUEST:
REQUEST.RESPONSE.redirect(REQUEST['URL1']+'?'+urllib.urlencode(qs))
@@ -664,7 +833,7 @@ class CDLIBasketContainer(OrderedFolder)
ob=manage_addCDLIBasket(self,newBasketName)
return ob
-
+
def storeInBasket(self,submit,ids=None,newBasketName=None,fromFileList=None,RESPONSE=None,REQUEST=None):
"""store it"""
if not ids:
@@ -766,7 +935,11 @@ class CDLIBasket(Folder,CatalogAware):
self.shortDescription=shortDescription
self.comment=comment
-
+ def getActualUserName(self):
+ """get the name of the current user"""
+
+ return str(self.REQUEST['AUTHENTICATED_USER'])
+
def getLastVersion(self):
"""hole letzte version"""
@@ -830,9 +1003,59 @@ class CDLIBasket(Folder,CatalogAware):
return obj
+ def addObjectsWithVersion(self,ids,deleteOld=None,username=None,catalog=None):
+ """generate a new version of the basket with objects added,
+ here, however, it is not the latest version of each file that is added;
+ instead ids maps each id (i.e. the p-number) to the version number to be added.
+ """
+ logging.info("add to basket (%s)"%(self.getId()))
+ lastVersion=self.getLastVersion()
+
+ if not catalog:
+ catalog=self.CDLICatalog
+
+ if lastVersion is None:
+ oldContent=[]
+ else:
+ oldContent=lastVersion.content.getContent()
+
+ if deleteOld:
+ oldContent=[]
+
+ newContent=[]
+ added=0
+
+ for id,version in ids.iteritems():
+ logging.info("adding %s %s"%(id,version))
+ id=id.split(".")[0] # the title is only the p-number, without the atf extension
+
+ try:
+ founds=catalog.search({'title':id})
+ except:
+ founds=[]
+ logging.info(" found %s "%(founds))
+ for found in founds:
+ if found.getObject() not in oldContent:
+
+ #TODO: what happens if an object is added that is already present, but in a newer version
+ newContent.append((found.getObject().getVersions()[version-1][1],found.getObject()))
+ added+=1
+
+ content=oldContent+newContent
+ if not username:
+ logging.error("XXXXXXXXXXX %s"%repr(self))
+ user=self.getActualUserName()
+ else:
+ user = username
+
+ ob=manage_addCDLIBasketVersion(self,user,comment="",basketContent=content)
+ logging.info("add to basket (%s) done"%(self.getId()))
+ return added
+
+
def addObjects(self,ids,deleteOld=None,username=None):
"""generate a new version of the basket with objects added"""
-
+ logging.info("add to basket (%s)"%(self.getId()))
lastVersion=self.getLastVersion()
if lastVersion is None:
@@ -846,10 +1069,11 @@ class CDLIBasket(Folder,CatalogAware):
newContent=[]
added=0
for id in ids:
- try:
- founds=self.CDLICatalog.search({'title':id})
- except:
- founds=[]
+ try:
+ founds=self.CDLICatalog.search({'title':id})
+ except:
+ founds=[]
+
for found in founds:
if found.getObject() not in oldContent:
#TODO: was passiert wenn, man eine Object dazufgt, das schon da ist aber eine neuere version
@@ -863,12 +1087,22 @@ class CDLIBasket(Folder,CatalogAware):
user = username
ob=manage_addCDLIBasketVersion(self,user,comment="",basketContent=content)
-
+ logging.info("add to basket (%s) done"%(self.getId()))
return added
-
+ def getContent(self):
+ """return the content of the last version as a list of (id, version number) tuples"""
+ ret=[]
+
+ lv=self.getLastVersion()
+ for obj in lv.content.getContent():
+ logging.info("XXXXXXXXXX %s"%repr(obj))
+ ret.append((obj[1].getId(),obj[0].versionNumber))
+
+ return ret
+
def getContentIds(self):
"""print basket content"""
ret=[]
@@ -955,6 +1189,21 @@ class CDLIBasketVersion(Implicit,Persist
return True
return False
+ def downloadListOfPnumbers(self):
+ """download pnumbers of the basket as list"""
+
+ basket_name=self.aq_parent.title
+
+ ids=self.getContent() # get the list of objects
+ logging.error(ids)
+ ret="\n".join([x[1].getId().split(".")[0] for x in ids])
+
+ self.REQUEST.RESPONSE.setHeader("Content-Disposition","""attachement; filename="%s.txt" """%basket_name)
+ self.REQUEST.RESPONSE.setHeader("Content-Type","application/octet-stream")
+ length=len(ret)
+ self.REQUEST.RESPONSE.setHeader("Content-Length",length)
+ self.REQUEST.RESPONSE.write(ret)
+
security.declareProtected('View','downloadObjectsAsOneFile')
def downloadObjectsAsOneFile(self,lock=None,procedure=None,REQUEST=None,check="yes",current="no"):
"""download all selected files in one file"""
@@ -1027,7 +1276,7 @@ class CDLIBasketVersion(Implicit,Persist
ret+=str(object[0].getData())+"\n"
elif current=="yes":
#search current object
- founds=self.CDLICatalog.search({'title':object[0].getId()})
+ founds=self.CDLICatalog.search({'title':object[1].getId().split(".")[0]})
if len(founds)>0:
ret+=str(founds[0].getObject().getLastVersion().getData())+"\n"
@@ -1170,7 +1419,8 @@ class CDLIFileObject(CatalogAware,extVer
def getFormattedData(self):
"""fromat text"""
data=self.getData()
- return re.sub("\s\#lem"," #lem",data) #remove return vor #lem
+# return re.sub("\s\#lem"," #lem",data) #remove return vor #lem
+ return re.sub("#lem"," #lem",data) #remove return vor #lem
def view(self):
"""view file"""
@@ -1407,7 +1657,14 @@ def manage_addCDLIFile(self,id,title,loc
if RESPONSE is not None:
RESPONSE.redirect('manage_main')
-
+def checkUTF8(data):
+ """check utf 8"""
+ try:
+ data.encode('utf-8')
+ return True
+ except:
+ return False
+
def checkFile(filename,data,folder):
"""check the files"""
@@ -1418,17 +1675,11 @@ def checkFile(filename,data,folder):
return False,"P missing in the filename"
elif len(fn[0])!=7:
return False,"P number has not the right length 6"
+ elif not checkUTF8(data):
+ return False,"not utf-8"
else:
- fn=os.path.join(folder,filename)
- stin,out=os.popen4("/usr/bin/atfcheck.plx %s"%fn)
- value=out.read()
- ret= out.close()
-
- if value:
-
- return False,"atf checker error: %s"%value
- else:
- return True,""
+ return True,""
+
def splitatf(fh,dir=None,ext=None):
"""split it"""
@@ -1436,42 +1687,51 @@ def splitatf(fh,dir=None,ext=None):
nf=None
i=0
- for lineTmp in fh.readlines():
- for line in lineTmp.split("\r"):
- if ext:
- i+=1
- if (i%100)==0:
- ext.result+="."
- if i==10000:
- i=0
- ext.result+="
"
- #check if basket name is in the first line
- if line.find("#atf basket")>=0: #old convention
- ret=line.replace('#atf basket ','')
- ret=ret.split('_')[0]
- elif line.find("#basket:")>=0: #new convention
- ret=line.replace('#basket: ','')
- ret=ret.split('_')[0]
-
- else:
- if (len(line.lstrip())>0) and (line.lstrip()[0]=="&"): #newfile
- if nf:
- nf.close() #close last file
-
-
- filename=line[1:].split("=")[0].rstrip()+".atf"
- if dir:
- filename=os.path.join(dir,filename)
- nf=file(filename,"w")
- logging.info("open %s"%filename)
- if nf:
- nf.write(line.replace("\n","")+"\n")
+ if (type(fh) is StringType) or (type(fh) is UnicodeType):
+ iter=fh.split("\n")
+ else:
+ iter=fh.readlines()
+
+ for lineTmp in iter:
+ lineTmp=lineTmp.replace(codecs.BOM_UTF8,'') # make sure that all BOM are removed..
+ for line in lineTmp.split("\r"):
+ #logging.log("Deal with: %s"%line)
+ if ext:
+ i+=1
+ if (i%100)==0:
+ ext.result+="."
+ if i==10000:
+ i=0
+ ext.result+="
"
+ #check if basket name is in the first line
+ if line.find("#atf basket")>=0: #old convention
+ ret=line.replace('#atf basket ','')
+ ret=ret.split('_')[0]
+ elif line.find("#basket:")>=0: #new convention
+ ret=line.replace('#basket: ','')
+ ret=ret.split('_')[0]
+
+ else:
+ if (len(line.lstrip())>0) and (line.lstrip()[0]=="&"): #newfile
+ if nf:
+ nf.close() #close last file
+
- try:
- nf.close()
+ filename=line[1:].split("=")[0].rstrip()+".atf"
+ if dir:
+ filename=os.path.join(dir,filename)
+ nf=file(filename,"w")
+ logging.info("open %s"%filename)
+ if nf:
+ nf.write(line.replace("\n","")+"\n")
+
+ try:
+ nf.close()
except:
- pass
- fh.close()
+ pass
+
+ if not((type(fh) is StringType) or (type(fh) is UnicodeType)):
+ fh.close()
return ret,len(os.listdir(dir))
@@ -1522,6 +1782,16 @@ class CDLIFileFolder(extVersionedFileFol
return ret
+ def getFile(self,fn):
+ """get the content of the file fn"""
+ founds=self.CDLICatalog.search({'title':fn})
+ if not founds:
+ return ""
+ else:
+ obj=founds[0].getObject().getLastVersion()
+
+ return obj.getData()[0:]
+
def checkCatalog(self,fn):
"""check if fn is in the catalog"""
#TODO add checkCatalog
@@ -1544,7 +1814,13 @@ class CDLIFileFolder(extVersionedFileFol
return pt(search=list,author=author)
-
+ def getAllPNumbers(self):
+ """get a list of all files (resp their p-numbers) stored"""
+
+ ret=[x.getId for x in self.CDLICatalog()]
+
+ return ret
+
def findObjectsFromList(self,enterList=None,display=False,start=None,upload=None,list=None,basketName=None,numberOfObjects=None,RESPONSE=None):
"""findObjectsFromList (, TAB oder LINE separated)"""
@@ -1615,8 +1891,8 @@ class CDLIFileFolder(extVersionedFileFol
catalog=getattr(self,self.default_catalog)
#tf,tfilename=mkstemp()
- if not hasattr(self.temp_folder,'downloadCounter'):
- self.temp_folder.downloadCounter=0
+ if not hasattr(self.temp_folder,'downloadCounter'):
+ self.temp_folder.downloadCounter=0
if getattr(self.temp_folder,'downloadCounter',0) > 5:
return """I am sorry, currently the server has to many requests for downloads, please come back later!"""
@@ -1641,6 +1917,7 @@ class CDLIFileFolder(extVersionedFileFol
#os.write(tf,obj.getLastVersion().data)
if RESPONSE:
RESPONSE.write(obj.getLastVersion().getData()[0:])
+ RESPONSE.write("\n")
self.temp_folder.downloadCounter-=1
self._p_changed=1
transaction.get().commit()
@@ -1725,78 +2002,137 @@ class CDLIRoot(Folder):
meta_type="CDLIRoot"
downloadCounterBaskets=0# counts the current basket downloads if counter > 10 no downloads are possible
- def findWordRegExp(self,searchTerm):
- """find all words in index which match regexp in SearchTerm"""
+ def deleteFiles(self,ids):
+ """delete files (resp. move into .trash folder)"""
+ # find or create the trash folder
+
+ found=self.ZopeFind(self,obj_ids=['.trash'])
+
+ if len(found)<1:
+ manage_addCDLIFileFolder(self, '.trash',title="Trash")
+ trash=self._getOb('.trash')
+ else:
+ logging.info(found)
+ trash=found[0][1]
+
+
+ for id in ids:
+ founds=self.CDLICatalog.search({'title':id.split(".")[0]})
+ if founds:
+ logging.info(founds)
+ folder=founds[0].getObject().aq_parent #get the parent folder of the object
+ logging.info(folder)
+ cut=folder.manage_cutObjects([founds[0].getId]) #cut it out
+ trash.manage_pasteObjects(cut) #paste it in the trash
+
+
+ def findWordRegExp(self,indexName,searchTerm):
+ """find all words in index which match regexp in SearchTerm
+ @param indexName: name of the index to be searched in
+ @param searchTerm: word to be searched"""
+
ret=[]
- for x in self.lineIndex.iterkeys():
+ for x in self.lineIndexes[indexName].iterkeys():
if re.match(searchTerm,x):
ret.append(x)
return ret
- def searchRegExpInLineIndexDocs(self,searchTerm):
- """search in inLineIndex with regexp"""
+ def searchRegExpInLineIndexDocs(self,indexName,searchTerm):
+ """search in inLineIndex with regexp
+ @param indexName: name of the index to be searched in
+ @param searchTerm: term to be searched
+ """
if not searchTerm:
return []
ret=[]
- words=self.findWordRegExp(searchTerm) # suche nach allen Treffern
+ words=self.findWordRegExp(indexName,searchTerm) # suche nach allen Treffern
logging.info("wd:%s"%words)
for word in words:
- ret+=self.searchInLineIndexDocs(word)
+ ret+=self.searchInLineIndexDocs(indexName,word)
return unique(ret)
def showInLineIndex(self):
"""get the index for debug purposes"""
print "show"
- for x in self.lineIndex.iterkeys():
- logging.info("word:%s"%repr(x))
- #for y in self.lineIndex[x].iterkeys():
- # print "doc",repr(y),repr(self.lineIndex[x][y])
-
- return self.lineIndex
+ for key in self.lineIndexes.keys():
+ logging.info("index:%s"%key)
+ for x in self.lineIndexes[key].iterkeys():
+ logging.info("word:%s"%repr(x))
+ #for y in self.lineIndex[x].iterkeys():
+ # print "doc",repr(y),repr(self.lineIndex[x][y])
+
+ return self.lineIndexes
- def searchInLineIndexDocs(self,word,uniq=True,regExp=False):
- """search occurences"""
+ def searchInLineIndexDocs(self,indexName,word,uniq=True,regExp=False):
+ """search occurences in an index
+ @param indexName: name of the index to be searched in
+ @param word: word to be searched
+ @param uniq: (optional) remove duplicates from the list of results
+ @param regExp: (optional) use regular expressions
+ """
if regExp:
- return self.searchRegExpInLineIndexDocs(word)
+ return self.searchRegExpInLineIndexDocs(indexName,word)
try:
- lst=list(self.lineIndex.get(word).keys())
+
+ lst=list(self.lineIndexes[indexName].get(word).keys())
except:
+ logging.error("error: searchInLineIndexDocs (%s %s)"%(sys.exc_info()[0:2]))
lst=[]
if uniq:
return unique(lst)
else:
return lst
- def getLinesFromIndex(self,word,doc,regExp=False):
- """get lines"""
+ def getLinesFromIndex(self,indexName,word,doc,regExp=False):
+ """return all lines from a document where word is found
+ @param indexName: Name of the index
+ @param word: word to be searched
+ @param doc: name of the document (usually the p-number)
+ @param regExp: (optional) use regExp
+ """
+
if not regExp:
- return self.lineIndex.get(word)[doc]
+ return self.lineIndexes[indexName].get(word)[doc]
else: # wenn regexp, suche welches word
- for w in self.findWordRegExp(word):
- if self.lineIndex.get(w): # ein word in im dex gefunden
+ for w in self.findWordRegExp(indexName,word):
+ if self.lineIndexes[indexName].get(w): # a word was found in the index
try:
- dc=self.lineIndex.get(word)[doc]
+ dc=self.lineIndex[indexName].get(word)[doc]
return dc # und ein document dann gib es zurueck
except:
pass #andernfalls weiter
- def cleanInLineIndex(self):
- """delete InlineIndex"""
- for x in list(self.lineIndex.keys()):
- del(self.lineIndex[x])
- print [x for x in self.lineIndex.keys()]
+ def cleanInLineIndex(self,indexName):
+ """empty an InlineIndex
+ @param indexName: name of the index
+ """
+ for x in list(self.lineIndexes[indexName].keys()):
+ del(self.lineIndexes[indexName][x])
+ print [x for x in self.lineIndexes[indexName].keys()]
return "ok"
- def storeInLineIndex(self,key,value):
- """store in index"""
-
- if (not hasattr(self,'lineIndex')) or (type(self.lineIndex) is DictType):
- self.lineIndex=OOBTree()
- li=self.lineIndex
+ def storeInLineIndex(self,indexName,key,value):
+ """store in index, key is normally a word or grapheme
+ and value is a tuple (documentname, line) where the word can be found
+ @param indexName: name of the index
+ @param key: key in index
+ @param value: value in index, value is a tuple (document name, line)
+ """
+ logging.error("indexing: %s %s"%(indexName,key))
+ if (not hasattr(self,'lineIndexes')):
+
+ self.lineIndexes={}
+
+ if self.lineIndexes.get(indexName,None) is None:
+ #index does not exist yet, so create it
+
+ self.lineIndexes[indexName]=OOBTree()
+ lis=self.lineIndexes
+ li=lis[indexName]
if li.has_key(key):
@@ -1814,81 +2150,80 @@ class CDLIRoot(Folder):
li[key][value[0]]=[value[1]]
- self.lineIndex=li
+ self.lineIndexes=lis
transaction.get().commit()
def showFile(self,fileId):
- """show a file"""
+ """show a file
+ @param fileId: P-Number of the document to be displayed
+ """
f=self.CDLICatalog({'title':fileId})
if not f:
return ""
return f[0].getObject().getLastVersionFormattedData()
- def showLineFromFile(self,fileId,lineNum,word):
- """get line lineNum fromFileId"""
-
- file=self.showFile(fileId)
- #str="^%s\.[^%s\.]*%s[^\n]*\n"%(lineNum,lineNum,word)
- #str="^%s\..*?%s[^\n]*\n"%(lineNum,word)
-
- #print str
- #m=re.search(str,file,flags=re.M|re.DOTALL)
- #if m:
- # return m.group()
- #else:
- # return ""
- #ret=lineNum+"."
- #splitted=file.split(lineNum+".")
- #if len(splitted)>1:
- #for part in splitted[1:]:
- #if part.find(word)>-1:
- # for x in part.split("\n"):
- #ret+=x
- #if x.find(word)>-1:
- #break
- #break;
- #return ret
- def showWordInFile(self,fileId,word,lineList=None):
+ def showWordInFile(self,fileId,word,lineList=None,regExp=True,indexName=""):
"""get lines with word fromFileId"""
file=self.showFile(fileId)
- ret=[]
- for line in file.split("\n"):
- if line.find(word)>-1:
- if lineList: #liste of moeglichen Zeilennummern
- num=line.split(".")[0] #Zeilenummer ist alles vor dem . in der Zeile
-
- if num in lineList:
-
- ret.append(line)
- else: # nimm alles ohne line check
- ret.append(line)
- return ret
+ ret=[]
+ if regExp: # if regexp, collect all words from the index that match the regexp
+ wordlist=self.findWordRegExp(indexName,word)
+ else:
+ wordlist=[word]
+
+ for line in file.split("\n"):
+ found=False
+ for word in wordlist:
+ if line.find(word)>-1:
+ if lineList: #list of possible line numbers
+ num=line.split(".")[0] #the line number is everything before the . in the line
+
+ if num in lineList:
+
+ ret.append(line)
+ else: # take everything, without the line check
+ ret.append(line)
+
+ break;
+ return ret
- def tagWordInFile(self,fileId,word,lineList=None):
+ def tagWordInFile(self,fileId,word,lineList=None,regExp=True,indexName=""):
"""get lines with word fromFileId"""
file=self.showFile(fileId)
- tagStr="""%s"""
- ret=[]
- for line in file.split("\n"):
- if line.find(word)>-1:
- if lineList: #liste of moeglichen Zeilennummern
- num=line.split(".")[0] #Zeilenummer ist alles vor dem . in der Zeile
-
- if num in lineList:
-
- ret.append(line.replace(word,tagStr%word))
- else: # nimm alles ohne line check
- ret.append(line.replace(word,tagStr%word))
- else:
- ret.append(line)
- return "
\n".join(ret)
+ tagStr="""%s"""
+ ret=[]
+
+ if regExp: # if regexp, collect all words from the index that match the regexp
+ wordlist=self.findWordRegExp(indexName,word)
+ else:
+ wordlist=[word]
+
+ for line in file.split("\n"):
+ found=False
+ for word in wordlist:
+ if line.find(word)>-1: #word was found, so tag it and leave the loop
+ if lineList: #list of possible line numbers
+ num=line.split(".")[0] #the line number is everything before the . in the line
+
+ if num in lineList:
+
+ ret.append(line.replace(word,tagStr%word))
+
+ else: # take everything, without the line check
+ ret.append(line.replace(word,tagStr%word))
+ found=True
+ break
+ if not found: #word was not found, so no tagging
+ ret.append(line)
+
+ return "
\n".join(ret)
def URLquote(self,str):
"""quote url"""
@@ -1917,19 +2252,8 @@ class CDLIRoot(Folder):
ret.append((f[0],un))
return ret
-
- def forceDahl(self):
- "break all locks"
- ret=[]
- for f in self.ZopeFind(self,obj_metatypes="CDLI file",search_sub=1):
- if str(f[1].lockedBy)=="dahl":
- un=f[1].forceunlock()
-
- if un and un !="":
- ret.append((f[0],un))
+
- return ret
-
def getChangesByAuthor(self,author,n=100):
"""getChangesByAuthor"""
zcat=self.CDLIObjectsCatalog
@@ -1991,10 +2315,40 @@ class CDLIRoot(Folder):
return ret
-
+ def uploadATFRPC(self,data,username):
+ """upload an atffile via xml-rpc"""
+ uploader=uploadATFThread()
+
+ #generate a random id for the upload object
+ from random import randint
+ if (not self.REQUEST.SESSION.get('idTmp',None)):
+
+ idTmp=str(randint(0,1000000000))
+ self.REQUEST.SESSION['idTmp']=idTmp
+ else:
+ idTmp=self.REQUEST.SESSION.get('idTmp',None)
+
+
+ uploader.set(data,0,username,idTmp)
+
+ stObj=uploader.run()
+
+ processor=uploadATFfinallyThread()
+
+ basketname=stObj.returnValue['basketNameFromFile']
+
+ processor.set("uploadchanged",basketname=basketname,SESSION=stObj.returnValue,username=username,serverport=self.REQUEST['SERVER_PORT'])
+
+ processor.run()
+
+
+ return generateXMLReturn(stObj.returnValue)
+
def uploadATF(self,repeat=None,upload=None,basketId=0,RESPONSE=None):
- """standard ausgabe"""
+ """upload an atf file / basket file"""
#self._v_uploadATF.returnValue=None
+
+ #generate a random id for the upload thread
from random import randint
if (not self.REQUEST.SESSION.get('idTmp',None)):
@@ -2003,8 +2357,10 @@ class CDLIRoot(Folder):
else:
idTmp=self.REQUEST.SESSION.get('idTmp',None)
+
threadName=repeat
if not threadName or threadName=="":
+ #new thread not called from the waiting page
tmpVar=False
thread=uploadATFThread()
@@ -2052,26 +2408,8 @@ class CDLIRoot(Folder):
return pt(txt='/uploadATF',threadName=threadName)
else:
-# tmp={}
-# for key in self._v_uploadATF[threadName].returnValue.keys():
-# t=self._v_uploadATF[threadName].returnValue[key]
-# if type(t) is ListType:
-# tmp[key]=self._v_uploadATF[threadName].returnValue[key][0:]
-# else:
-# tmp[key]=self._v_uploadATF[threadName].returnValue[key]
-# repr(tmp[key]),repr(key)
-#
-# #
- #tmp=self.cdli_main.tmpStore2[threadName]
-
tmp=getattr(self.temp_folder,idTmp).returnValue
-
-
-
-
- #del(self.cdli_main.tmpStore2[threadName])
-
-
+
pt=PageTemplateFile(os.path.join(package_home(globals()),'zpt','uploadCheck.zpt')).__of__(self)
return pt(changed=tmp['changed'],lockerrors=tmp['lockerrors'],errors=tmp['errors'],dir=tmp['dir'],newPs=tmp['newPs'],basketLen=tmp['basketLen'],numberOfFiles=tmp['numberOfFiles'],
@@ -2152,7 +2490,7 @@ class CDLIRoot(Folder):
obj=self.ZopeFind(root,obj_ids=[folder])
if ext:
- ext.result+="adding: %s
"%f
+ ext.result="adding: %s
"%f+ext.result
if not obj:
manage_addCDLIFileFolder(root,folder,folder)
fobj=getattr(root,folder)
@@ -2180,13 +2518,13 @@ class CDLIRoot(Folder):
self.CDLICatalog.catalog_object(ob)
#self.CDLICatalog.manage_catalogFoundItems(obj_ids=[id],search_sub=1)
#self.CDLICatalog.manage_catalogObject(self.REQUEST, self.REQUEST.RESPONSE, 'CDLICatalog', urlparse.urlparse(ob.absolute_url())[1])
- count+=1
+ count+=1
- if count > 1000:
- print "committing"
- transaction.get().commit()
- count=0
- transaction.get().commit()
+ if count > 1000:
+ print "committing"
+ transaction.get().commit()
+ count=0
+ transaction.get().commit()
return "ok"
@@ -2207,9 +2545,9 @@ def manage_addCDLIRoot(self, id, title='
ob.id=str(id)
ob.title=title
try:
- self._setObject(id, ob)
+ self._setObject(id, ob)
except:
- pass
+ pass
ob=self._getOb(id)
checkPermission=getSecurityManager().checkPermission