cdli/cdli_files.py - diff

Return to cdli_files.py CVS log

Up to [Repository] / cdli

Diff for /cdli/cdli_files.py between versions 1.114 and 1.117

version 1.114, 2009/09/01 08:36:04	version 1.117, 2011/04/27 16:19:27
Line 90 class CDLIFileObject(CatalogAware,extVer	Line 90 class CDLIFileObject(CatalogAware,extVer
def getPNumber(self):	def getPNumber(self):
"""get the pnumber"""	"""get the pnumber"""
try:	try:
txt=re.match("&[Pp](\d)\s=([^\r\n]*)",self.getData()[0:])	txt=re.match("&[PpSs](\d)\s=([^\r\n]*)",self.getData()[0:])
except:	except:
txt=self.getData()[0:]	txt=self.getData()[0:]

Line 104 class CDLIFileObject(CatalogAware,extVer	Line 104 class CDLIFileObject(CatalogAware,extVer
def getDesignation(self):	def getDesignation(self):
"""get the designation out of the file"""	"""get the designation out of the file"""
try:	try:
txt=re.match("&[Pp](\d)\s=([^\r\n]*)",self.getData()[0:])	txt=re.match("&[PpSs](\d)\s=([^\r\n]*)",self.getData()[0:])
except:	except:
txt=self.getData()[0:]	txt=self.getData()[0:]

Line 306 def manage_addCDLIFile(self,id,title,loc	Line 306 def manage_addCDLIFile(self,id,title,loc

def checkUTF8(data):	def checkUTF8(data):
"""check utf 8"""	"""check utf 8"""
	if not isinstance(data, str):
	logging.error("checkUTF8 data is not string! (%s)"%repr(data))

try:	try:
data.encode('utf-8')	data.decode('utf-8')
	logging.debug("checkUTF8: ok!")
return True	return True
except:	except:
	logging.debug("checkUTF8: false!")
return False	return False


Line 318 def checkFile(filename,data,folder):	Line 323 def checkFile(filename,data,folder):
# first check the file name	# first check the file name
fn=filename.split(".") # no extension	fn=filename.split(".") # no extension

if not fn[0][0]=="P":	if not (fn[0][0]=="P" or fn[0][0]=="S"):
return False,"P missing in the filename"	return False,"P/S missing in the filename"
elif len(fn[0])!=7:	elif len(fn[0])!=7:
return False,"P number has not the right length 6"	return False,"P number has not the right length 6"
elif not checkUTF8(data):	elif not checkUTF8(data):
Line 335 def splitatf(fh,dir=None,ext=None):	Line 340 def splitatf(fh,dir=None,ext=None):
i=0	i=0

#ROC: why split \n first and then \r???	#ROC: why split \n first and then \r???
if (type(fh) is StringType) or (type(fh) is UnicodeType):	if isinstance(fh, basestring):
iter=fh.split("\n")	iter=fh.split("\n")
else:	else:
iter=fh.readlines()	iter=fh.readlines()
Line 369 def splitatf(fh,dir=None,ext=None):	Line 374 def splitatf(fh,dir=None,ext=None):
if dir:	if dir:
filename=os.path.join(dir,filename)	filename=os.path.join(dir,filename)
nf=file(filename,"w")	nf=file(filename,"w")
logging.info("open %s"%filename)	logging.debug("open %s"%filename)
if nf:	if nf:
nf.write(line.replace("\n","")+"\n")	nf.write(line.replace("\n","")+"\n")

Line 378 def splitatf(fh,dir=None,ext=None):	Line 383 def splitatf(fh,dir=None,ext=None):
except:	except:
pass	pass

if not((type(fh) is StringType) or (type(fh) is UnicodeType)):	if not isinstance(fh, basestring):
fh.close()	fh.close()

return ret,len(os.listdir(dir))	return ret,len(os.listdir(dir))


Line 888 class CDLIRoot(Folder):	Line 894 class CDLIRoot(Folder):



def searchText(self, query, index='graphemes'):	def searchText(self, query, index='graphemes', resultFilter=None):
"""searches query in the fulltext index and returns a list of file ids/P-numbers"""	"""searches query in the fulltext index and returns a list of file IDs/P-numbers
	resultFilter is matched against the beginning of the file ID"""
# see also: http://www.plope.com/Books/2_7Edition/SearchingZCatalog.stx#2-13	# see also: http://www.plope.com/Books/2_7Edition/SearchingZCatalog.stx#2-13
logging.debug("searchtext for '%s' in index %s"%(query,index))	logging.debug("searchtext for '%s' in index %s"%(query,index))
#import Products.ZCTextIndex.QueryParser	#import Products.ZCTextIndex.QueryParser
Line 900 class CDLIRoot(Folder):	Line 907 class CDLIRoot(Folder):
# do search	# do search
resultset = idx.search(query_request=idxQuery,sort_index='textid')	resultset = idx.search(query_request=idxQuery,sort_index='textid')
# put only the P-Number in the result	# put only the P-Number in the result
	if resultFilter is None:
results = [res.getId[:7] for res in resultset]	results = [res.getId[:7] for res in resultset]
	else:
	results = [res.getId[:7] for res in resultset if res.getId.startswith(resultFilter)]
logging.debug("searchtext: found %d texts"%len(results))	logging.debug("searchtext: found %d texts"%len(results))
return results	return results

Line 1000 class CDLIRoot(Folder):	Line 1010 class CDLIRoot(Folder):
if line.lstrip().startswith('#lem:'):	if line.lstrip().startswith('#lem:'):
continue	continue
# ignore p-num line	# ignore p-num line
if line.startswith('&P'):	if line.startswith('&P') or line.startswith('&S'):
continue	continue
# ignore version lines	# ignore version lines
if line.startswith('#version'):	if line.startswith('#version'):
Line 1091 class CDLIRoot(Folder):	Line 1101 class CDLIRoot(Folder):
lv.author=user	lv.author=user
lv.versionComment="XXXXXXX"	lv.versionComment="XXXXXXX"



gen
def forceunlock(self,REQUEST=None,user=None,fid=None):	def forceunlock(self,REQUEST=None,user=None,fid=None):
"break all locks"	"break all locks"
if fid is not None:	if fid is not None:
Line 1317 class CDLIRoot(Folder):	Line 1324 class CDLIRoot(Folder):

def uploadATFfinally(self,procedure='',comment="",basketname='',unlock=None,repeat=None,RESPONSE=None):	def uploadATFfinally(self,procedure='',comment="",basketname='',unlock=None,repeat=None,RESPONSE=None):
"""nowupload the files"""	"""nowupload the files"""



threadName=repeat	threadName=repeat
if not threadName or threadName=="":	if not threadName or threadName=="":
thread=uploadATFfinallyThread()	thread=uploadATFfinallyThread()

FreeBSD-CVSweb <freebsd-cvsweb@FreeBSD.org>

Removed from v.1.114
changed lines
	Added in v.1.117