--- MPIWGWeb/Attic/nameSplitter.py 2006/09/13 08:17:33 1.1.2.2 +++ MPIWGWeb/Attic/nameSplitter.py 2010/02/15 19:04:24 1.1.2.4 @@ -5,7 +5,7 @@ name splitter from Products.ZCTextIndex.ISplitter import ISplitter from Products.ZCTextIndex.PipelineFactory import element_factory -import psycopg + import re from types import StringType @@ -41,7 +41,7 @@ class nameSplitter: default_encoding = "utf-8" def process(self, lsttmp): - print "XXX" + import psycopg result = [] o = psycopg.connect('dbname=authorities user=dwinter password=3333',serialize=0) c = o.cursor() @@ -73,7 +73,7 @@ except: pass if __name__ == '__main__': - a = 'abc def我们的很 好。' + a = 'abc def\U00CE\U00D2\U00D3\U00C7\U00B5\U00C4 \U00DC\U00C3\U00A1\U00A3' u = unicode(a, 'gbk') s = authorSplitter() print s.process([u])