--- OSAS/OSA_system/OSAS_search.py	2004/07/05 21:08:55	1.2
+++ OSAS/OSA_system/OSAS_search.py	2004/07/09 16:55:19	1.3
@@ -119,6 +119,12 @@ class OSAS_search(SimpleItem):
 	
     def dbSearch(self, query, type):
         """search DB for query and return result set"""
+        results = []
+        restypes = {}
+        if not query:
+            # empty query
+            return results
+        
         curs = self.dbCursor()
         if type == 'equals':
             qs = query
@@ -127,19 +133,19 @@ class OSAS_search(SimpleItem):
         elif type == 'contains':
             qs = "%" + query + "%"
             
-        sql = 'select fileid,idx,tags,content from meta where content like %(qs)s'
+        sql = 'select fileid,idx,tags,content from meta where lower(content) like lower(%(qs)s)'
         print sql, " -> ", qs
         curs.execute(sql, {'qs':qs})
         print "done"
-        results = []
         res = curs.fetchone()
         rescnt = 1
         #print "res0:", res
         while res and rescnt < MAXHITS:
             #print "res:", res
             result = self.getResult(res)
-            if (result):
+            if result:
                 results.append(result)
+                restypes[result.type] = result.type
                 
             res = curs.fetchone()
             rescnt += 1
@@ -148,7 +154,8 @@ class OSAS_search(SimpleItem):
         #self.dbCon = None
 
         #print "SEARCH: ", rescnt, " results"
-        return results
+        restypelist = restypes.keys()
+        return (results, restypelist)
 
         
     def getResult(self, db_result, rank=0):
@@ -165,15 +172,31 @@ class OSAS_search(SimpleItem):
             res = AnyResult(self, db_result, rank)
 
         return res
+
 	
     def renderResult(self, result):
         """returns HTML rendering of a search result"""
 
         return result.render(self)
 	
-	
-	
-	
+
+    def filterResults(self, results, start, end, restypefilter=None):
+        """returns list of results that match a filter"""
+        # filter types first
+        if restypefilter:
+            res = []
+            for r in results:
+                if r.type in restypefilter:
+                    res.append(r)
+        else:
+            res = results
+        # filter on count
+        resgroup = res[start:end]
+	# new total count (because of filter)
+        rescnt = len(res)
+
+        return (resgroup, rescnt)
+    
 
     #
     # Web page stuff
@@ -185,7 +208,7 @@ class OSAS_search(SimpleItem):
         return pt()
 
 
-    def search(self, searchstring=None, searchtype='startswith', start=1, count=10):
+    def search(self, searchstring=None, searchtype='startswith', start=1, count=10, restypefilter=None):
         """search and create result"""
         sres = int(start) -1
         lres = sres + count
@@ -202,18 +225,26 @@ class OSAS_search(SimpleItem):
             
         if not oldsearch or searchstring != oldsearch or searchtype != oldtype:
             # new search
-            res = self.dbSearch(searchstring, searchtype)
+            (res, restypes) = self.dbSearch(searchstring, searchtype)
             # sort the result
             res.sort(ranksort)
             # store it
             self.REQUEST.SESSION['results'] = res
             self.REQUEST.SESSION['searchstring'] = searchstring
             self.REQUEST.SESSION['searchtype'] = searchtype
+            self.REQUEST.SESSION['resulttypes'] = restypes
 
-        self.REQUEST.SESSION['resultgroup'] = self.REQUEST.SESSION['results'][sres:lres]
-        self.REQUEST.SESSION['res_indexes'] = (sres+1, lres, len(self.REQUEST.SESSION['results']), int(count))
+        (resgroup, nres) = self.filterResults(self.REQUEST.SESSION['results'], sres, lres, restypefilter)
+        lres = min(lres, nres)
+        self.REQUEST.SESSION['resultgroup'] = resgroup
+        self.REQUEST.SESSION['res_indexes'] = (sres+1, lres, nres, int(count))
+        self.REQUEST.SESSION['res_type_filter'] = restypefilter
+        if nres > 0:
+            zpt = "zpt/searchResult.zpt"
+        else:
+            zpt = "zpt/searchResult_none.zpt"
             
-        pt=PageTemplateFile(os.path.join(package_home(globals()), "zpt/searchResult.zpt")).__of__(self)
+        pt=PageTemplateFile(os.path.join(package_home(globals()), zpt)).__of__(self)
         return pt()
 
 
@@ -240,7 +271,7 @@ class OSAS_search(SimpleItem):
         """returns if there are more results"""
         try:
             (first, last, total, count) = self.REQUEST.SESSION['res_indexes']
-            return (first < total)
+            return (first + count < total)
         except:
             return False
 
@@ -264,7 +295,8 @@ class OSAS_search(SimpleItem):
             if last > total:
                 last = total
         except:
-            print "OUCH: no next results: ", first, last, total, count
+            print "OUCH: no next results!"
+            return self.search()
 
         return self.search(start=first, count=count)
 
@@ -280,8 +312,8 @@ class OSAS_search(SimpleItem):
             if last < 1:
                 last = 1
         except:
-            print "OUCH: no prev results: ", first, last, total, count
-           
+            print "OUCH: no prev results!"
+            return self.search()           
 
         return self.search(start=first, count=count)
         
@@ -307,11 +339,20 @@ class SearchResult(SimpleItem):
 
     def __init__(self, type='unknown', file=None, url=None, content=None, rank=0):
         """init"""
+        # result type (e.g. "bib", "archim")
         self.type = type
+        # index file name
         self.file = file
-        self.url = url
-        self.urlabel = url
+        # url for result (list of pairs)
+        if url:
+            self.urls = url
+        else:
+            self.urls = []
+        # actual content (list of tuples)
         self.content = content
+        # document status (e.g. "online", "archive")
+        self.status = None
+        # result rank for presentation
         self.rank = rank
 
 class AnyResult(SearchResult):
@@ -319,26 +360,33 @@ class AnyResult(SearchResult):
 
     def __init__(self, zope, db_result, rank):
         """returns a catch-all type result"""
-        SearchResult.__init__(self, type='unknown')
+        SearchResult.__init__(self)
         #print "NEW ANY RESULT!"
-
+        self.type='unknown'
         self.zptFile = os.path.join(package_home(globals()), "zpt/searchResult_any.zpt")
         
-        (fileid, tagidx, tags, content) = db_result
-        self.hitTag = tags
+        (db_fileid, db_tagidx, db_tags, db_content) = db_result
+        self.hitTag = db_tags
 
         # get full info from db
-        self.fileinfo = zope.getDBFile(fileid)
+        self.fileinfo = zope.getDBFile(db_fileid)
         assert self.fileinfo
 
         items = {}
-        items[tags] = content
+        items[db_tags] = db_content
         self.content = items
         self.file = self.fileinfo[0]
-        self.url = ""
-        self.urlabel = self.file
+        self.status = statusForFile(self.file)
         self.rank = rank
 
+    def getContentList(self):
+        """returns content as list of tuples in preferred order"""
+        l = []
+        for k in self.content.keys():
+            l.append((k, self.content[k]))
+
+        return l
+
     def render(self, zope):
         """render this result object"""
         zope.REQUEST.SESSION['result'] = self
@@ -360,20 +408,19 @@ class MetaResult(AnyResult):
         self.metainfo = zope.getDBFileMeta(fileid)
         assert self.metainfo
         
-    def checkContext(self, tags, content):
-        """takes meta entry and sets url from context tags"""
+    def checkContext(self, tags, content, ctxurl):
+        """takes meta entry and updates url from context tags"""
         if tags.endswith('/context/link'):
             if content:
-                self.url = content            
+                #print "CTXlink: ", content
+                ctxurl[0] = content
             
         elif tags.endswith('/context/name'):
             if content:
-                self.urlabel = content
-
-        else:
-            return False
+                #print "CTXname: ", content
+                ctxurl[1] = content
 
-        return True
+        return ctxurl
 
 
 class BibResult(MetaResult):
@@ -382,21 +429,22 @@ class BibResult(MetaResult):
     def __init__(self, zope, db_result, rank):
         """constructor"""
         MetaResult.__init__(self, zope, db_result, rank)
-        #print "NEW BIB RESULT!"
+        #print "NEW BIB RESULT!", self
         self.type = "bib"
         self.zptFile = os.path.join(package_home(globals()), "zpt/searchResult_bib.zpt")
-        self.url = urlForFile(self.file)
-        self.urlabel = None
+        url = storageURL(self.file)
+        if url:
+            self.urls.append(url)
         (fileid, tagidx, tags, content) = db_result
 
         btype = ""
         bitems = {}
+        ctxurl = ['', '']
 
         for me in self.metainfo:
             (m_idx, m_tags, m_content, m_attributes) = me
             # context tag
-            if self.checkContext(m_tags, m_content):
-                continue
+            ctxurl = self.checkContext(m_tags, m_content, ctxurl)
             # first tag with bib type attribute
             if m_tags.endswith('/meta/bib'):
                 r = re.search('type="([^"]*)"', m_attributes)
@@ -418,12 +466,38 @@ class BibResult(MetaResult):
                 k = r.group(1)
                 #print "CONTENT: ", m_content
                 bitems[k] = m_content
+                # remember hit tag
+                if m_tags == self.hitTag:
+                    self.hitTag = k
                 continue
 
         self.content = bitems
+        # store context
+        if not ctxurl[1]:
+            ctxurl[1] = "View"
+        # must have link
+        if ctxurl[0]:
+            self.urls.append(ctxurl)
+                
         self.rank += 100
-        if not self.urlabel and self.url:
-            self.urlabel = "view"
+
+    def getContentList(self):
+        """returns content as list of tuples in preferred order"""
+        l = []
+        c = self.content.copy()
+        # preferred items first
+        for k in ('author', 'title', 'journal', 'year'):
+            if c.has_key(k):
+                l.append((k, c[k]))
+                del c[k]
+
+        # no type
+        del c['type']
+        # copy the rest
+        for k in c.keys():
+            l.append((k, c[k]))
+
+        return l
 
 
 class ArchimResult(MetaResult):
@@ -432,32 +506,58 @@ class ArchimResult(MetaResult):
     def __init__(self, zope, db_result, rank):
         """constructor"""
         MetaResult.__init__(self, zope, db_result, rank)
-        #print "NEW ARCHIM RESULT!"
+        #print "NEW ARCHIM RESULT!", self
         self.type = "archim"
         self.zptFile = os.path.join(package_home(globals()), "zpt/searchResult_archim.zpt")
-        self.url = urlForFile(self.file)
-        self.urlabel = None
+        url = storageURL(self.file)
+        if url:
+            self.urls.append(url)
+            
         (fileid, tagidx, tags, content) = db_result
 
         # process info
         bitems = {}
+        ctxurl = ['', '']
         for me in self.metainfo:
             (m_idx, m_tags, m_content, m_attributes) = me
             # context tag
-            if self.checkContext(m_tags, m_content):
-                continue
+            ctxurl = self.checkContext(m_tags, m_content, ctxurl)
             # collect archimedes/something
             r = re.search('/meta/archimedes/(.*)', m_tags)
             if r:
                 k = r.group(1)
                 #print "CONTENT: ", m_content
                 bitems[k] = m_content
+                # remember hit tag
+                if m_tags == self.hitTag:
+                    self.hitTag = k
                 continue
 
         self.content = bitems
         self.rank += 100
-        if not self.urlabel and self.url:
-            self.urlabel = "view"
+        # store context
+        if not ctxurl[1]:
+            ctxurl[1] = "View"
+        # must have link
+        if ctxurl[0]:
+            self.urls.append(ctxurl)
+
+
+    def getContentList(self):
+        """returns content as list of tuples in preferred order"""
+        l = []
+        c = self.content.copy()
+        # preferred items first
+        for k in ('author', 'title', 'date', 'place'):
+            if c.has_key(k):
+                l.append((k, c[k]))
+                del c[k]
+
+        # copy the rest
+        for k in c.keys():
+            l.append((k, c[k]))
+
+        return l
 	
 
 
@@ -467,13 +567,31 @@ def ranksort(res1, res2):
     return cmp(res2.rank, res1.rank)
 
 
-def urlForFile(filename):
+def statusForFile(filename):
+    """heuristic... returns status for a index file name"""
+    status = None
+    if filename.startswith('/mpiwg/online/'):
+        status = "online"
+    elif filename.startswith('/mpiwg/archive/'):
+        status = "archive"
+    elif filename.startswith('http://'):
+        status = "database"
+        
+    return status
+
+def storageURL(filename):
     """heuristic... returns an URL for a index file name"""
     url = None
+    name = None
     if filename.startswith('/mpiwg/online/'):
-        print "URLFORFILE: online ", filename
-        r = re.search('/mpiwg/online/(.*)/index.meta', filename)
+        #print "URLFORFILE: online ", filename
+        r = re.search('^(.*)/index.meta', filename)
         if r:
-            url = "http://nausikaa.mpiwg-berlin.mpg.de/digitallibrary/digilib.jsp?fn=%s"%r.group(1)
+            url = "http://content.mpiwg-berlin.mpg.de/mpistorage/storage/ShowOnline/index_html?path=%s"%r.group(1)
+            name = "Storage System"
+
+    if name and url:
+        return (url, name)
+    
+    return None
 
-    return url