Commit 0ece22d9 authored by Toby Dickenson's avatar Toby Dickenson

merged toby-catalog-optimise-branch; collector 304; three easy optimisations for indexed searches

parent 69f6f129
...@@ -54,6 +54,8 @@ Zope Changes ...@@ -54,6 +54,8 @@ Zope Changes
- STXNG: added new env. variable STX_DEFAULT_LEVEL to change - STXNG: added new env. variable STX_DEFAULT_LEVEL to change
the default level for <Hx> elements (see doc/ENVIRONMENT.txt) the default level for <Hx> elements (see doc/ENVIRONMENT.txt)
- Collector #304: several catalog optimisations
Bugs: Bugs:
- Fixed PropertyManager/PropertySheets so that you can safely add a - Fixed PropertyManager/PropertySheets so that you can safely add a
......
...@@ -480,16 +480,7 @@ class Catalog(Persistent, Acquisition.Implicit, ExtensionClass.Base): ...@@ -480,16 +480,7 @@ class Catalog(Persistent, Acquisition.Implicit, ExtensionClass.Base):
rs=data.items() rs=data.items()
append(LazyMap(self.instantiate, rs, len(self))) append(LazyMap(self.instantiate, rs, len(self)))
else: else:
try: self._build_sorted_results(data,sort_index,append)
for k, intset in sort_index.items():
if hasattr(intset, 'keys'): intset=intset.keys()
append((k,LazyMap(self.__getitem__, intset)))
except AttributeError:
raise ValueError, (
"Incorrect index name passed as"
" 'sort_on' parameter. Note that you may only"
" sort on values for which there is a matching"
" index available.")
elif rs: elif rs:
# this is reached by having an empty result set (ie non-None) # this is reached by having an empty result set (ie non-None)
if sort_index is None and hasattr(rs, 'values'): if sort_index is None and hasattr(rs, 'values'):
...@@ -513,6 +504,19 @@ class Catalog(Persistent, Acquisition.Implicit, ExtensionClass.Base): ...@@ -513,6 +504,19 @@ class Catalog(Persistent, Acquisition.Implicit, ExtensionClass.Base):
# reached, therefor 'sort-on' does not happen in the # reached, therefor 'sort-on' does not happen in the
# context of text index query. This should probably # context of text index query. This should probably
# sort by relevance first, then the 'sort-on' attribute. # sort by relevance first, then the 'sort-on' attribute.
self._build_sorted_results(rs,sort_index,append)
return used
def _build_sorted_results(self,rs,sort_index,append):
# The two 'for' loops in here contribute a significant
# proportion of the time to perform an indexed search.
# Try to avoid all non-local attribute lookup inside
# those loops.
_lazymap = LazyMap
_intersection = intersection
_self__getitem__ = self.__getitem__
_None = None
if ((len(rs) / 4) > len(sort_index)): if ((len(rs) / 4) > len(sort_index)):
# if the sorted index has a quarter as many keys as # if the sorted index has a quarter as many keys as
# the result set # the result set
...@@ -523,17 +527,23 @@ class Catalog(Persistent, Acquisition.Implicit, ExtensionClass.Base): ...@@ -523,17 +527,23 @@ class Catalog(Persistent, Acquisition.Implicit, ExtensionClass.Base):
# This only makes sense if the number of # This only makes sense if the number of
# keys is much less then the number of results. # keys is much less then the number of results.
intset = intersection(rs, intset) intset = _intersection(rs, intset)
if intset: if intset:
if hasattr(intset, 'keys'): intset=intset.keys() keys = getattr(intset,'keys',_None)
append((k,LazyMap(self.__getitem__, intset))) if keys is not _None:
# Is this ever true?
intset = keys()
append((k,_lazymap(_self__getitem__, intset)))
else: else:
if hasattr(rs, 'keys'): rs=rs.keys() if hasattr(rs, 'keys'): rs=rs.keys()
_sort_index_keyForDocument = sort_index.keyForDocument
_keyerror = KeyError
for did in rs: for did in rs:
append((sort_index.keyForDocument(did), try:
LazyMap(self.__getitem__,[did]))) append((_sort_index_keyForDocument(did),
_lazymap(_self__getitem__,[did])))
return used except _keyerror:
pass
def searchResults(self, REQUEST=None, used=None, **kw): def searchResults(self, REQUEST=None, used=None, **kw):
...@@ -595,7 +605,7 @@ class Catalog(Persistent, Acquisition.Implicit, ExtensionClass.Base): ...@@ -595,7 +605,7 @@ class Catalog(Persistent, Acquisition.Implicit, ExtensionClass.Base):
so.lower() in ('reverse', 'descending')): so.lower() in ('reverse', 'descending')):
r.reverse() r.reverse()
r=map(lambda i: i[1], r) r= [i[1] for i in r]
r=LazyCat(r, reduce(lambda x,y: x+len(y), r, 0)) r=LazyCat(r, reduce(lambda x,y: x+len(y), r, 0))
return r return r
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment