-
Notifications
You must be signed in to change notification settings - Fork 339
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
enhance: [2.5][cp] add search iterator v2 (#2524)
pr: #2395 issue: milvus-io/milvus#37548 Signed-off-by: Patrick Weizhi Xu <[email protected]> (cherry picked from commit 3ce4ac0)
- Loading branch information
Showing
6 changed files
with
259 additions
and
3 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,149 @@ | ||
import logging | ||
from copy import deepcopy | ||
from typing import Dict, List, Optional, Union | ||
|
||
from pymilvus.client import entity_helper, utils | ||
from pymilvus.client.abstract import Hits | ||
from pymilvus.client.constants import ( | ||
GUARANTEE_TIMESTAMP, | ||
ITER_SEARCH_BATCH_SIZE_KEY, | ||
ITER_SEARCH_ID_KEY, | ||
ITER_SEARCH_LAST_BOUND_KEY, | ||
ITER_SEARCH_V2_KEY, | ||
ITERATOR_FIELD, | ||
) | ||
from pymilvus.exceptions import ExceptionsMessage, ParamError, ServerVersionIncompatibleException | ||
from pymilvus.orm.connections import Connections | ||
from pymilvus.orm.constants import MAX_BATCH_SIZE, MILVUS_LIMIT, OFFSET | ||
from pymilvus.orm.iterator import SearchPage, fall_back_to_latest_session_ts | ||
|
||
# Module-level logger named after this module; the iterator uses it to warn
# when it has to fall back to a client-side guarantee timestamp.
logger = logging.getLogger(__name__) | ||
|
||
|
||
class SearchIteratorV2:
    """Page through the results of a single-vector search, one batch per ``next()``.

    Every ``next()`` call issues one ``connection.search(...)`` request whose
    ``limit`` is the batch size. The iterator token, the last bound and the
    guarantee timestamp reported by the server are written back into the
    request parameters so that the following call continues from where the
    previous one stopped.

    The constructor eagerly performs the first search. That first page is kept
    and handed out by the first user-visible ``next()`` call; doing the request
    up front lets construction fail immediately when the server cannot serve
    the V2 iterator protocol.
    """

    # for compatibility, save the first result during init
    _saved_first_res = None
    _is_saved = False
    # for compatibility, track the number of total results left
    # (``None`` means "no overall cap")
    _left_res_cnt = None

    def __init__(
        self,
        connection: Connections,
        collection_name: str,
        data: Union[List, utils.SparseMatrixInputType],
        batch_size: int = 1000,
        filter: Optional[str] = None,
        output_fields: Optional[List[str]] = None,
        search_params: Optional[Dict] = None,
        timeout: Optional[float] = None,
        partition_names: Optional[List[str]] = None,
        anns_field: Optional[str] = None,
        round_decimal: Optional[int] = -1,
        **kwargs,
    ):
        """Validate the arguments, build the request and fetch the first page.

        Args:
            connection: object whose ``search(**params)`` method runs the query.
            collection_name: collection to search.
            data: the query vector; exactly one row is accepted.
            batch_size: number of hits requested per ``next()`` call.
            filter: optional filter expression, sent as ``expression``.
            output_fields: optional fields to return with each hit.
            search_params: optional search parameters; deep-copied so the
                caller's dict is never mutated by the iterator.
            timeout: optional timeout forwarded to every search request.
            partition_names: optional partitions to restrict the search to.
            anns_field: optional vector field name.
            round_decimal: forwarded unchanged to the search request.
            **kwargs: extra request parameters. A ``limit`` entry is removed
                and used as an overall cap on the number of returned hits.

        Raises:
            ParamError: if ``batch_size``, ``offset`` or ``data`` is invalid.
            ServerVersionIncompatibleException: if the first response carries
                no iterator token.
        """
        self._check_params(batch_size, data, kwargs)

        # for compatibility, delete limit from incoming kwargs and keep it as
        # a client-side cap. ``None`` and negative values mean "no cap":
        # storing a negative number would make the very first next() report
        # exhaustion without ever contacting the server.
        # NOTE(review): pymilvus appears to use -1 as its "unlimited"
        # sentinel elsewhere - confirm against the callers.
        total_limit = kwargs.pop(MILVUS_LIMIT, None)
        if total_limit is not None and total_limit >= 0:
            self._left_res_cnt = total_limit

        self._conn = connection
        self._params = {
            "collection_name": collection_name,
            "data": data,
            "anns_field": anns_field,
            "param": deepcopy(search_params),
            "limit": batch_size,
            "expression": filter,
            "partition_names": partition_names,
            "output_fields": output_fields,
            "timeout": timeout,
            "round_decimal": round_decimal,
            ITERATOR_FIELD: True,
            ITER_SEARCH_V2_KEY: True,
            ITER_SEARCH_BATCH_SIZE_KEY: batch_size,
            GUARANTEE_TIMESTAMP: 0,
            **kwargs,
        }
        # this raises MilvusException if the server does not support V2
        self._saved_first_res = self.next()
        self._is_saved = True

    def next(self):
        """Return the next ``SearchPage``; an empty page signals exhaustion.

        Raises:
            ServerVersionIncompatibleException: if no iterator token has been
                stored yet and the response does not provide one.
        """
        # for compatibility: the page fetched during __init__ goes out first
        if self._is_saved:
            self._is_saved = False
            first_page = self._saved_first_res
            # release the reference so the page is not kept alive needlessly
            self._saved_first_res = None
            return first_page

        if self._left_res_cnt is not None and self._left_res_cnt <= 0:
            return SearchPage(None)

        res = self._conn.search(**self._params)
        iter_info = res.get_search_iterator_v2_results_info()
        self._params[ITER_SEARCH_LAST_BOUND_KEY] = iter_info.last_bound

        # patch token and guarantee timestamp for the first next() call
        if ITER_SEARCH_ID_KEY not in self._params:
            if iter_info.token is None or iter_info.token == "":
                raise ServerVersionIncompatibleException(
                    message=ExceptionsMessage.SearchIteratorV2FallbackWarning
                )
            self._params[ITER_SEARCH_ID_KEY] = iter_info.token

        if self._params[GUARANTEE_TIMESTAMP] <= 0:
            session_ts = res.get_session_ts()
            if session_ts > 0:
                self._params[GUARANTEE_TIMESTAMP] = session_ts
            else:
                logger.warning(
                    "failed to set up mvccTs from milvus server, use client-side ts instead"
                )
                self._params[GUARANTEE_TIMESTAMP] = fall_back_to_latest_session_ts()

        # return SearchPage for compatibility
        if len(res) > 0:
            return self._wrap_return_res(res[0])
        return SearchPage(None)

    def close(self):
        """Do nothing; present so callers can close the iterator uniformly."""

    def _check_params(
        self,
        batch_size: int,
        data: Union[List, utils.SparseMatrixInputType],
        kwargs: Dict,
    ):
        """Reject arguments the V2 iterator cannot handle.

        Raises:
            ParamError: if ``batch_size`` is negative or above
                ``MAX_BATCH_SIZE``, if a non-zero offset is supplied, or if
                ``data`` does not hold exactly one query vector.
        """
        # metric_type can be empty, deduced at server side
        # anns_field can be empty, deduced at server side

        # check batch size
        if batch_size < 0:
            raise ParamError(message="batch size cannot be less than zero")
        if batch_size > MAX_BATCH_SIZE:
            raise ParamError(message=f"batch size cannot be larger than {MAX_BATCH_SIZE}")

        # check offset
        if kwargs.get(OFFSET, 0) != 0:
            raise ParamError(message="Offset is not supported for search_iterator_v2")

        # check num queries, heavy to check at server side
        rows = entity_helper.get_input_num_rows(data)
        if rows > 1:
            raise ParamError(
                message="search_iterator_v2 does not support processing multiple vectors simultaneously"
            )
        if rows == 0:
            raise ParamError(message="The vector data for search cannot be empty")

    def _wrap_return_res(self, res: Hits) -> SearchPage:
        """Wrap ``res`` in a ``SearchPage``, trimming it to the remaining cap."""
        if self._left_res_cnt is None:
            return SearchPage(res)

        # When we have a limit, ensure we don't return more results than
        # requested, and keep the counter at zero instead of letting it go
        # negative so it always reflects the number of results still allowed.
        cur_len = len(res)
        if cur_len > self._left_res_cnt:
            res = res[: self._left_res_cnt]
            self._left_res_cnt = 0
        else:
            self._left_res_cnt -= cur_len
        return SearchPage(res)
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters