diff --git a/benchmarks/perf-tool/README.md b/benchmarks/perf-tool/README.md
index eb4ac0dc1..239563e22 100644
--- a/benchmarks/perf-tool/README.md
+++ b/benchmarks/perf-tool/README.md
@@ -229,6 +229,29 @@ Ingests a dataset of vectors into the cluster.
| ----------- | ----------- | ----------- |
| took | Total time to ingest the dataset into the index.| ms |
+
+#### ingest_extended
+
+Ingests a dataset with multiple context types (for example, vectors plus an additional attributes dataset) into the cluster.
+
+##### Parameters
+
+| Parameter Name | Description | Default |
+| ----------- |--------------------------------------------------------------------------------------------------------------------------------------------------------------| ----------- |
+| index_name | Name of index to ingest into | No default |
+| field_name | Name of field to ingest into | No default |
+| bulk_size | Documents per bulk request | 300 |
+| dataset_format | Format the data-set is in. Currently hdf5 and bigann are supported. The hdf5 file must be organized in the same way that the ann-benchmarks organizes theirs. | 'hdf5' |
+| dataset_path | Path to data-set | No default |
+| doc_count | Number of documents to create from data-set | Size of the data-set |
+| attributes_dataset_name | Name of dataset with additional attributes inside the main dataset | No default |
+| attribute_spec | Definition of attributes, format is: [{id: [id_val], name: [name_val], type: [type_val]}] | No default |
+
+##### Metrics
+
+| Metric Name | Description | Unit |
+| ----------- | ----------- | ----------- |
+| took | Total time to ingest the dataset into the index.| ms |
+
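+Below is a minimal `ingest_extended` step definition, taken from the bundled
+`sample-configs/lucene-sift-hnsw-filter/test.yml` (index, field, and dataset names are specific to that sample):
+
+```yaml
+  - name: ingest_extended
+    index_name: target_index
+    field_name: target_field
+    bulk_size: 500
+    dataset_format: hdf5
+    dataset_path: ../dataset/sift-128-euclidean-with-attr.hdf5
+    attributes_dataset_name: attributes
+    attribute_spec: [ { id: 0, name: 'color', type: 'str' }, { id: 1, name: 'taste', type: 'str' }, { id: 2, name: 'age', type: 'int' } ]
+```
+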
#### query
Runs a set of queries against an index.
@@ -257,6 +280,60 @@ Runs a set of queries against an index.
| recall@R | ratio of top R results from the ground truth neighbors that are in the K results returned by the plugin | float 0.0-1.0 |
| recall@K | ratio of results returned that were ground truth nearest neighbors | float 0.0-1.0 |
+
+#### query_with_filter
+
+Runs a set of queries with a filter against an index.
+
+##### Parameters
+
+| Parameter Name | Description | Default |
+| ----------- |---------------------------------------------------------------------------------------------------------------------------------------------------------------------------|----------------------|
+| k | Number of neighbors to return on search | 100 |
+| r | r value in Recall@R | 1 |
+| index_name | Name of index to search | No default |
+| field_name | Name of field to search | No default |
+| calculate_recall | Whether to calculate recall values | False |
+| dataset_format | Format the dataset is in. Currently hdf5 and bigann are supported. The hdf5 file must be organized in the same way that the ann-benchmarks organizes theirs. | 'hdf5' |
+| dataset_path | Path to dataset | No default |
+| neighbors_format | Format the neighbors dataset is in. Currently hdf5 and bigann are supported. The hdf5 file must be organized in the same way that the ann-benchmarks organizes theirs. | 'hdf5' |
+| neighbors_path | Path to neighbors dataset | No default |
+| neighbors_dataset | Name of filter dataset inside the neighbors dataset | No default |
+| filter_spec | Path to filter specification | No default |
+| filter_type | Type of filter format. Supported types: FILTER - inner filter format for approximate k-NN search; SCRIPT - score script style with exact k-NN search | SCRIPT |
+| score_script_similarity | Similarity function that was used to index the dataset. Used for the SCRIPT filter type and ignored for others | l2 |
+| query_count | Number of queries to create from data-set | Size of the data-set |
+
+##### Metrics
+
+| Metric Name | Description | Unit |
+| ----------- | ----------- | ----------- |
+| took | Took times returned per query aggregated as total, p50, p90 and p99 (when applicable) | ms |
+| memory_kb | Native memory k-NN is using at the end of the query workload | KB |
+| recall@R | ratio of top R results from the ground truth neighbors that are in the K results returned by the plugin | float 0.0-1.0 |
+| recall@K | ratio of results returned that were ground truth nearest neighbors | float 0.0-1.0 |
+
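+A matching `query_with_filter` step definition, also taken from the bundled
+`sample-configs/lucene-sift-hnsw-filter/test.yml`; `filter_type` is added here for illustration (it defaults to SCRIPT
+when omitted):
+
+```yaml
+  - name: query_with_filter
+    k: 10
+    r: 1
+    calculate_recall: true
+    index_name: target_index
+    field_name: target_field
+    dataset_format: hdf5
+    dataset_path: ../dataset/sift-128-euclidean-with-attr.hdf5
+    neighbors_format: hdf5
+    neighbors_path: ../dataset/sift-128-euclidean-with-attr-with-filters.hdf5
+    neighbors_dataset: neighbors_filter_1
+    filter_spec: sample-configs/filter-spec/filter-1-spec.json
+    filter_type: FILTER
+    query_count: 100
+```
+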
+### Data sets
+
+This benchmark tool uses pre-generated data sets to run indexing and query workloads. For some benchmark types an existing
+dataset needs to be extended; filtering is one use case where such a dataset extension is needed.
+
+You can use the script provided with this repo to generate the dataset and run benchmarks for filtering queries.
+You need an existing dataset with vector data. That dataset is used to generate additional attribute data and sets of ground truth neighbor document ids.
+
+To generate a dataset with attributes from a vectors-only dataset, use the following command pattern:
+
+```commandline
+python add-filters-to-dataset.py <path_to_input_dataset> <path_to_output_dataset> True False
+```
+
+To generate neighbors datasets for different filters from the dataset with attributes, use the following command pattern:
+
+```commandline
+python add-filters-to-dataset.py <path_to_input_dataset> <path_to_output_dataset> False True
+```
+
+After that, the new dataset(s) can be referenced from the test case definition in `ingest_extended` and `query_with_filter` steps.
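+
+The first pass adds an `attributes` dataset to the output file; the second pass writes ground truth datasets named
+`neighbors_filter_1` through `neighbors_filter_5`, one for each filter predefined in the script. Use these names for the
+`attributes_dataset_name` and `neighbors_dataset` parameters, as shown in the step examples above.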
+
## Contributing
### Linting
diff --git a/benchmarks/perf-tool/add-filters-to-dataset.py b/benchmarks/perf-tool/add-filters-to-dataset.py
new file mode 100644
index 000000000..3e02a0d0b
--- /dev/null
+++ b/benchmarks/perf-tool/add-filters-to-dataset.py
@@ -0,0 +1,172 @@
+import getopt
+import os
+import random
+import sys
+
+import h5py
+
+from osb.extensions.data_set import Context, HDF5DataSet
+
+"""
+Script builds a complex dataset with additional attributes from an existing dataset that has only vectors.
+Additional attributes are predefined in the script: color, taste, age. Only the HDF5 format of vector dataset is supported.
+
+The script generates an additional dataset of neighbors (ground truth) for each filter type.
+
+Example of usage:
+
+ create new hdf5 file with attribute dataset
+ add-filters-to-dataset.py ~/dev/opensearch/k-NN/benchmarks/perf-tool/dataset/data.hdf5 ~/dev/opensearch/datasets/data-with-attr True False
+
+ create new hdf5 file with filter datasets
+ add-filters-to-dataset.py ~/dev/opensearch/k-NN/benchmarks/perf-tool/dataset/data-with-attr.hdf5 ~/dev/opensearch/datasets/data-with-filters False True
+"""
+
+class Dataset():
+ DEFAULT_INDEX_NAME = "test-index"
+ DEFAULT_FIELD_NAME = "test-field"
+ DEFAULT_CONTEXT = Context.INDEX
+ DEFAULT_TYPE = HDF5DataSet.FORMAT_NAME
+ DEFAULT_NUM_VECTORS = 10
+ DEFAULT_DIMENSION = 10
+ DEFAULT_RANDOM_STRING_LENGTH = 8
+
+    def create_dataset(self, source_dataset_path, out_file_path, generate_attrs: bool, generate_filters: bool) -> None:
+ path_elements = os.path.split(os.path.abspath(source_dataset_path))
+ data_set_dir = path_elements[0]
+
+        # For HDF5, multiple data sets can be grouped in the same file; the
+        # generated data sets are written through h5py file handles and flushed at the end
+ # read existing dataset
+        data_hdf5 = os.path.abspath(source_dataset_path)
+
+ with h5py.File(data_hdf5, "r") as hf:
+
+ if generate_attrs:
+ data_set_w_attr = self.create_dataset_file(out_file_path, self.DEFAULT_TYPE, data_set_dir)
+
+ possible_colors = ['red', 'green', 'yellow', 'blue', None]
+ possible_tastes = ['sweet', 'salty', 'sour', 'bitter', None]
+ max_age = 100
+
+ for key in hf.keys():
+ if key not in ['neighbors', 'test', 'train']:
+ continue
+ data_set_w_attr.create_dataset(key, data=hf[key][()])
+
+ attributes = []
+ for i in range(len(hf['train'])):
+                    attr = [random.choice(possible_colors), random.choice(possible_tastes),
+                            random.randint(0, max_age)]  # randint is inclusive of both endpoints
+ attributes.append(attr)
+
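+                # 'S10' stores each attribute as a fixed-width byte string; a missing
+                # value (None) is therefore serialized as b'None', which is why the
+                # filter functions below compare against the decoded string 'None'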
+ data_set_w_attr.create_dataset('attributes', (len(attributes), 3), 'S10', data=attributes)
+
+ data_set_w_attr.flush()
+ data_set_w_attr.close()
+
+ if generate_filters:
+ attributes = hf['attributes'][()]
+ expected_neighbors = hf['neighbors'][()]
+
+ data_set_filters = self.create_dataset_file(out_file_path, self.DEFAULT_TYPE, data_set_dir)
+
+                def filter1(attributes, vector_idx):
+                    # filter 1 - color is red and age is >= 20
+                    return attributes[vector_idx][0].decode() == 'red' \
+                           and int(attributes[vector_idx][2].decode()) >= 20
+
+ self.apply_filter(expected_neighbors, attributes, data_set_filters, 'neighbors_filter_1', filter1)
+
+ # filter 2 - color = blue or None and taste = 'salty'
+                def filter2(attributes, vector_idx):
+                    color = attributes[vector_idx][0].decode()
+                    taste = attributes[vector_idx][1].decode()
+                    return (color == 'blue' or color == 'None') and taste == 'salty'
+
+ self.apply_filter(expected_neighbors, attributes, data_set_filters, 'neighbors_filter_2', filter2)
+
+ # filter 3 - color and taste are not None and age is between 20 and 80
+                def filter3(attributes, vector_idx):
+                    color = attributes[vector_idx][0].decode()
+                    taste = attributes[vector_idx][1].decode()
+                    age = int(attributes[vector_idx][2].decode())
+                    return color != 'None' and taste != 'None' and 20 <= age <= 80
+
+ self.apply_filter(expected_neighbors, attributes, data_set_filters, 'neighbors_filter_3', filter3)
+
+                # filter 4 - color is green or blue, taste is bitter, and age is between 30 and 60 inclusive
+                def filter4(attributes, vector_idx):
+                    color = attributes[vector_idx][0].decode()
+                    taste = attributes[vector_idx][1].decode()
+                    age = int(attributes[vector_idx][2].decode())
+                    return (color == 'green' or color == 'blue') and taste == 'bitter' and 30 <= age <= 60
+
+ self.apply_filter(expected_neighbors, attributes, data_set_filters, 'neighbors_filter_4', filter4)
+
+                # filter 5 - color is green, blue, or yellow, or taste is sweet, or age is between 30 and 70 inclusive
+                def filter5(attributes, vector_idx):
+                    color = attributes[vector_idx][0].decode()
+                    taste = attributes[vector_idx][1].decode()
+                    age = int(attributes[vector_idx][2].decode())
+                    return color in ('green', 'blue', 'yellow') or taste == 'sweet' or 30 <= age <= 70
+
+ self.apply_filter(expected_neighbors, attributes, data_set_filters, 'neighbors_filter_5', filter5)
+
+ data_set_filters.flush()
+ data_set_filters.close()
+
+ def apply_filter(self, expected_neighbors, attributes, data_set_w_filtering, filter_name, filter_func):
+ neighbors_filter = []
+ filtered_count = 0
+ for expected_neighbors_row in expected_neighbors:
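+            # pad with -1 so every row keeps its original length; -1 marks a ground
+            # truth neighbor that does not pass this filter (recall_at_r discards it)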
+ neighbors_filter_row = [-1] * len(expected_neighbors_row)
+ idx = 0
+ for vector_idx in expected_neighbors_row:
+ if filter_func(attributes, vector_idx):
+ neighbors_filter_row[idx] = vector_idx
+ idx += 1
+ filtered_count += 1
+ neighbors_filter.append(neighbors_filter_row)
+ overall_count = len(expected_neighbors) * len(expected_neighbors[0])
+ perc = float(filtered_count/overall_count) * 100
+ print('ground truth size for {} is {}, percentage {}'.format(filter_name, filtered_count, perc))
+ data_set_w_filtering.create_dataset(filter_name, data=neighbors_filter)
+ return expected_neighbors
+
+ def create_dataset_file(self, file_name, extension, data_set_dir) -> h5py.File:
+ data_set_file_name = "{}.{}".format(file_name, extension)
+ data_set_path = os.path.join(data_set_dir, data_set_file_name)
+
+ data_set_w_filtering = h5py.File(data_set_path, 'a')
+
+ return data_set_w_filtering
+
+
+def main(argv):
+    opts, args = getopt.getopt(argv, "")
+    if len(args) != 4:
+        raise SystemExit('Usage: add-filters-to-dataset.py <in_file_path> <out_file_path> '
+                         '<generate_attrs> <generate_filters>')
+    in_file_path = args[0]
+    out_file_path = args[1]
+    generate_attr = str2bool(args[2])
+    generate_filters = str2bool(args[3])
+
+ worker = Dataset()
+    worker.create_dataset(in_file_path, out_file_path, generate_attr, generate_filters)
+
+def str2bool(v):
+ return v.lower() in ("yes", "true", "t", "1")
+
+if __name__ == "__main__":
+ main(sys.argv[1:])
+
diff --git a/benchmarks/perf-tool/dataset/data-with-attr-with-filters.hdf5 b/benchmarks/perf-tool/dataset/data-with-attr-with-filters.hdf5
new file mode 100644
index 000000000..01df75f83
Binary files /dev/null and b/benchmarks/perf-tool/dataset/data-with-attr-with-filters.hdf5 differ
diff --git a/benchmarks/perf-tool/dataset/data-with-attr.hdf5 b/benchmarks/perf-tool/dataset/data-with-attr.hdf5
new file mode 100644
index 000000000..22873b06c
Binary files /dev/null and b/benchmarks/perf-tool/dataset/data-with-attr.hdf5 differ
diff --git a/benchmarks/perf-tool/okpt/io/config/parsers/util.py b/benchmarks/perf-tool/okpt/io/config/parsers/util.py
index cecb9f2d0..454fec5a0 100644
--- a/benchmarks/perf-tool/okpt/io/config/parsers/util.py
+++ b/benchmarks/perf-tool/okpt/io/config/parsers/util.py
@@ -13,9 +13,9 @@
def parse_dataset(dataset_format: str, dataset_path: str,
- context: Context) -> DataSet:
+ context: Context, custom_context=None) -> DataSet:
if dataset_format == 'hdf5':
- return HDF5DataSet(dataset_path, context)
+ return HDF5DataSet(dataset_path, context, custom_context)
if dataset_format == 'bigann' and context == Context.NEIGHBORS:
return BigANNNeighborDataSet(dataset_path)
diff --git a/benchmarks/perf-tool/okpt/io/dataset.py b/benchmarks/perf-tool/okpt/io/dataset.py
index 4f8bc22a2..001563bab 100644
--- a/benchmarks/perf-tool/okpt/io/dataset.py
+++ b/benchmarks/perf-tool/okpt/io/dataset.py
@@ -34,6 +34,7 @@ class Context(Enum):
INDEX = 1
QUERY = 2
NEIGHBORS = 3
+ CUSTOM = 4
class DataSet(ABC):
@@ -64,9 +65,9 @@ class HDF5DataSet(DataSet):
`_
"""
- def __init__(self, dataset_path: str, context: Context):
+ def __init__(self, dataset_path: str, context: Context, custom_context=None):
file = h5py.File(dataset_path)
- self.data = cast(h5py.Dataset, file[self._parse_context(context)])
+ self.data = cast(h5py.Dataset, file[self._parse_context(context, custom_context)])
self.current = 0
def read(self, chunk_size: int):
@@ -88,7 +89,7 @@ def reset(self):
self.current = 0
@staticmethod
- def _parse_context(context: Context) -> str:
+ def _parse_context(context: Context, custom_context=None) -> str:
if context == Context.NEIGHBORS:
return "neighbors"
@@ -98,6 +99,9 @@ def _parse_context(context: Context) -> str:
if context == Context.QUERY:
return "test"
+ if context == Context.CUSTOM:
+ return custom_context
+
raise Exception("Unsupported context")
diff --git a/benchmarks/perf-tool/okpt/test/steps/factory.py b/benchmarks/perf-tool/okpt/test/steps/factory.py
index 2b7bcc68d..5073b838d 100644
--- a/benchmarks/perf-tool/okpt/test/steps/factory.py
+++ b/benchmarks/perf-tool/okpt/test/steps/factory.py
@@ -9,7 +9,7 @@
from okpt.test.steps.base import Step, StepConfig
from okpt.test.steps.steps import CreateIndexStep, DisableRefreshStep, RefreshIndexStep, DeleteIndexStep, \
- TrainModelStep, DeleteModelStep, ForceMergeStep, ClearCacheStep, IngestStep, QueryStep
+ TrainModelStep, DeleteModelStep, ForceMergeStep, ClearCacheStep, IngestStep, IngestStepExtended, QueryStep, QueryWithFilterStep
def create_step(step_config: StepConfig) -> Step:
@@ -27,8 +27,12 @@ def create_step(step_config: StepConfig) -> Step:
return DeleteIndexStep(step_config)
elif step_config.step_name == IngestStep.label:
return IngestStep(step_config)
+ elif step_config.step_name == IngestStepExtended.label:
+ return IngestStepExtended(step_config)
elif step_config.step_name == QueryStep.label:
return QueryStep(step_config)
+ elif step_config.step_name == QueryWithFilterStep.label:
+ return QueryWithFilterStep(step_config)
elif step_config.step_name == ForceMergeStep.label:
return ForceMergeStep(step_config)
elif step_config.step_name == ClearCacheStep.label:
diff --git a/benchmarks/perf-tool/okpt/test/steps/steps.py b/benchmarks/perf-tool/okpt/test/steps/steps.py
index b61781a6e..2fc35ca2d 100644
--- a/benchmarks/perf-tool/okpt/test/steps/steps.py
+++ b/benchmarks/perf-tool/okpt/test/steps/steps.py
@@ -18,7 +18,7 @@
from opensearchpy import OpenSearch, RequestsHttpConnection
from okpt.io.config.parsers.base import ConfigurationError
-from okpt.io.config.parsers.util import parse_string_param, parse_int_param, parse_dataset, parse_bool_param
+from okpt.io.config.parsers.util import parse_string_param, parse_int_param, parse_dataset, parse_bool_param, parse_list_param
from okpt.io.dataset import Context
from okpt.io.utils.reader import parse_json_from_path
from okpt.test.steps import base
@@ -325,6 +325,63 @@ def action(doc_id):
def _get_measures(self) -> List[str]:
return ['took']
+class IngestStepExtended(OpenSearchStep):
+ """See base class."""
+
+ label = 'ingest_extended'
+
+ def __init__(self, step_config: StepConfig):
+ super().__init__(step_config)
+ self.index_name = parse_string_param('index_name', step_config.config,
+ {}, None)
+ self.field_name = parse_string_param('field_name', step_config.config,
+ {}, None)
+ self.bulk_size = parse_int_param('bulk_size', step_config.config, {},
+ 300)
+ self.implicit_config = step_config.implicit_config
+ dataset_format = parse_string_param('dataset_format',
+ step_config.config, {}, 'hdf5')
+ dataset_path = parse_string_param('dataset_path', step_config.config,
+ {}, None)
+
+ self.dataset = parse_dataset(dataset_format, dataset_path,
+ Context.INDEX)
+
+ self.attributes_dataset_name = parse_string_param('attributes_dataset_name',
+ step_config.config, {}, None)
+
+ self.attributes_dataset = parse_dataset(dataset_format, dataset_path,
+ Context.CUSTOM, self.attributes_dataset_name)
+
+ self.attribute_spec = parse_list_param('attribute_spec',
+ step_config.config, {}, [])
+
+ input_doc_count = parse_int_param('doc_count', step_config.config, {},
+ self.dataset.size())
+ self.doc_count = min(input_doc_count, self.dataset.size())
+
+ def _action(self):
+
+ def action(doc_id):
+ return {'index': {'_index': self.index_name, '_id': doc_id}}
+
+ # Maintain minimal state outside of this loop. For large data sets, too
+ # much state may cause out of memory failure
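+        # attribute rows are small (a few scalar fields per vector), so the whole
+        # attributes dataset is read up-front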
+ partition_attr = self.attributes_dataset.read(self.doc_count)
+ for i in range(0, self.doc_count, self.bulk_size):
+ partition = self.dataset.read(self.bulk_size)
+ if partition is None:
+ break
+            body = bulk_transform_with_attributes(partition, partition_attr, self.field_name,
+                                                  self.attributes_dataset_name, action, i, self.attribute_spec)
+ bulk_index(self.opensearch, self.index_name, body)
+
+ self.dataset.reset()
+
+ return {}
+
+ def _get_measures(self) -> List[str]:
+ return ['took']
+
class QueryStep(OpenSearchStep):
"""See base class."""
@@ -414,6 +471,134 @@ def _get_measures(self) -> List[str]:
return measures
+class QueryWithFilterStep(OpenSearchStep):
+ """See base class."""
+
+ label = 'query_with_filter'
+
+ def __init__(self, step_config: StepConfig):
+ super().__init__(step_config)
+ self.k = parse_int_param('k', step_config.config, {}, 100)
+ self.r = parse_int_param('r', step_config.config, {}, 1)
+ self.index_name = parse_string_param('index_name', step_config.config,
+ {}, None)
+ self.field_name = parse_string_param('field_name', step_config.config,
+ {}, None)
+ self.calculate_recall = parse_bool_param('calculate_recall',
+ step_config.config, {}, False)
+
+ self.filter_spec = parse_string_param('filter_spec', step_config.config, {}, None)
+
+ dataset_format = parse_string_param('dataset_format',
+ step_config.config, {}, 'hdf5')
+ dataset_path = parse_string_param('dataset_path',
+ step_config.config, {}, None)
+ self.dataset = parse_dataset(dataset_format, dataset_path,
+ Context.QUERY)
+
+ input_query_count = parse_int_param('query_count',
+ step_config.config, {},
+ self.dataset.size())
+ self.query_count = min(input_query_count, self.dataset.size())
+
+ neighbors_format = parse_string_param('neighbors_format',
+ step_config.config, {}, 'hdf5')
+ neighbors_path = parse_string_param('neighbors_path',
+ step_config.config, {}, None)
+
+ neighbors_dataset = parse_string_param('neighbors_dataset',
+ step_config.config, {}, None)
+
+ self.neighbors = parse_dataset(neighbors_format, neighbors_path,
+ Context.CUSTOM, neighbors_dataset)
+
+ self.filter_type = parse_string_param('filter_type', step_config.config, {}, 'SCRIPT')
+ self.score_script_similarity = parse_string_param('score_script_similarity', step_config.config, {}, 'l2')
+
+ self.implicit_config = step_config.implicit_config
+
+    def _action(self):
+        # load the filter specification once; it is reused for every query
+        with open(self.filter_spec) as filter_spec_file:
+            filter_json = json.load(filter_spec_file)
+
+        def get_body_filter(vec):
+ if self.filter_type == 'FILTER':
+ return {
+ 'size': self.k,
+ 'query': {
+ 'knn': {
+ self.field_name: {
+ 'vector': vec,
+ 'k': self.k,
+ 'filter': filter_json
+ }
+ }
+ }
+ }
+ elif self.filter_type == 'SCRIPT':
+ return {
+ 'size': self.k,
+ 'query': {
+ 'script_score': {
+ 'query': {
+ 'bool': {
+ 'filter': filter_json
+ }
+ },
+ 'script': {
+ 'source': 'knn_score',
+ 'lang': 'knn',
+ 'params': {
+ 'field': self.field_name,
+ 'query_value': vec,
+ 'space_type': self.score_script_similarity
+ }
+ }
+ }
+ }
+ }
+ else:
+                raise ConfigurationError('Unsupported filter type {}'.format(self.filter_type))
+
+ results = {}
+ query_responses = []
+
+ for i in range(self.query_count):
+ query = self.dataset.read(1)
+ if query is None:
+ break
+ body = get_body_filter(query[0])
+ query_responses.append(
+ query_index(self.opensearch, self.index_name,
+ body, [self.field_name]))
+
+ results['took'] = [
+ float(query_response['took']) for query_response in query_responses
+ ]
+ results['memory_kb'] = get_cache_size_in_kb(self.endpoint, 9200)
+
+ if self.calculate_recall:
+ ids = [[int(hit['_id'])
+ for hit in query_response['hits']['hits']]
+ for query_response in query_responses]
+ r_at_k = recall_at_r(ids, self.neighbors,
+ self.k, self.k, self.query_count)
+ results['recall@K'] = r_at_k
+ self.neighbors.reset()
+ r_at_r = recall_at_r(
+ ids, self.neighbors, self.r, self.k, self.query_count)
+ results[f'recall@{str(self.r)}'] = r_at_r
+ self.neighbors.reset()
+
+ self.dataset.reset()
+
+ return results
+
+ def _get_measures(self) -> List[str]:
+ measures = ['took', 'memory_kb']
+
+ if self.calculate_recall:
+ measures.extend(['recall@K', f'recall@{str(self.r)}'])
+
+ return measures
# Helper functions - (AKA not steps)
def bulk_transform(partition: np.ndarray, field_name: str, action,
@@ -436,6 +621,45 @@ def bulk_transform(partition: np.ndarray, field_name: str, action,
actions[1::2] = [{field_name: vec} for vec in partition.tolist()]
return actions
+def bulk_transform_with_attributes(partition: np.ndarray, partition_attr, field_name: str, attributes_dataset_name: str,
+ action, offset: int, attributes_def) -> List[Dict[str, Any]]:
+    """Partitions and transforms a list of vectors into OpenSearch's bulk
+    ingestion format, attaching attribute fields to each document.
+
+    Args:
+        partition: An array of vectors to transform.
+        partition_attr: Array of attribute rows aligned with the vectors in the full dataset.
+        field_name: field name for action
+        attributes_dataset_name: name of the attributes dataset (currently unused)
+        action: Bulk API action.
+        offset: offset of this partition within the dataset; used for doc ids and attribute lookups
+        attributes_def: attribute spec entries ({id, name, type}) selecting which attribute columns to index
+    Returns:
+        An array of transformed vectors in bulk format.
+    """
+ actions = []
+ _ = [
+ actions.extend([action(i + offset), None])
+ for i in range(len(partition))
+ ]
+ idx = 1
+ part_list = partition.tolist()
+ for i in range(len(partition)):
+ actions[idx] = {field_name: part_list[i]}
+ attr_idx = i + offset
+
+ for attribute in attributes_def:
+ attr_def_idx = attribute['id']
+ attr_def_name = attribute['name']
+ attr_def_type = attribute['type']
+
+ if attr_def_type == 'str':
+ val = partition_attr[attr_idx][attr_def_idx].decode()
+ if val != 'None':
+ actions[idx][attr_def_name] = val
+ elif attr_def_type == 'int':
+ val = int(partition_attr[attr_idx][attr_def_idx].decode())
+ actions[idx][attr_def_name] = val
+        idx += 2
+
+ return actions
+
def delete_index(opensearch: OpenSearch, index_name: str):
"""Deletes an OpenSearch index.
@@ -520,16 +744,20 @@ def recall_at_r(results, neighbor_dataset, r, k, query_count):
Recall at R
"""
correct = 0.0
+ total_num_of_results = 0
for query in range(query_count):
true_neighbors = neighbor_dataset.read(1)
if true_neighbors is None:
break
true_neighbors_set = set(true_neighbors[0][:k])
- for j in range(r):
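+        # ground truth rows for filtered queries are padded with -1 for neighbors
+        # that do not pass the filter (see add-filters-to-dataset.py), so drop the padding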
+ true_neighbors_set.discard(-1)
+ min_r = min(r, len(true_neighbors_set))
+ total_num_of_results += min_r
+ for j in range(min_r):
if results[query][j] in true_neighbors_set:
correct += 1.0
- return correct / (r * query_count)
+    # guard against division by zero when every ground truth neighbor was filtered out
+    if total_num_of_results == 0:
+        return 0.0
+    return correct / total_num_of_results
def get_index_size_in_kb(opensearch, index_name):
diff --git a/benchmarks/perf-tool/sample-configs/filter-spec/filter-1-spec.json b/benchmarks/perf-tool/sample-configs/filter-spec/filter-1-spec.json
new file mode 100644
index 000000000..f529de4fe
--- /dev/null
+++ b/benchmarks/perf-tool/sample-configs/filter-spec/filter-1-spec.json
@@ -0,0 +1,24 @@
+{
+ "bool":
+ {
+ "must":
+ [
+ {
+ "range":
+ {
+ "age":
+ {
+ "gte": 20,
+ "lte": 100
+ }
+ }
+ },
+ {
+ "term":
+ {
+ "color": "red"
+ }
+ }
+ ]
+ }
+}
\ No newline at end of file
diff --git a/benchmarks/perf-tool/sample-configs/filter-spec/filter-2-spec.json b/benchmarks/perf-tool/sample-configs/filter-spec/filter-2-spec.json
new file mode 100644
index 000000000..9d4514e62
--- /dev/null
+++ b/benchmarks/perf-tool/sample-configs/filter-spec/filter-2-spec.json
@@ -0,0 +1,40 @@
+{
+ "bool":
+ {
+ "must":
+ [
+ {
+ "term":
+ {
+ "taste": "salty"
+ }
+ },
+ {
+ "bool":
+ {
+ "should":
+ [
+ {
+ "bool":
+ {
+ "must_not":
+ {
+ "exists":
+ {
+ "field": "color"
+ }
+ }
+ }
+ },
+ {
+ "term":
+ {
+ "color": "blue"
+ }
+ }
+ ]
+ }
+ }
+ ]
+ }
+}
\ No newline at end of file
diff --git a/benchmarks/perf-tool/sample-configs/filter-spec/filter-3-spec.json b/benchmarks/perf-tool/sample-configs/filter-spec/filter-3-spec.json
new file mode 100644
index 000000000..d69f8768e
--- /dev/null
+++ b/benchmarks/perf-tool/sample-configs/filter-spec/filter-3-spec.json
@@ -0,0 +1,30 @@
+{
+ "bool":
+ {
+ "must":
+ [
+ {
+ "range":
+ {
+ "age":
+ {
+ "gte": 20,
+ "lte": 80
+ }
+ }
+ },
+ {
+ "exists":
+ {
+ "field": "color"
+ }
+ },
+ {
+ "exists":
+ {
+ "field": "taste"
+ }
+ }
+ ]
+ }
+}
\ No newline at end of file
diff --git a/benchmarks/perf-tool/sample-configs/filter-spec/filter-4-spec.json b/benchmarks/perf-tool/sample-configs/filter-spec/filter-4-spec.json
new file mode 100644
index 000000000..9e6356f1c
--- /dev/null
+++ b/benchmarks/perf-tool/sample-configs/filter-spec/filter-4-spec.json
@@ -0,0 +1,44 @@
+{
+ "bool":
+ {
+ "must":
+ [
+ {
+ "range":
+ {
+ "age":
+ {
+ "gte": 30,
+ "lte": 60
+ }
+ }
+ },
+ {
+ "term":
+ {
+ "taste": "bitter"
+ }
+ },
+ {
+ "bool":
+ {
+ "should":
+ [
+ {
+ "term":
+ {
+ "color": "blue"
+ }
+ },
+ {
+ "term":
+ {
+ "color": "green"
+ }
+ }
+ ]
+ }
+ }
+ ]
+ }
+}
\ No newline at end of file
diff --git a/benchmarks/perf-tool/sample-configs/filter-spec/filter-5-spec.json b/benchmarks/perf-tool/sample-configs/filter-spec/filter-5-spec.json
new file mode 100644
index 000000000..08acded4b
--- /dev/null
+++ b/benchmarks/perf-tool/sample-configs/filter-spec/filter-5-spec.json
@@ -0,0 +1,48 @@
+{
+ "bool":
+ {
+ "should":
+ [
+ {
+ "range":
+ {
+ "age":
+ {
+ "gte": 30,
+ "lte": 70
+ }
+ }
+ },
+ {
+ "term":
+ {
+ "color": "green"
+ }
+ },
+ {
+ "term":
+ {
+ "color": "blue"
+ }
+ },
+ {
+ "term":
+ {
+ "color": "yellow"
+ }
+ },
+            {
+                "term":
+                {
+                    "taste": "sweet"
+                }
+            }
+ ]
+ }
+}
\ No newline at end of file
diff --git a/benchmarks/perf-tool/sample-configs/lucene-sift-hnsw-filter/index-spec.json b/benchmarks/perf-tool/sample-configs/lucene-sift-hnsw-filter/index-spec.json
new file mode 100644
index 000000000..83ea79b15
--- /dev/null
+++ b/benchmarks/perf-tool/sample-configs/lucene-sift-hnsw-filter/index-spec.json
@@ -0,0 +1,27 @@
+{
+ "settings": {
+ "index": {
+ "knn": true,
+ "refresh_interval": "10s",
+ "number_of_shards": 30,
+ "number_of_replicas": 0
+ }
+ },
+ "mappings": {
+ "properties": {
+ "target_field": {
+ "type": "knn_vector",
+ "dimension": 128,
+ "method": {
+ "name": "hnsw",
+ "space_type": "l2",
+ "engine": "lucene",
+ "parameters": {
+ "ef_construction": 100,
+ "m": 16
+ }
+ }
+ }
+ }
+ }
+}
diff --git a/benchmarks/perf-tool/sample-configs/lucene-sift-hnsw-filter/test.yml b/benchmarks/perf-tool/sample-configs/lucene-sift-hnsw-filter/test.yml
new file mode 100644
index 000000000..6389a7de9
--- /dev/null
+++ b/benchmarks/perf-tool/sample-configs/lucene-sift-hnsw-filter/test.yml
@@ -0,0 +1,41 @@
+endpoint: localhost
+test_name: lucene_sift_hnsw_filter
+test_id: "Test workflow for lucene hnsw with filtering"
+num_runs: 1
+show_runs: false
+setup:
+ - name: delete_index
+ index_name: target_index
+steps:
+ - name: create_index
+ index_name: target_index
+ index_spec: sample-configs/lucene-sift-hnsw-filter/index-spec.json
+ - name: ingest_extended
+ index_name: target_index
+ field_name: target_field
+ bulk_size: 500
+ dataset_format: hdf5
+ dataset_path: ../dataset/sift-128-euclidean-with-attr.hdf5
+ attributes_dataset_name: attributes
+ attribute_spec: [ { id: 0, name: 'color', type: 'str' }, { id: 1, name: 'taste', type: 'str' }, { id: 2, name: 'age', type: 'int' } ]
+ - name: refresh_index
+ index_name: target_index
+ - name: force_merge
+ index_name: target_index
+ max_num_segments: 10
+ - name: query_with_filter
+ k: 10
+ r: 1
+ calculate_recall: true
+ index_name: target_index
+ field_name: target_field
+ dataset_format: hdf5
+ dataset_path: ../dataset/sift-128-euclidean-with-attr.hdf5
+ neighbors_format: hdf5
+ neighbors_path: ../dataset/sift-128-euclidean-with-attr-with-filters.hdf5
+ neighbors_dataset: neighbors_filter_1
+ filter_spec: sample-configs/filter-spec/filter-1-spec.json
+ query_count: 100
+cleanup:
+ - name: delete_index
+ index_name: target_index
\ No newline at end of file