[MOD-12263] Enhance FT.PROFILE with vector search execution details (#7408)

meiravgri · web-flow · commit a43aacf782c0 · 2025-11-19T09:27:14.000Z
* add vector search mode to profule

add VecSimSearchMode_ToString

* ADD 'Largest batch size',and 'Largest batch iteration (zero based)

* reset maxBatchSize and maxBatchIteration
diff --git a/src/iterators/hybrid_reader.c b/src/iterators/hybrid_reader.c
@@ -243,6 +243,8 @@ static VecSimQueryReply_Code prepareResults(HybridIterator *hr) {
     child_num_estimated = VecSimIndex_IndexSize(hr->index);
   }
   size_t child_upper_bound = child_num_estimated;
+  // Track maximum batch size
+  hr->maxBatchSize = hr->runtimeParams.batchSize;
   while (VecSimBatchIterator_HasNext(batch_it)) {
     hr->numIterations++;
     size_t vec_index_size = VecSimIndex_IndexSize(hr->index);
@@ -252,6 +254,11 @@ static VecSimQueryReply_Code prepareResults(HybridIterator *hr) {
     size_t batch_size = hr->runtimeParams.batchSize;
     if (batch_size == 0) {
       batch_size = n_res_left * ((float)vec_index_size / child_num_estimated) + 1;
+      // If given by the user, it's constant, otherwise update the maximum batch size.
+      if (batch_size > hr->maxBatchSize) {
+        hr->maxBatchSize = batch_size;
+        hr->maxBatchIteration = hr->numIterations - 1;  // Zero-based
+      }
     }
     VecSimQueryReply_Free(hr->reply);
     VecSimQueryReply_IteratorFree(hr->iter);
@@ -379,6 +386,8 @@ static void HR_Rewind(QueryIterator *ctx) {
   HybridIterator *hr = (HybridIterator *)ctx;
   hr->resultsPrepared = false;
   hr->numIterations = 0;
+  hr->maxBatchSize = 0;
+  hr->maxBatchIteration = 0;
   VecSimQueryReply_Free(hr->reply);
   VecSimQueryReply_IteratorFree(hr->iter);
   hr->reply = NULL;
@@ -473,6 +482,8 @@ QueryIterator *NewHybridVectorIterator(HybridIteratorParams hParams, QueryError
   hi->iter = NULL;
   hi->topResults = NULL;
   hi->numIterations = 0;
+  hi->maxBatchSize = 0;
+  hi->maxBatchIteration = 0;
   hi->canTrimDeepResults = hParams.canTrimDeepResults;
   hi->timeoutCtx = (TimeoutCtx){ .timeout = hParams.timeout, .counter = 0 };
   hi->runtimeParams.timeoutCtx = &hi->timeoutCtx;
diff --git a/src/iterators/hybrid_reader.h b/src/iterators/hybrid_reader.h
@@ -49,6 +49,8 @@ typedef struct {
   char *scoreField;                // To use by the sorter, for distinguishing between different vector fields.
   mm_heap_t *topResults;           // Sorted by score (min-max heap).
   size_t numIterations;
+  size_t maxBatchSize;             // Maximum batch size used during batches mode
+  size_t maxBatchIteration;        // Iteration (zero-based) where the maximum batch size occurred
   bool canTrimDeepResults;         // Ignore the document scores, only vector score matters. No need to deep copy the results from the child iterator.
   TimeoutCtx timeoutCtx;           // Timeout parameters
   FieldFilterContext filterCtx;
diff --git a/src/profile.c b/src/profile.c
@@ -408,6 +408,10 @@ PRINT_PROFILE_FUNC(printMetricIt) {
 
   printProfileCounters(counters);
 
+  if (it->type == VECTOR_DISTANCE) {
+    printProfileVectorSearchMode(VECSIM_RANGE_QUERY);
+  }
+
   RedisModule_Reply_MapEnd(reply);
 }
 
@@ -423,9 +427,12 @@ void PrintIteratorChildProfile(RedisModule_Reply *reply, QueryIterator *root, Pr
 
     if (root->type == HYBRID_ITERATOR) {
       HybridIterator *hi = (HybridIterator *)root;
+      printProfileVectorSearchMode(hi->searchMode);
       if (hi->searchMode == VECSIM_HYBRID_BATCHES ||
           hi->searchMode == VECSIM_HYBRID_BATCHES_TO_ADHOC_BF) {
         printProfileNumBatches(hi);
+        printProfileMaxBatchSize(hi);
+        printProfileMaxBatchIteration(hi);
       }
     }
 
diff --git a/src/profile.h b/src/profile.h
@@ -24,8 +24,14 @@
 #define printProfileGILTime(vtime) RedisModule_ReplyKV_Double(reply, "GIL-Time", (rs_timer_ms(&(vtime))))
 #define printProfileNumBatches(hybrid_reader) \
   RedisModule_ReplyKV_LongLong(reply, "Batches number", (hybrid_reader)->numIterations)
+#define printProfileMaxBatchSize(hybrid_reader) \
+  RedisModule_ReplyKV_LongLong(reply, "Largest batch size", (hybrid_reader)->maxBatchSize)
+#define printProfileMaxBatchIteration(hybrid_reader) \
+  RedisModule_ReplyKV_LongLong(reply, "Largest batch iteration (zero based)", (hybrid_reader)->maxBatchIteration)
 #define printProfileOptimizationType(oi) \
   RedisModule_ReplyKV_SimpleString(reply, "Optimizer mode", QOptimizer_PrintType((oi)->optim))
+#define printProfileVectorSearchMode(searchMode) \
+  RedisModule_ReplyKV_SimpleString(reply, "Vector search mode", VecSimSearchMode_ToString(searchMode))
 
 /**
  * @brief Add profile iterators to all nodes in the iterator tree
diff --git a/src/vector_index.c b/src/vector_index.c
@@ -296,6 +296,23 @@ const char *VecSimAlgorithm_ToString(VecSimAlgo algo) {
   }
   return NULL;
 }
+const char *VecSimSearchMode_ToString(VecSearchMode vecsimSearchMode) {
+    switch (vecsimSearchMode) {
+    case EMPTY_MODE:
+        return "EMPTY_MODE";
+    case STANDARD_KNN:
+        return "STANDARD_KNN";
+    case HYBRID_ADHOC_BF:
+        return "HYBRID_ADHOC_BF";
+    case HYBRID_BATCHES:
+        return "HYBRID_BATCHES";
+    case HYBRID_BATCHES_TO_ADHOC_BF:
+        return "HYBRID_BATCHES_TO_ADHOC_BF";
+    case RANGE_QUERY:
+        return "RANGE_QUERY";
+    }
+    return NULL;
+}
 
 bool VecSim_IsLeanVecCompressionType(VecSimSvsQuantBits quantBits) {
   return quantBits == VecSimSvsQuant_4x8_LeanVec || quantBits == VecSimSvsQuant_8x8_LeanVec;
diff --git a/src/vector_index.h b/src/vector_index.h
@@ -162,6 +162,7 @@ size_t VecSimType_sizeof(VecSimType type);
 const char *VecSimType_ToString(VecSimType type);
 const char *VecSimMetric_ToString(VecSimMetric metric);
 const char *VecSimAlgorithm_ToString(VecSimAlgo algo);
+const char *VecSimSearchMode_ToString(VecSearchMode vecsimSearchMode);
 const char *VecSimSvsCompression_ToString(VecSimSvsQuantBits quantBits);
 const char *VecSimSearchHistory_ToString(VecSimOptionMode option);
 bool VecSim_IsLeanVecCompressionType(VecSimSvsQuantBits quantBits);
diff --git a/tests/pytests/test_profile.py b/tests/pytests/test_profile.py
@@ -290,7 +290,7 @@ def testProfileVector(env):
 
   actual_res = conn.execute_command('ft.profile', 'idx', 'search', 'query', '*=>[KNN 3 @v $vec]',
                                     'SORTBY', '__v_score', 'PARAMS', '2', 'vec', 'aaaaaaaa', 'nocontent')
-  expected_iterators_res = ['Type', 'VECTOR', 'Number of reading operations', 3]
+  expected_iterators_res = ['Type', 'VECTOR', 'Number of reading operations', 3, 'Vector search mode', 'STANDARD_KNN']
   expected_vecsim_rp_res = ['Type', 'Metrics Applier', 'Results processed', 3]
   env.assertEqual(actual_res[0], [3, '4', '2', '1'])
   actual_profile = to_dict(actual_res[1][1][0])
@@ -301,7 +301,7 @@ def testProfileVector(env):
   # Range query - uses metric iterator. Radius is set so that the closest 2 vectors will be in the range
   actual_res = conn.execute_command('ft.profile', 'idx', 'search', 'query', '@v:[VECTOR_RANGE 3e36 $vec]=>{$yield_distance_as:dist}',
                                     'SORTBY', 'dist', 'PARAMS', '2', 'vec', 'aaaaaaaa', 'nocontent')
-  expected_iterators_res = ['Type', 'METRIC - VECTOR DISTANCE', 'Number of reading operations', 2]
+  expected_iterators_res = ['Type', 'METRIC - VECTOR DISTANCE', 'Number of reading operations', 2, 'Vector search mode', 'RANGE_QUERY']
   expected_vecsim_rp_res = ['Type', 'Metrics Applier', 'Results processed', 2]
   env.assertEqual(actual_res[0], [2, '4', '2'])
   actual_profile = to_dict(actual_res[1][1][0])
@@ -313,7 +313,7 @@ def testProfileVector(env):
   # Expect ad-hoc BF to take place - going over child iterator exactly once (reading 2 results)
   actual_res = conn.execute_command('ft.profile', 'idx', 'search', 'query', '(@t:hello world)=>[KNN 3 @v $vec]',
                                     'SORTBY', '__v_score', 'PARAMS', '2', 'vec', 'aaaaaaaa', 'nocontent')
-  expected_iterators_res = ['Type', 'VECTOR', 'Number of reading operations', 2, 'Child iterator',
+  expected_iterators_res = ['Type', 'VECTOR', 'Number of reading operations', 2, 'Vector search mode', 'HYBRID_ADHOC_BF', 'Child iterator',
                             ['Type', 'INTERSECT', 'Number of reading operations', 2, 'Child iterators', [
                               ['Type', 'TEXT', 'Term', 'world', 'Number of reading operations', 2, 'Estimated number of matches', 2],
                               ['Type', 'TEXT', 'Term', 'hello', 'Number of reading operations', 2, 'Estimated number of matches', 5]]]]
@@ -332,7 +332,7 @@ def testProfileVector(env):
   actual_res = conn.execute_command('ft.profile', 'idx', 'search', 'query', '(@t:hello world)=>[KNN 3 @v $vec]',
                                     'SORTBY', '__v_score', 'PARAMS', '2', 'vec', 'aaaaaaaa', 'nocontent')
   env.assertEqual(actual_res[0], [3, '4', '6', '7'])
-  expected_iterators_res = ['Type', 'VECTOR', 'Number of reading operations', 3, 'Batches number', 2, 'Child iterator',
+  expected_iterators_res = ['Type', 'VECTOR', 'Number of reading operations', 3, 'Vector search mode', 'HYBRID_BATCHES', 'Batches number', 2, 'Largest batch size', 4, 'Largest batch iteration (zero based)', 0, 'Child iterator',
                             ['Type', 'INTERSECT', 'Number of reading operations', 8, 'Child iterators', [
                               ['Type', 'TEXT', 'Term', 'world', 'Number of reading operations', 8, 'Estimated number of matches', 9997],
                               ['Type', 'TEXT', 'Term', 'hello', 'Number of reading operations', 8, 'Estimated number of matches', 10000]]]]
@@ -348,7 +348,7 @@ def testProfileVector(env):
 
   # expected results that pass the filter is index_size/2. after two iterations with no results,
   # we should move ad-hoc BF.
-  expected_iterators_res = ['Type', 'VECTOR', 'Number of reading operations', 0, 'Batches number', 2, 'Child iterator',
+  expected_iterators_res = ['Type', 'VECTOR', 'Number of reading operations', 0, 'Vector search mode', 'HYBRID_BATCHES_TO_ADHOC_BF', 'Batches number', 2, 'Largest batch size', 13, 'Largest batch iteration (zero based)', 1, 'Child iterator',
                             ['Type', 'INTERSECT', 'Number of reading operations', 2, 'Child iterators', [
                              ['Type', 'TEXT', 'Term', 'hello', 'Number of reading operations', 5, 'Estimated number of matches', 10000],
                              ['Type', 'TEXT', 'Term', 'other', 'Number of reading operations', 3, 'Estimated number of matches', 10000]]]]
@@ -363,7 +363,7 @@ def testProfileVector(env):
   # index after the 13th batch.
   actual_res = conn.execute_command('ft.profile', 'idx', 'search', 'query', '(@t:hello other)=>[KNN 2 @v $vec HYBRID_POLICY BATCHES]',
                                     'SORTBY', '__v_score', 'PARAMS', '2', 'vec', '????????', 'nocontent')
-  expected_iterators_res = ['Type', 'VECTOR', 'Number of reading operations', 0, 'Batches number', 13, 'Child iterator',
+  expected_iterators_res = ['Type', 'VECTOR', 'Number of reading operations', 0, 'Vector search mode', 'HYBRID_BATCHES', 'Batches number', 13, 'Largest batch size', 20001, 'Largest batch iteration (zero based)', 12, 'Child iterator',
                              ['Type', 'INTERSECT', 'Number of reading operations', 12, 'Child iterators', [
                               ['Type', 'TEXT', 'Term', 'hello', 'Number of reading operations', 25, 'Estimated number of matches', 10000],
                               ['Type', 'TEXT', 'Term', 'other', 'Number of reading operations', 13, 'Estimated number of matches', 10000]]]]
@@ -375,7 +375,7 @@ def testProfileVector(env):
   # After 200 iterations, we should go over the entire index.
   actual_res = conn.execute_command('ft.profile', 'idx', 'search', 'query', '(@t:hello other)=>[KNN 2 @v $vec HYBRID_POLICY BATCHES BATCH_SIZE 100]',
                                     'SORTBY', '__v_score', 'PARAMS', '2', 'vec', '????????', 'nocontent', 'timeout', '100000')
-  expected_iterators_res = ['Type', 'VECTOR', 'Number of reading operations', 0, 'Batches number', 200, 'Child iterator',
+  expected_iterators_res = ['Type', 'VECTOR', 'Number of reading operations', 0, 'Vector search mode', 'HYBRID_BATCHES', 'Batches number', 200, 'Largest batch size', 100, 'Largest batch iteration (zero based)', 0, 'Child iterator',
                             ['Type', 'INTERSECT', 'Number of reading operations', 199, 'Child iterators', [
                              ['Type', 'TEXT', 'Term', 'hello', 'Number of reading operations', 399, 'Estimated number of matches', 10000],
                              ['Type', 'TEXT', 'Term', 'other', 'Number of reading operations', 200, 'Estimated number of matches', 10000]]]]
@@ -389,7 +389,7 @@ def testProfileVector(env):
   # every iteration that returned 0 results.
   actual_res = conn.execute_command('ft.profile', 'idx', 'search', 'query', '(@t:hello other)=>[KNN 2 @v $vec BATCH_SIZE 100]',
                                     'SORTBY', '__v_score', 'PARAMS', '2', 'vec', '????????', 'nocontent')
-  expected_iterators_res = ['Type', 'VECTOR', 'Number of reading operations', 0, 'Batches number', 2, 'Child iterator',
+  expected_iterators_res = ['Type', 'VECTOR', 'Number of reading operations', 0, 'Vector search mode', 'HYBRID_BATCHES_TO_ADHOC_BF', 'Batches number', 2, 'Largest batch size', 100, 'Largest batch iteration (zero based)', 0, 'Child iterator',
                             ['Type', 'INTERSECT', 'Number of reading operations', 2, 'Child iterators', [
                              ['Type', 'TEXT', 'Term', 'hello', 'Number of reading operations', 5, 'Estimated number of matches', 10000],
                              ['Type', 'TEXT', 'Term', 'other', 'Number of reading operations', 3, 'Estimated number of matches', 10000]]]]
@@ -693,3 +693,82 @@ def testProfileBM25NormMax(env):
   env.assertTrue(recursive_contains(aggregate_response, "Score Max Normalizer"))
   search_response = env.cmd('FT.PROFILE', 'idx', 'SEARCH', 'query', 'hello', 'WITHSCORES', 'SCORER', 'BM25STD.NORM')
   env.assertTrue(recursive_contains(search_response, "Score Max Normalizer"))
+
+def testProfileVectorSearchMode():
+  """Test Vector search mode field in FT.PROFILE for both SEARCH and AGGREGATE"""
+  env = Env(moduleArgs='DEFAULT_DIALECT 2', protocol=3)  # Use RESP3 for easier dict access
+  conn = getConnectionByEnv(env)
+
+  env.expect('FT.CREATE', 'idx', 'SCHEMA', 'v', 'VECTOR', 'FLAT', '6', 'TYPE', 'FLOAT32', 'DIM', '2', 'DISTANCE_METRIC', 'L2', 't', 'TEXT').ok()
+
+  conn.execute_command('hset', '1', 'v', 'bababaca', 't', "hello")
+  conn.execute_command('hset', '2', 'v', 'babababa', 't', "hello")
+  conn.execute_command('hset', '3', 'v', 'aabbaabb', 't', "hello")
+  conn.execute_command('hset', '4', 'v', 'bbaabbaa', 't', "hello world")
+  conn.execute_command('hset', '5', 'v', 'aaaabbbb', 't', "hello world")
+
+  # Helper function to test both SEARCH and AGGREGATE
+  def verify_search_mode(query_type, query, params, expected_mode, expected_iterator_type='VECTOR'):
+    scenario_message = f"query_type: {query_type}, query: {query}, params: {params}, expected_mode: {expected_mode}"
+    """
+    Verify that Vector search mode appears in profile for both SEARCH and AGGREGATE
+    query_type: 'SEARCH' or 'AGGREGATE'
+    query: the query string
+    params: list of params (e.g., ['vec', 'aaaaaaaa'])
+    expected_mode: expected search mode string
+    expected_iterator_type: 'VECTOR' or 'METRIC - VECTOR DISTANCE'
+    """
+    cmd = ['FT.PROFILE', 'idx', query_type, 'QUERY', query]
+    cmd.extend(['PARAMS'] + [str(len(params))] + params)
+
+    res = env.cmd(*cmd)
+
+    # Navigate to iterator profile (RESP3 dict structure)
+    shards = res['Profile']['Shards']
+    env.assertGreater(len(shards), 0, message=scenario_message)
+
+    # Check at least one shard has the expected search mode
+    # res['Profile']['Shards'][0]['Iterators profile']['Vector search mode']
+    found = False
+    for shard in shards:
+      iter_profile = shard['Iterators profile']
+      if iter_profile['Type'] == expected_iterator_type:
+        env.assertEqual(iter_profile['Vector search mode'], expected_mode, message=scenario_message)
+        found = True
+        break
+    env.assertTrue(found, message=f"{scenario_message}: Expected iterator type {expected_iterator_type} not found")
+
+  # Test 1: STANDARD_KNN
+  verify_search_mode('SEARCH', '*=>[KNN 3 @v $vec]', ['vec', 'aaaaaaaa'], 'STANDARD_KNN')
+  verify_search_mode('AGGREGATE', '*=>[KNN 3 @v $vec]', ['vec', 'aaaaaaaa'], 'STANDARD_KNN')
+
+  # Test 2: HYBRID_ADHOC_BF
+  verify_search_mode('SEARCH', '(@t:hello world)=>[KNN 3 @v $vec]', ['vec', 'aaaaaaaa'], 'HYBRID_ADHOC_BF')
+  verify_search_mode('AGGREGATE', '(@t:hello world)=>[KNN 3 @v $vec]', ['vec', 'aaaaaaaa'], 'HYBRID_ADHOC_BF')
+
+  # Test 3: RANGE_QUERY (uses METRIC_ITERATOR)
+  verify_search_mode('SEARCH', '@v:[VECTOR_RANGE 3e36 $vec]=>{$yield_distance_as:dist}',
+                     ['vec', 'aaaaaaaa'], 'RANGE_QUERY', 'METRIC - VECTOR DISTANCE')
+  verify_search_mode('AGGREGATE', '@v:[VECTOR_RANGE 3e36 $vec]=>{$yield_distance_as:dist}',
+                     ['vec', 'aaaaaaaa'], 'RANGE_QUERY', 'METRIC - VECTOR DISTANCE')
+
+  # Test 4: HYBRID_BATCHES
+  verify_search_mode('SEARCH', '(@t:hello world)=>[KNN 3 @v $vec HYBRID_POLICY BATCHES BATCH_SIZE 100]', ['vec', 'aaaaaaaa'], 'HYBRID_BATCHES')
+  verify_search_mode('AGGREGATE', '(@t:hello world)=>[KNN 3 @v $vec HYBRID_POLICY BATCHES BATCH_SIZE 100]', ['vec', 'aaaaaaaa'], 'HYBRID_BATCHES')
+
+  # Running HYBRID_BATCHES_TO_ADHOC_BF on cluster requires much more data and doesn't add a significant value
+  if env.isCluster():
+    return
+
+  for i in range(6, 5000):
+    conn.execute_command('hset', str(i), 'v', 'bababada', 't', "hello")
+
+  # Add another 10K docs with "other" tag for HYBRID_BATCHES_TO_ADHOC_BF test
+  for i in range(5000, 10001):
+    conn.execute_command('hset', str(i), 'v', '????????', 't', "other")
+
+  # Test 5: HYBRID_BATCHES_TO_ADHOC_BF
+  # Query: "hello" (10K docs) AND "other" (10K docs) → intersection is 0 (disjoint sets)
+  # High estimated results → starts BATCHES, but 0 actual results → switches to ADHOC_BF
+  verify_search_mode('SEARCH', '(@t:hello other)=>[KNN 3 @v $vec BATCH_SIZE 100]', ['vec', '????????'], 'HYBRID_BATCHES_TO_ADHOC_BF')
+  verify_search_mode('AGGREGATE', '(@t:hello other)=>[KNN 3 @v $vec BATCH_SIZE 100]', ['vec', '????????'], 'HYBRID_BATCHES_TO_ADHOC_BF')

Original file line number	Diff line number	Diff line change
`@@ -408,6 +408,10 @@ PRINT_PROFILE_FUNC(printMetricIt) {`
`408`	`408`
`409`	`409`	`printProfileCounters(counters);`
`410`	`410`
	`411`	`+ if (it->type == VECTOR_DISTANCE) {`
	`412`	`+ printProfileVectorSearchMode(VECSIM_RANGE_QUERY);`
	`413`	`+ }`
	`414`	`+`
`411`	`415`	`RedisModule_Reply_MapEnd(reply);`
`412`	`416`	`}`
`413`	`417`
`@@ -423,9 +427,12 @@ void PrintIteratorChildProfile(RedisModule_Reply reply, QueryIterator root, Pr`
`423`	`427`
`424`	`428`	`if (root->type == HYBRID_ITERATOR) {`
`425`	`429`	`HybridIterator hi = (HybridIterator )root;`
	`430`	`+ printProfileVectorSearchMode(hi->searchMode);`
`426`	`431`	`if (hi->searchMode == VECSIM_HYBRID_BATCHES \|\|`
`427`	`432`	`hi->searchMode == VECSIM_HYBRID_BATCHES_TO_ADHOC_BF) {`
`428`	`433`	`printProfileNumBatches(hi);`
	`434`	`+ printProfileMaxBatchSize(hi);`
	`435`	`+ printProfileMaxBatchIteration(hi);`
`429`	`436`	`}`
`430`	`437`	`}`
`431`	`438`