Skip to content
Closed
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
27 commits
Select commit Hold shift + click to select a range
62f13e1
feat: Implement SORTBY in FT.SEARCH. All previous commits squashed.
AlexFilipImproving Jan 28, 2026
eb99755
Merge branch 'main' into feature/sortby-implementation
AlexFilipImproving Jan 28, 2026
7ddc6bb
Add RequiresCompleteResults override
AlexFilipImproving Jan 28, 2026
047d3b5
Generate new answers file
AlexFilipImproving Jan 28, 2026
3a9d620
Fix some integration tests and generate new batch of answers
AlexFilipImproving Feb 3, 2026
a3c972c
Bug fix and put TODO back
AlexFilipImproving Feb 3, 2026
9fe989e
Regenerate aggregate answers
AlexFilipImproving Feb 3, 2026
739cdeb
Move from ToNumeric to To and regenerate answers
AlexFilipImproving Feb 3, 2026
7b3ba25
Add sortby identifier to json response
AlexFilipImproving Feb 5, 2026
2969d47
Regenerate answers
AlexFilipImproving Feb 5, 2026
4cf2fc6
Merge branch 'main' into feature/sortby-implementation
AlexFilipImproving Feb 5, 2026
ce5d657
Combine ProcessNeighborsForReply and ProcessNonVectorNeighborsForReply
AlexFilipImproving Feb 6, 2026
eb5d778
Pipe sort attribute through pipeline to make sure that it actually sorts
AlexFilipImproving Feb 7, 2026
0bd2368
Fix compatibility tests for SORTBY
AlexFilipImproving Feb 9, 2026
f81ac71
Add WITHSORTKEYS
AlexFilipImproving Feb 9, 2026
0e80f27
Merge branch 'main' into feature/sortby-implementation
AlexFilipImproving Feb 9, 2026
5ec285b
Fix failing test
AlexFilipImproving Feb 9, 2026
5fe9004
Merge branch 'feature/sortby-implementation' of github.com:Bit-Quill/…
AlexFilipImproving Feb 9, 2026
f9c4123
Fix tests
AlexFilipImproving Feb 9, 2026
5dbb631
Fix build errors
AlexFilipImproving Feb 9, 2026
a0378cd
Fix syntax
AlexFilipImproving Feb 9, 2026
20106f2
Remove unnecessary include
AlexFilipImproving Feb 9, 2026
8922e26
Remove secondary sorting
AlexFilipImproving Feb 9, 2026
cb01e7a
Regenerate answers
AlexFilipImproving Feb 10, 2026
9cc9c78
Minor test fix
AlexFilipImproving Feb 10, 2026
ca40b0d
Merge branch 'main' into feature/sortby-implementation
AlexFilipImproving Feb 11, 2026
8930298
Fix compile problem
AlexFilipImproving Feb 11, 2026
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 2 additions & 0 deletions COMMANDS.md
Original file line number Diff line number Diff line change
Expand Up @@ -153,6 +153,7 @@ FT.SEARCH <index> <query>
[TIMEOUT <timeout>]
[PARAMS nargs <name> <value> [ <name> <value> ...]]
[LIMIT <offset> <num>]
[SORTBY <field> [ASC|DESC]]
[DIALECT <dialect>]
```

Expand All @@ -165,6 +166,7 @@ Performs a search of the specified index. The keys which match the query express
- **PARAMS \<count\> \<name1\> \<value1\> \<name2\> \<value2\> ...** (optional): `count` is the number of arguments, i.e., twice the number of name-value pairs. See the query string for usage details.
- **RETURN \<count\> \<field1\> \<field2\> ...** (optional): `count` is the number of fields to return. Specifies the fields you want to retrieve from your documents, along with any aliases for the returned values. By default, all fields are returned unless the NOCONTENT option is set, in which case no fields are returned. If `count` is set to 0, it behaves the same as NOCONTENT.
- **LIMIT \<offset\> \<count\>** (optional): Lets you choose a portion of the result. The first `<offset>` keys are skipped and only a maximum of `<count>` keys are included. The default is LIMIT 0 10, which returns at most 10 keys.
- **SORTBY \<field\> [ASC|DESC]** (optional): Sorts the results by the specified indexed field. The field must be a numeric or tag field that is indexed. ASC sorts in ascending order (default), DESC sorts in descending order. Documents with missing values for the sort field are placed at the end of the results.
- **DIALECT \<dialect\>** (optional): Specifies your dialect. The only supported dialect is 2\.

**RESPONSE**
Expand Down
Binary file modified integration/compatibility/aggregate-answers.pickle.gz
Binary file not shown.
17 changes: 13 additions & 4 deletions integration/compatibility/generate.py
Original file line number Diff line number Diff line change
Expand Up @@ -44,8 +44,7 @@ def setup_class(cls):
if cls.ANSWER_FILE_NAME is None:
raise NotImplementedError("Subclass must define ANSWER_FILE_NAME")

os.system("docker remove Generate-search || true")
if os.system("docker run --name Generate-search -p 6380:6379 redis/redis-stack-server &") != 0:
if os.system("docker run --rm -d --name Generate-search -p 6380:6379 redis/redis-stack-server") != 0:
print("Failed to start Redis Stack server, please check your Docker setup.")
sys.exit(1)
print("Started Generate-search server")
Expand All @@ -66,7 +65,6 @@ def setup_class(cls):
def teardown_class(cls):
print("Stopping Generate-search server")
os.system("docker stop Generate-search")
os.system("docker remove Generate-search")
print("Dumping ", len(cls.answers), " answers")
with gzip.open(cls.ANSWER_FILE_NAME, "wb") as answer_file:
pickle.dump(cls.answers, answer_file)
Expand Down Expand Up @@ -155,7 +153,7 @@ def checkall(self, dialect, *orig_cmd, **kwargs):
self.checkvec(self, dialect, orig_cmd, kwargs)
self.check(self, dialect, orig_cmd)

'''
'''
def test_bad_numeric_data(self, key_type, dialect):
self.setup_data("bad numbers", key_type)
self.check(dialect, f"ft.search {key_type}_idx1", "@n1:[-inf inf]")
Expand Down Expand Up @@ -460,3 +458,14 @@ def test_aggregate_dyadic_ops(self, key_type, dialect):
"as",
"nn",
)

def test_search_sortby(self, key_type, dialect):
    """Exercise FT.SEARCH SORTBY across every combination of sort field,
    direction, RETURN clause, WITHSORTKEYS flag and LIMIT window."""
    self.setup_data("sortable numbers", key_type)

    fields = ["n1", "n2"]
    orders = ["ASC", "DESC", ""]
    returns = ["", "RETURN 3 @n1 @t1"]
    sortkey_flags = ["", "WITHSORTKEYS"]
    limits = ["LIMIT 0 5", "LIMIT 2 3", ""]
    # Nested comprehension enumerates combinations in the same order the
    # original nested for-loops did.
    combos = [
        (f, o, r, w, l)
        for f in fields
        for o in orders
        for r in returns
        for w in sortkey_flags
        for l in limits
    ]
    for field, order, ret, flag, window in combos:
        self.check(dialect, f"ft.search {key_type}_idx1 * SORTBY {field} {order} {ret} {window} {flag}")

58 changes: 47 additions & 11 deletions integration/compatibility_test.py
Original file line number Diff line number Diff line change
Expand Up @@ -95,16 +95,47 @@ def parse_value(x, key_type):
raise
return result

def unpack_search_result(rs, key_type):
def result_has_sortkeys(rs):
    """Detect if a search result actually contains sort keys by checking the format.

    With sort keys: [count, key1, #sortkey1, [fields1], key2, #sortkey2, [fields2], ...]
    Without sort keys: [count, key1, [fields1], key2, [fields2], ...]

    The sort key is a bytes/string that starts with '#' (or '$' in some Redis
    versions), and fields are always a list, so inspecting the element after
    the first key disambiguates the two layouts.
    """
    # Need at least [count, key1, <sortkey-or-fields>] to tell the formats apart.
    if len(rs) < 3:
        return False
    marker = rs[2]
    # startswith accepts a tuple of prefixes, so each type needs only one check.
    if isinstance(marker, bytes):
        return marker.startswith((b'#', b'$'))
    if isinstance(marker, str):
        return marker.startswith(('#', '$'))
    # A list (the fields array) or any other type means no sort keys.
    return False

def unpack_search_result(rs, key_type, has_sortkeys=False):
    """Convert an FT.SEARCH reply into a list of {field: value} row dicts.

    Reply layout with sort keys:    [count, key1, sortkey1, [fields1], ...]
    Reply layout without sort keys: [count, key1, [fields1], ...]

    The leading count element is always skipped, sort keys (when present) are
    discarded, and each fields array of alternating name/value entries is
    decoded via parse_field/parse_value. Each row carries its document key
    under the reserved "__key" entry.
    """
    rows = []
    # Each document occupies 3 reply elements with sort keys, 2 without;
    # the fields list is always the last element of the group.
    step = 3 if has_sortkeys else 2
    for i in range(1, len(rs), step):
        key = rs[i]
        value = rs[i + step - 1]
        row = {"__key": key}
        for j in range(0, len(value), 2):
            row[parse_field(value[j], key_type)] = parse_value(value[j + 1], key_type)
        rows += [row]
    return rows

def unpack_agg_result(rs, key_type):
Expand All @@ -123,7 +154,12 @@ def unpack_agg_result(rs, key_type):

def unpack_result(cmd, key_type, rs, sortkeys):
if "ft.search" in cmd[0].lower():
out = unpack_search_result(rs, key_type)
# Detect if the result actually has sort keys by checking the format,
# not just whether WITHSORTKEYS is in the command. This handles cases
# where the expected result (from pickle) may not have sort keys even
# if the command requested them.
has_sortkeys = result_has_sortkeys(rs)
out = unpack_search_result(rs, key_type, has_sortkeys)
else:
out = unpack_agg_result(rs, key_type)
#
Expand Down Expand Up @@ -242,7 +278,7 @@ def compare_results(expected, results):
sortkeys = [cmd[ix+2+i][1:] for i in range(count)]
elif 'sortby' in cmd:
ix = cmd.index('sortby')
count = int(cmd[ix+1])
count = int(cmd[ix+1]) if cmd[0] != 'ft.search' else 1
# Grab the fields after the count, stripping any leading '@'
sortkeys = [cmd[ix+2+i][1 if cmd[ix+2+i].startswith("@") else 0:] for i in range(count)]
for f in ['asc', 'desc', 'ASC', 'DESC']:
Expand Down
19 changes: 10 additions & 9 deletions src/attribute_data_type.cc
Original file line number Diff line number Diff line change
Expand Up @@ -77,22 +77,23 @@ bool HashHasRecord(ValkeyModuleKey *key, absl::string_view identifier) {
}

absl::StatusOr<RecordsMap> HashAttributeDataType::FetchAllRecords(
ValkeyModuleCtx *ctx, const std::string &vector_identifier,
ValkeyModuleCtx *ctx, const std::optional<std::string> &vector_identifier,
[[maybe_unused]] ValkeyModuleKey *open_key, absl::string_view key,
const absl::flat_hash_set<absl::string_view> &identifiers) const {
vmsdk::VerifyMainThread();
auto key_str = vmsdk::MakeUniqueValkeyString(key);
auto key_obj =
vmsdk::MakeUniqueValkeyOpenKey(ctx, key_str.get(), VALKEYMODULE_READ);
if (!key_obj) {
return absl::NotFoundError(
absl::StrCat("No such record with key: `", vector_identifier, "`"));
return absl::NotFoundError(absl::StrCat(
"No such record with key: `", vector_identifier.value_or(""), "`"));
}
// Only check for vector_identifier if it's not empty (vector queries)
if (!vector_identifier.empty() &&
!HashHasRecord(key_obj.get(), vector_identifier)) {
if (vector_identifier.has_value() &&
!HashHasRecord(key_obj.get(), vector_identifier.value())) {
return absl::NotFoundError(absl::StrCat("No such record with identifier: `",
vector_identifier, "`"));
vector_identifier.value_or(""),
"`"));
}
vmsdk::UniqueValkeyScanCursor cursor = vmsdk::MakeUniqueValkeyScanCursor();
HashScanCallbackData callback_data{identifiers};
Expand Down Expand Up @@ -177,13 +178,13 @@ absl::StatusOr<vmsdk::UniqueValkeyString> JsonAttributeDataType::GetRecord(
}

absl::StatusOr<RecordsMap> JsonAttributeDataType::FetchAllRecords(
ValkeyModuleCtx *ctx, const std::string &vector_identifier,
ValkeyModuleCtx *ctx, const std::optional<std::string> &vector_identifier,
ValkeyModuleKey *open_key, absl::string_view key,
const absl::flat_hash_set<absl::string_view> &identifiers) const {
// First, validate that a JSON object exists for the given key using the
// vector identifier.
VMSDK_RETURN_IF_ERROR(
GetJsonRecord(ctx, open_key, key, vector_identifier, nullptr));
VMSDK_RETURN_IF_ERROR(GetJsonRecord(ctx, open_key, key,
vector_identifier.value_or(""), nullptr));
RecordsMap key_value_content;
for (const auto &identifier : identifiers) {
auto str = GetRecord(ctx, open_key, key, identifier);
Expand Down
6 changes: 3 additions & 3 deletions src/attribute_data_type.h
Original file line number Diff line number Diff line change
Expand Up @@ -69,7 +69,7 @@ class AttributeDataType {
VALKEYMODULE_NOTIFY_EVICTED;
};
virtual absl::StatusOr<RecordsMap> FetchAllRecords(
ValkeyModuleCtx *ctx, const std::string &vector_identifier,
ValkeyModuleCtx *ctx, const std::optional<std::string> &vector_identifier,
ValkeyModuleKey *open_key, absl::string_view key,
const absl::flat_hash_set<absl::string_view> &identifiers) const = 0;
virtual data_model::AttributeDataType ToProto() const = 0;
Expand All @@ -94,7 +94,7 @@ class HashAttributeDataType : public AttributeDataType {
}
inline std::string ToString() const override { return "HASH"; }
absl::StatusOr<RecordsMap> FetchAllRecords(
ValkeyModuleCtx *ctx, const std::string &vector_identifier,
ValkeyModuleCtx *ctx, const std::optional<std::string> &vector_identifier,
ValkeyModuleKey *open_key, absl::string_view key,
const absl::flat_hash_set<absl::string_view> &identifiers) const override;
bool IsProperType(ValkeyModuleKey *key) const override {
Expand All @@ -120,7 +120,7 @@ class JsonAttributeDataType : public AttributeDataType {
}
inline std::string ToString() const override { return "JSON"; }
absl::StatusOr<RecordsMap> FetchAllRecords(
ValkeyModuleCtx *ctx, const std::string &vector_identifier,
ValkeyModuleCtx *ctx, const std::optional<std::string> &vector_identifier,
ValkeyModuleKey *open_key, absl::string_view key,
const absl::flat_hash_set<absl::string_view> &identifiers) const override;
bool IsProperType(ValkeyModuleKey *key) const override {
Expand Down
15 changes: 11 additions & 4 deletions src/commands/commands.cc
Original file line number Diff line number Diff line change
Expand Up @@ -12,6 +12,7 @@

#include "fanout.h"
#include "ft_create_parser.h"
#include "ft_search_parser.h"
#include "src/acl.h"
#include "src/commands/ft_search.h"
#include "src/coordinator/metadata_manager.h"
Expand Down Expand Up @@ -129,9 +130,9 @@ absl::Status QueryCommand::Execute(ValkeyModuleCtx *ctx,
uint32_t db_num = ValkeyModule_GetSelectedDb(ctx);
parameters->db_num = db_num;

VMSDK_ASSIGN_OR_RETURN(parameters->index_schema,
SchemaManager::Instance().GetIndexSchema(
db_num, parameters->index_schema_name));
VMSDK_ASSIGN_OR_RETURN(
parameters->index_schema,
schema_manager.GetIndexSchema(db_num, parameters->index_schema_name));
VMSDK_RETURN_IF_ERROR(
vmsdk::ParseParamValue(itr, parameters->parse_vars.query_string));
VMSDK_RETURN_IF_ERROR(parameters->ParseCommand(itr));
Expand Down Expand Up @@ -218,11 +219,17 @@ absl::Status QueryCommand::Execute(ValkeyModuleCtx *ctx,
parameters->index_schema->GetVersion());
}

// Extract sortby parameter if this is a SearchCommand
std::optional<query::SortByParameter> sortby_param = std::nullopt;
if (auto *search_cmd = dynamic_cast<SearchCommand *>(parameters.get())) {
sortby_param = search_cmd->sortby;
}

return query::fanout::PerformSearchFanoutAsync(
ctx, search_targets,
ValkeySearch::Instance().GetCoordinatorClientPool(),
std::move(parameters), ValkeySearch::Instance().GetReaderThreadPool(),
std::move(on_done_callback));
std::move(on_done_callback), sortby_param);
}
return query::SearchAsync(
std::move(parameters), ValkeySearch::Instance().GetReaderThreadPool(),
Expand Down
16 changes: 8 additions & 8 deletions src/commands/ft_aggregate.cc
Original file line number Diff line number Diff line change
Expand Up @@ -91,7 +91,7 @@ absl::Status AggregateParameters::ParseCommand(vmsdk::ArgsIterator &itr) {
RealIndexInterface real_index_interface(index_schema);
parse_vars_.index_interface_ = &real_index_interface;

VMSDK_RETURN_IF_ERROR(PreParseQueryString(*this));
VMSDK_RETURN_IF_ERROR(PreParseQueryString());
// Ensure that key is first value if it gets included...
CHECK(AddRecordAttribute("__key", "__key", indexes::IndexerType::kNone) == 0);
auto score_sv = vmsdk::ToStringView(score_as.get());
Expand All @@ -112,7 +112,7 @@ absl::Status AggregateParameters::ParseCommand(vmsdk::ArgsIterator &itr) {
limit.number = std::numeric_limits<uint64_t>::max(); // Override default of
// 10 from search

VMSDK_RETURN_IF_ERROR(PostParseQueryString(*this));
VMSDK_RETURN_IF_ERROR(PostParseQueryString());
VMSDK_RETURN_IF_ERROR(VerifyQueryString(*this));
VMSDK_RETURN_IF_ERROR(ManipulateReturnsClause(*this));

Expand Down Expand Up @@ -175,16 +175,16 @@ absl::StatusOr<std::pair<size_t, size_t>> ProcessNeighborsForProcessing(
size_t key_index = 0, scores_index = 0;

if (parameters.IsVectorQuery()) {
auto identifier =
auto vector_identifier =
parameters.index_schema->GetIdentifier(parameters.attribute_alias);
if (!identifier.ok()) {
if (!vector_identifier.ok()) {
++Metrics::GetStats().query_failed_requests_cnt;
return identifier.status();
return vector_identifier.status();
}

query::ProcessNeighborsForReply(
ctx, parameters.index_schema->GetAttributeDataType(), neighbors,
parameters, identifier.value());
parameters, vector_identifier.value());

if (parameters.load_key) {
key_index = parameters.AddRecordAttribute("__key", "__key",
Expand All @@ -196,9 +196,9 @@ absl::StatusOr<std::pair<size_t, size_t>> ProcessNeighborsForProcessing(
indexes::IndexerType::kNone);
}
} else {
query::ProcessNonVectorNeighborsForReply(
query::ProcessNeighborsForReply(
ctx, parameters.index_schema->GetAttributeDataType(), neighbors,
parameters);
parameters, std::nullopt);

if (parameters.load_key) {
key_index = parameters.AddRecordAttribute("__key", "__key",
Expand Down
Loading
Loading