Extend Cypher queries with the index hinting feature (#1345)

2023-10-27 14:26:19 +02:00 · 2023-10-27 14:26:19 +02:00 · 989bb97514
commit 989bb97514
parent a94588bde3
15 changed files with 768 additions and 74 deletions
--- a/.gitignore
+++ b/.gitignore
@ -60,3 +60,5 @@ src/storage/distributed/rpc/concurrent_id_mapper_rpc_messages.hpp
 src/transactions/distributed/engine_rpc_messages.hpp
 /tests/manual/js/transaction_timeout/package-lock.json
 /tests/manual/js/transaction_timeout/node_modules/
 .vscode/
 src/query/frontend/opencypher/grammar/.antlr/*
--- a/src/query/frontend/ast/ast.hpp
+++ b/src/query/frontend/ast/ast.hpp
@ -2069,6 +2069,27 @@ class Query : public memgraph::query::Tree, public utils::Visitable<QueryVisitor
  friend class AstStorage;
 };
 /// A single index hint attached to a Cypher query through the `USING INDEX` prefix.
 ///
 /// A hint names either a label index (`LABEL`) or a label+property index (`LABEL_PROPERTY`); `property_` is only
 /// populated for the latter.
 struct IndexHint {
  static const utils::TypeInfo kType;
  const utils::TypeInfo &GetTypeInfo() const { return kType; }
  /// Kind of index the hint refers to.
  enum class IndexType { LABEL, LABEL_PROPERTY };
  // Initialized explicitly so that a default-constructed hint never carries an indeterminate enum value.
  memgraph::query::IndexHint::IndexType index_type_{memgraph::query::IndexHint::IndexType::LABEL};
  /// Label named by the hint.
  memgraph::query::LabelIx label_;
  /// Property named by the hint; empty when no property was given.
  std::optional<memgraph::query::PropertyIx> property_{std::nullopt};
  /// Creates a copy of this hint whose label and property are looked up by name in `storage`.
  ///
  /// @param storage AST storage used to obtain the `LabelIx` / `PropertyIx` of the copy.
  /// @return the cloned hint.
  IndexHint Clone(AstStorage *storage) const {
    IndexHint object;
    object.index_type_ = index_type_;
    object.label_ = storage->GetLabelIx(label_.name);
    if (property_) {
      object.property_ = storage->GetPropertyIx(property_->name);
    }
    return object;
  }
 };
 class CypherQuery : public memgraph::query::Query, public utils::Visitable<HierarchicalTreeVisitor> {
 public:
  static const utils::TypeInfo kType;
@ -2093,6 +2114,11 @@ class CypherQuery : public memgraph::query::Query, public utils::Visitable<Hiera
  memgraph::query::SingleQuery *single_query_{nullptr};
  /// Contains remaining queries that should form a union with `single_query_`.
  std::vector<memgraph::query::CypherUnion *> cypher_unions_;
  /// Index hint
  /// Suggestion: If we’re going to have multiple pre-query directives (not only index_hints_), they need to be
  /// contained within a dedicated class/struct
  std::vector<memgraph::query::IndexHint> index_hints_;
  /// Memory limit
  memgraph::query::Expression *memory_limit_{nullptr};
  size_t memory_scale_{1024U};
@ -2103,6 +2129,10 @@ class CypherQuery : public memgraph::query::Query, public utils::Visitable<Hiera
    for (auto i5 = 0; i5 < cypher_unions_.size(); ++i5) {
      object->cypher_unions_[i5] = cypher_unions_[i5] ? cypher_unions_[i5]->Clone(storage) : nullptr;
    }
    object->index_hints_.resize(index_hints_.size());
    for (auto i6 = 0; i6 < index_hints_.size(); ++i6) {
      object->index_hints_[i6] = index_hints_[i6].Clone(storage);
    }
    object->memory_limit_ = memory_limit_ ? memory_limit_->Clone(storage) : nullptr;
    object->memory_scale_ = memory_scale_;
    return object;
--- a/src/query/frontend/ast/cypher_main_visitor.cpp
+++ b/src/query/frontend/ast/cypher_main_visitor.cpp
@ -202,6 +202,20 @@ antlrcpp::Any CypherMainVisitor::visitCypherQuery(MemgraphCypher::CypherQueryCon
    cypher_query->cypher_unions_.push_back(std::any_cast<CypherUnion *>(child->accept(this)));
  }
  if (auto *index_hints_ctx = ctx->indexHints()) {
    for (auto *index_hint_ctx : index_hints_ctx->indexHint()) {
      auto label = AddLabel(std::any_cast<std::string>(index_hint_ctx->labelName()->accept(this)));
      if (!index_hint_ctx->propertyKeyName()) {
        cypher_query->index_hints_.emplace_back(IndexHint{.index_type_ = IndexHint::IndexType::LABEL, .label_ = label});
        continue;
      }
      cypher_query->index_hints_.emplace_back(
          IndexHint{.index_type_ = IndexHint::IndexType::LABEL_PROPERTY,
                    .label_ = label,
                    .property_ = std::any_cast<PropertyIx>(index_hint_ctx->propertyKeyName()->accept(this))});
    }
  }
  if (auto *memory_limit_ctx = ctx->queryMemoryLimit()) {
    const auto memory_limit_info = VisitMemoryLimit(memory_limit_ctx->memoryLimit(), this);
    if (memory_limit_info) {
--- a/src/query/frontend/opencypher/grammar/MemgraphCypher.g4
+++ b/src/query/frontend/opencypher/grammar/MemgraphCypher.g4
@ -114,6 +114,7 @@ memgraphCypherKeyword : cypherKeyword
                      | USE
                      | USER
                      | USERS
                      | USING
                      | VERSION
                      | TERMINATE
                      | TRANSACTIONS
@ -151,6 +152,8 @@ query : cypherQuery
      | edgeImportModeQuery
      ;
 // A Cypher query: optional index hints, then a single query, any number of unions and an optional memory limit.
 cypherQuery : ( indexHints )? singleQuery ( cypherUnion )* ( queryMemoryLimit )? ;
 authQuery : createRole
          | dropRole
          | showRoles
@ -209,6 +212,10 @@ updateClause : set
 foreach :  FOREACH '(' variable IN expression '|' updateClause+  ')' ;
 // `USING INDEX` followed by one or more comma-separated index hints.
 indexHints: USING INDEX indexHint ( ',' indexHint )* ;
 // A single hint: `:Label`, optionally followed by a parenthesised property key name, e.g. `:Label(prop)`.
 indexHint: ':' labelName ( '(' propertyKeyName ')' )? ;
 callSubquery : CALL '{' cypherQuery '}' ;
 streamQuery : checkStream
@ -259,9 +266,9 @@ userOrRoleName : symbolicName ;
 createRole : CREATE ROLE role=userOrRoleName ;
-dropRole   : DROP ROLE role=userOrRoleName ;
+dropRole : DROP ROLE role=userOrRoleName ;
-showRoles  : SHOW ROLES ;
+showRoles : SHOW ROLES ;
 createUser : CREATE USER user=userOrRoleName
             ( IDENTIFIED BY password=literal )? ;
@ -347,11 +354,11 @@ showRoleForUser : SHOW ROLE FOR user=userOrRoleName ;
 showUsersForRole : SHOW USERS FOR role=userOrRoleName ;
-dumpQuery: DUMP DATABASE ;
+dumpQuery : DUMP DATABASE ;
-analyzeGraphQuery: ANALYZE GRAPH ( ON LABELS ( listOfColonSymbolicNames | ASTERISK ) ) ? ( DELETE STATISTICS ) ? ;
+analyzeGraphQuery : ANALYZE GRAPH ( ON LABELS ( listOfColonSymbolicNames | ASTERISK ) ) ? ( DELETE STATISTICS ) ? ;
-setReplicationRole  : SET REPLICATION ROLE TO ( MAIN | REPLICA )
+setReplicationRole : SET REPLICATION ROLE TO ( MAIN | REPLICA )
                      ( WITH PORT port=literal ) ? ;
 showReplicationRole : SHOW REPLICATION ROLE ;
@ -365,7 +372,7 @@ registerReplica : REGISTER REPLICA replicaName ( SYNC | ASYNC )
 dropReplica : DROP REPLICA replicaName ;
-showReplicas  : SHOW REPLICAS ;
+showReplicas : SHOW REPLICAS ;
 lockPathQuery : ( LOCK | UNLOCK ) DATA DIRECTORY | DATA DIRECTORY LOCK STATUS;
@ -402,7 +409,7 @@ streamName : symbolicName ;
 symbolicNameWithMinus : symbolicName ( MINUS symbolicName )* ;
-symbolicNameWithDotsAndMinus: symbolicNameWithMinus ( DOT symbolicNameWithMinus )* ;
+symbolicNameWithDotsAndMinus : symbolicNameWithMinus ( DOT symbolicNameWithMinus )* ;
 symbolicTopicNames : symbolicNameWithDotsAndMinus ( COMMA symbolicNameWithDotsAndMinus )* ;
@ -480,6 +487,6 @@ useDatabase : USE DATABASE databaseName ;
 dropDatabase : DROP DATABASE databaseName ;
-showDatabases: SHOW DATABASES ;
+showDatabases : SHOW DATABASES ;
 edgeImportModeQuery : EDGE IMPORT MODE ( ACTIVE | INACTIVE ) ;
--- a/src/query/frontend/opencypher/grammar/MemgraphCypherLexer.g4
+++ b/src/query/frontend/opencypher/grammar/MemgraphCypherLexer.g4
@ -137,5 +137,6 @@ UPDATE                  : U P D A T E ;
 USE                     : U S E ;
 USER                    : U S E R ;
 USERS                   : U S E R S ;
 USING                   : U S I N G ;
 VERSION                 : V E R S I O N ;
 WEBSOCKET               : W E B S O C K E T ;
--- a/src/query/plan/operator.hpp
+++ b/src/query/plan/operator.hpp
@ -1131,8 +1131,12 @@ class Filter : public memgraph::query::plan::LogicalOperator {
  static std::string SingleFilterName(const query::plan::FilterInfo &single_filter) {
    using Type = query::plan::FilterInfo::Type;
    if (single_filter.type == Type::Generic) {
-      return fmt::format("Generic {{{}}}", utils::IterableToString(single_filter.used_symbols, ", ",
+      std::set<std::string> symbol_names;
-                                                                   [](const auto &symbol) { return symbol.name(); }));
+      for (const auto &symbol : single_filter.used_symbols) {
        symbol_names.insert(symbol.name());
      }
      return fmt::format("Generic {{{}}}",
                         utils::IterableToString(symbol_names, ", ", [](const auto &name) { return name; }));
    } else if (single_filter.type == Type::Id) {
      return fmt::format("id({})", single_filter.id_filter->symbol_.name());
    } else if (single_filter.type == Type::Label) {
@ -1140,16 +1144,18 @@ class Filter : public memgraph::query::plan::LogicalOperator {
        LOG_FATAL("Label filters not using LabelsTest are not supported for query inspection!");
      }
      auto filter_expression = static_cast<LabelsTest *>(single_filter.expression);
      std::set<std::string> label_names;
      for (const auto &label : filter_expression->labels_) {
        label_names.insert(label.name);
      }
      if (filter_expression->expression_->GetTypeInfo() != Identifier::kType) {
-        return fmt::format("(:{})", utils::IterableToString(filter_expression->labels_, ":",
+        return fmt::format("(:{})", utils::IterableToString(label_names, ":", [](const auto &name) { return name; }));
                                                            [](const auto &label) { return label.name; }));
      }
      auto identifier_expression = static_cast<Identifier *>(filter_expression->expression_);
-      return fmt::format(
+      return fmt::format("({} :{})", identifier_expression->name_,
-          "({} :{})", identifier_expression->name_,
+                         utils::IterableToString(label_names, ":", [](const auto &name) { return name; }));
          utils::IterableToString(filter_expression->labels_, ":", [](const auto &label) { return label.name; }));
    } else if (single_filter.type == Type::Pattern) {
      return "Pattern";
    } else if (single_filter.type == Type::Property) {
@ -1161,9 +1167,11 @@ class Filter : public memgraph::query::plan::LogicalOperator {
  }
  std::string ToString() const override {
-    return fmt::format("Filter {}", utils::IterableToString(all_filters_, ", ", [](const auto &single_filter) {
+    std::set<std::string> filter_names;
-                         return Filter::SingleFilterName(single_filter);
+    for (const auto &filter : all_filters_) {
-                       }));
+      filter_names.insert(Filter::SingleFilterName(filter));
    }
    return fmt::format("Filter {}", utils::IterableToString(filter_names, ", ", [](const auto &name) { return name; }));
  }
  std::unique_ptr<LogicalOperator> Clone(AstStorage *storage) const override {
--- a/src/query/plan/planner.hpp
+++ b/src/query/plan/planner.hpp
@ -38,14 +38,20 @@ class PostProcessor final {
  Parameters parameters_;
 public:
  IndexHints index_hints_{};
  using ProcessedPlan = std::unique_ptr<LogicalOperator>;
  /// Creates a post-processor without index hints; `index_hints_` keeps its empty default.
  explicit PostProcessor(const Parameters &parameters) : parameters_(parameters) {}
  /// Creates a post-processor that also carries the query's index hints.
  ///
  /// @param parameters query parameters, copied into the post-processor.
  /// @param index_hints hints attached to the query; handed over to the `IndexHints` constructor.
  /// @param db database accessor forwarded to the `IndexHints` constructor.
  template <class TDbAccessor>
  PostProcessor(const Parameters &parameters, std::vector<IndexHint> index_hints, TDbAccessor *db)
      // `index_hints` is already a private copy, so move it on instead of copying it a second time.
      : parameters_(parameters), index_hints_(std::move(index_hints), db) {}
  template <class TPlanningContext>
  std::unique_ptr<LogicalOperator> Rewrite(std::unique_ptr<LogicalOperator> plan, TPlanningContext *context) {
    auto index_lookup_plan =
-        RewriteWithIndexLookup(std::move(plan), context->symbol_table, context->ast_storage, context->db);
+        RewriteWithIndexLookup(std::move(plan), context->symbol_table, context->ast_storage, context->db, index_hints_);
    return RewriteWithJoinRewriter(std::move(index_lookup_plan), context->symbol_table, context->ast_storage,
                                   context->db);
  }
@ -122,7 +128,7 @@ auto MakeLogicalPlan(TPlanningContext *context, TPlanPostProcess *post_process,
 template <class TPlanningContext>
 auto MakeLogicalPlan(TPlanningContext *context, const Parameters &parameters, bool use_variable_planner) {
-  PostProcessor post_processor(parameters);
+  PostProcessor post_processor(parameters, context->query->index_hints_, context->db);
  return MakeLogicalPlan(context, &post_processor, use_variable_planner);
 }
--- a/src/query/plan/rewrite/index_lookup.hpp
+++ b/src/query/plan/rewrite/index_lookup.hpp
@ -32,6 +32,36 @@ DECLARE_int64(query_vertex_count_to_expand_existing);
 namespace memgraph::query::plan {
 /// Holds a given query's index hints after sorting them by type.
 ///
 /// Hints that refer to an index which does not exist in the database are dropped (a debug message is logged), so
 /// both vectors only contain hints backed by an existing index.
 struct IndexHints {
  IndexHints() = default;
  /// Splits `index_hints` into label hints and label+property hints, keeping only those whose index exists.
  ///
  /// @param index_hints hints to classify; their relative order is preserved within each vector.
  /// @param db accessor used to map names to labels/properties and to check whether the hinted index exists.
  template <class TDbAccessor>
  IndexHints(std::vector<IndexHint> index_hints, TDbAccessor *db) {
    for (const auto &index_hint : index_hints) {
      const auto index_type = index_hint.index_type_;
      // Bound by reference: the name is only read, so there is no need to copy it for every hint.
      const auto &label_name = index_hint.label_.name;
      if (index_type == IndexHint::IndexType::LABEL) {
        if (!db->LabelIndexExists(db->NameToLabel(label_name))) {
          spdlog::debug("Index for label {} doesn't exist", label_name);
          continue;
        }
        label_index_hints_.emplace_back(index_hint);
      } else if (index_type == IndexHint::IndexType::LABEL_PROPERTY) {
        if (!index_hint.property_) {
          // A label+property hint without a property cannot name an index; skip it rather than dereference an
          // empty optional.
          continue;
        }
        const auto &property_name = index_hint.property_->name;
        if (!db->LabelPropertyIndexExists(db->NameToLabel(label_name), db->NameToProperty(property_name))) {
          spdlog::debug("Index for label {} and property {} doesn't exist", label_name, property_name);
          continue;
        }
        label_property_index_hints_.emplace_back(index_hint);
      }
    }
  }
  /// Hints of type `LABEL` whose label index exists.
  std::vector<IndexHint> label_index_hints_{};
  /// Hints of type `LABEL_PROPERTY` whose label+property index exists.
  std::vector<IndexHint> label_property_index_hints_{};
 };
 namespace impl {
 struct ExpressionRemovalResult {
@ -43,11 +73,18 @@ struct ExpressionRemovalResult {
 // given expression tree.
 ExpressionRemovalResult RemoveExpressions(Expression *expr, const std::unordered_set<Expression *> &exprs_to_remove);
 /// Hash functor for `std::pair` that combines the hashes of both elements via `utils::HashCombine`.
 struct HashPair {
  template <class TFirst, class TSecond>
  std::size_t operator()(const std::pair<TFirst, TSecond> &key) const {
    const auto &[first, second] = key;
    return utils::HashCombine<TFirst, TSecond>{}(first, second);
  }
 };
 template <class TDbAccessor>
 class IndexLookupRewriter final : public HierarchicalLogicalOperatorVisitor {
 public:
-  IndexLookupRewriter(SymbolTable *symbol_table, AstStorage *ast_storage, TDbAccessor *db)
+  IndexLookupRewriter(SymbolTable *symbol_table, AstStorage *ast_storage, TDbAccessor *db, IndexHints index_hints)
-      : symbol_table_(symbol_table), ast_storage_(ast_storage), db_(db) {}
+      : symbol_table_(symbol_table), ast_storage_(ast_storage), db_(db), index_hints_(index_hints) {}
  using HierarchicalLogicalOperatorVisitor::PostVisit;
  using HierarchicalLogicalOperatorVisitor::PreVisit;
@ -535,6 +572,7 @@ class IndexLookupRewriter final : public HierarchicalLogicalOperatorVisitor {
  // Expressions which no longer need a plain Filter operator.
  std::unordered_set<Expression *> filter_exprs_for_removal_;
  std::vector<LogicalOperator *> prev_ops_;
  IndexHints index_hints_;
  // additional symbols that are present from other non-main branches but have influence on indexing
  std::unordered_set<Symbol> additional_bound_symbols_;
@ -575,7 +613,7 @@ class IndexLookupRewriter final : public HierarchicalLogicalOperatorVisitor {
  }
  void RewriteBranch(std::shared_ptr<LogicalOperator> *branch) {
-    IndexLookupRewriter<TDbAccessor> rewriter(symbol_table_, ast_storage_, db_);
+    IndexLookupRewriter<TDbAccessor> rewriter(symbol_table_, ast_storage_, db_, index_hints_);
    (*branch)->Accept(rewriter);
    if (rewriter.new_root_) {
      *branch = rewriter.new_root_;
@ -588,6 +626,13 @@ class IndexLookupRewriter final : public HierarchicalLogicalOperatorVisitor {
  std::optional<LabelIx> FindBestLabelIndex(const std::unordered_set<LabelIx> &labels) {
    MG_ASSERT(!labels.empty(), "Trying to find the best label without any labels.");
    for (const auto &[index_type, label, _] : index_hints_.label_index_hints_) {
      if (labels.contains(label)) {
        return label;
      }
    }
    std::optional<LabelIx> best_label;
    for (const auto &label : labels) {
      if (!db_->LabelIndexExists(GetLabel(label))) continue;
@ -600,13 +645,12 @@ class IndexLookupRewriter final : public HierarchicalLogicalOperatorVisitor {
    return best_label;
  }
-  // Finds the label-property combination. The first criteria based on number of vertices indexed -> if one index has
+  struct CandidateIndices {
-  // 10x less than the other one, always choose the smaller one. Otherwise, choose the index with smallest average
+    std::vector<std::pair<IndexHint, FilterInfo>> candidate_indices_{};
-  // group size based on key distribution. If average group size is equal, choose the index that has distribution
+    std::unordered_map<std::pair<LabelIx, PropertyIx>, FilterInfo, HashPair> candidate_index_lookup_{};
-  // closer to uniform distribution. Conditions based on average group size and key distribution can be only taken
+  };
-  // into account if the user has run `ANALYZE GRAPH` query before If the index cannot be found, nullopt is returned.
+
-  std::optional<LabelPropertyIndex> FindBestLabelPropertyIndex(const Symbol &symbol,
+  CandidateIndices GetCandidateIndices(const Symbol &symbol, const std::unordered_set<Symbol> &bound_symbols) {
                                                               const std::unordered_set<Symbol> &bound_symbols) {
    auto are_bound = [&bound_symbols](const auto &used_symbols) {
      for (const auto &used_symbol : used_symbols) {
        if (!utils::Contains(bound_symbols, used_symbol)) {
@ -616,6 +660,39 @@ class IndexLookupRewriter final : public HierarchicalLogicalOperatorVisitor {
      return true;
    };
    std::vector<std::pair<IndexHint, FilterInfo>> candidate_indices{};
    std::unordered_map<std::pair<LabelIx, PropertyIx>, FilterInfo, HashPair> candidate_index_lookup{};
    for (const auto &label : filters_.FilteredLabels(symbol)) {
      for (const auto &filter : filters_.PropertyFilters(symbol)) {
        if (filter.property_filter->is_symbol_in_value_ || !are_bound(filter.used_symbols)) {
          // Skip filter expressions which use the symbol whose property we are
          // looking up or aren't bound. We cannot scan by such expressions. For
          // example, in `n.a = 2 + n.b` both sides of `=` refer to `n`, so we
          // cannot scan `n` by property index.
          continue;
        }
        const auto &property = filter.property_filter->property_;
        if (!db_->LabelPropertyIndexExists(GetLabel(label), GetProperty(property))) {
          continue;
        }
        candidate_indices.emplace_back(std::make_pair(
            IndexHint{.index_type_ = IndexHint::IndexType::LABEL_PROPERTY, .label_ = label, .property_ = property},
            filter));
        candidate_index_lookup.insert({std::make_pair(label, property), filter});
      }
    }
    return CandidateIndices{.candidate_indices_ = candidate_indices, .candidate_index_lookup_ = candidate_index_lookup};
  }
  // Finds the best label-property combination. The first criterion is the number of indexed vertices: if one index
  // has 10x fewer vertices than the other one, always choose the smaller one. Otherwise, choose the index with the
  // smallest average group size based on key distribution. If the average group sizes are equal, choose the index
  // whose distribution is closer to uniform. Conditions based on average group size and key distribution can only be
  // taken into account if the user has run an `ANALYZE GRAPH` query beforehand. If no index can be found, nullopt is
  // returned.
  std::optional<LabelPropertyIndex> FindBestLabelPropertyIndex(const Symbol &symbol,
                                                               const std::unordered_set<Symbol> &bound_symbols) {
    /*
     * Comparator function between two indices. If new index has >= 10x vertices than the existing, it cannot be
     * better. If it is <= 10x in number of vertices, check average group size of property values. The index with
@ -640,54 +717,59 @@ class IndexLookupRewriter final : public HierarchicalLogicalOperatorVisitor {
      return utils::CompareDecimal(new_stats->statistic, found->index_stats->statistic);
    };
    auto [candidate_indices, candidate_index_lookup] = GetCandidateIndices(symbol, bound_symbols);
    for (const auto &[index_type, label, maybe_property] : index_hints_.label_property_index_hints_) {
      auto property = *maybe_property;
      if (candidate_index_lookup.contains(std::make_pair(label, property))) {
        return LabelPropertyIndex{.label = label,
                                  .filter = candidate_index_lookup.at(std::make_pair(label, property)),
                                  .vertex_count = std::numeric_limits<std::int64_t>::max()};
      }
    }
    std::optional<LabelPropertyIndex> found;
-    for (const auto &label : filters_.FilteredLabels(symbol)) {
+    // for (const auto &[label_and_property, filter] : candidate_indices) {
-      for (const auto &filter : filters_.PropertyFilters(symbol)) {
+    //   const auto &[label, property] = label_and_property;
-        if (filter.property_filter->is_symbol_in_value_ || !are_bound(filter.used_symbols)) {
+    for (const auto &[candidate, filter] : candidate_indices) {
-          // Skip filter expressions which use the symbol whose property we are
+      const auto &[_, label, maybe_property] = candidate;
-          // looking up or aren't bound. We cannot scan by such expressions. For
+      auto property = *maybe_property;
          // example, in `n.a = 2 + n.b` both sides of `=` refer to `n`, so we
          // cannot scan `n` by property index.
          continue;
        }
        const auto &property = filter.property_filter->property_;
        if (!db_->LabelPropertyIndexExists(GetLabel(label), GetProperty(property))) {
          continue;
        }
        auto is_better_type = [&found](PropertyFilter::Type type) {
          // Order the types by the most preferred index lookup type.
          static const PropertyFilter::Type kFilterTypeOrder[] = {
              PropertyFilter::Type::EQUAL, PropertyFilter::Type::RANGE, PropertyFilter::Type::REGEX_MATCH};
          auto *found_sort_ix = std::find(kFilterTypeOrder, kFilterTypeOrder + 3, found->filter.property_filter->type_);
          auto *type_sort_ix = std::find(kFilterTypeOrder, kFilterTypeOrder + 3, type);
          return type_sort_ix < found_sort_ix;
        };
-        int64_t vertex_count = db_->VerticesCount(GetLabel(label), GetProperty(property));
+      auto is_better_type = [&found](PropertyFilter::Type type) {
-        std::optional<storage::LabelPropertyIndexStats> new_stats =
+        // Order the types by the most preferred index lookup type.
-            db_->GetIndexStats(GetLabel(label), GetProperty(property));
+        static const PropertyFilter::Type kFilterTypeOrder[] = {
            PropertyFilter::Type::EQUAL, PropertyFilter::Type::RANGE, PropertyFilter::Type::REGEX_MATCH};
        auto *found_sort_ix = std::find(kFilterTypeOrder, kFilterTypeOrder + 3, found->filter.property_filter->type_);
        auto *type_sort_ix = std::find(kFilterTypeOrder, kFilterTypeOrder + 3, type);
        return type_sort_ix < found_sort_ix;
      };
-        // Conditions, from more to less important:
+      // Conditions, from more to less important:
-        // the index with 10x less vertices is better.
+      // the index with 10x less vertices is better.
-        // the index with smaller average group size is better.
+      // the index with smaller average group size is better.
-        // the index with equal avg group size and distribution closer to the uniform is better.
+      // the index with equal avg group size and distribution closer to the uniform is better.
-        // the index with less vertices is better.
+      // the index with less vertices is better.
-        // the index with same number of vertices but more optimized filter is better.
+      // the index with same number of vertices but more optimized filter is better.
        if (!found || vertex_count * 10 < found->vertex_count) {
          found = LabelPropertyIndex{label, filter, vertex_count, new_stats};
          continue;
        }
-        if (int cmp_res = compare_indices(found, new_stats, vertex_count);
+      int64_t vertex_count = db_->VerticesCount(GetLabel(label), GetProperty(property));
-            cmp_res == -1 ||
+      std::optional<storage::LabelPropertyIndexStats> new_stats =
-            cmp_res == 0 && (found->vertex_count > vertex_count ||
+          db_->GetIndexStats(GetLabel(label), GetProperty(property));
-                             found->vertex_count == vertex_count && is_better_type(filter.property_filter->type_))) {
+
-          found = LabelPropertyIndex{label, filter, vertex_count, new_stats};
+      if (!found || vertex_count * 10 < found->vertex_count) {
-        }
+        found = LabelPropertyIndex{label, filter, vertex_count, new_stats};
        continue;
      }
      if (int cmp_res = compare_indices(found, new_stats, vertex_count);
          cmp_res == -1 ||
          cmp_res == 0 && (found->vertex_count > vertex_count ||
                           found->vertex_count == vertex_count && is_better_type(filter.property_filter->type_))) {
        found = LabelPropertyIndex{label, filter, vertex_count, new_stats};
      }
    }
    return found;
  }
  // Creates a ScanAll by the best possible index for the `node_symbol`. If the node
  // does not have at least a label, no indexed lookup can be created and
  // `nullptr` is returned. The operator is chained after `input`. Optional
@ -798,8 +880,8 @@ class IndexLookupRewriter final : public HierarchicalLogicalOperatorVisitor {
 template <class TDbAccessor>
 std::unique_ptr<LogicalOperator> RewriteWithIndexLookup(std::unique_ptr<LogicalOperator> root_op,
                                                        SymbolTable *symbol_table, AstStorage *ast_storage,
-                                                        TDbAccessor *db) {
+                                                        TDbAccessor *db, IndexHints index_hints) {
-  impl::IndexLookupRewriter<TDbAccessor> rewriter(symbol_table, ast_storage, db);
+  impl::IndexLookupRewriter<TDbAccessor> rewriter(symbol_table, ast_storage, db, index_hints);
  root_op->Accept(rewriter);
  if (rewriter.new_root_) {
    // This shouldn't happen in real use case, because IndexLookupRewriter
--- a/tests/e2e/CMakeLists.txt
+++ b/tests/e2e/CMakeLists.txt
@ -66,6 +66,7 @@ add_subdirectory(concurrent_query_modules)
 add_subdirectory(show_index_info)
 add_subdirectory(set_properties)
 add_subdirectory(transaction_rollback)
 add_subdirectory(index_hints)
 add_subdirectory(query_modules)
 add_subdirectory(constraints)
--- a/tests/e2e/disk_storage/workloads.yaml
+++ b/tests/e2e/disk_storage/workloads.yaml
@ -1,7 +1,7 @@
 disk_storage: &disk_storage
  cluster:
    main:
-      args: ["--bolt-port", "7687", "--log-level", "TRACE", "--memory-limit", "125"]
+      args: ["--bolt-port", "7687", "--log-level", "TRACE", "--memory-limit", "150"]
      log_file: "disk_storage.log"
      setup_queries: []
      validation_queries: []
--- a/tests/e2e/index_hints/CMakeLists.txt
+++ b/tests/e2e/index_hints/CMakeLists.txt
@ -0,0 +1,6 @@
 # Forwards FILE_NAME to copy_e2e_python_files with `index_hints` as the first argument
 # (presumably the name of this e2e suite's directory; confirm against copy_e2e_python_files).
 function(copy_index_hints_e2e_python_files FILE_NAME)
    copy_e2e_python_files(index_hints ${FILE_NAME})
 endfunction()
 copy_index_hints_e2e_python_files(common.py)
 copy_index_hints_e2e_python_files(index_hints.py)
--- a/tests/e2e/index_hints/common.py
+++ b/tests/e2e/index_hints/common.py
@ -0,0 +1,45 @@
 # Copyright 2023 Memgraph Ltd.
 #
 # Use of this software is governed by the Business Source License
 # included in the file licenses/BSL.txt; by using this file, you agree to be bound by the terms of the Business Source
 # License, and you may not use this file except in compliance with the Business Source License.
 #
 # As of the Change Date specified in that file, in accordance with
 # the Business Source License, use of this software will be governed
 # by the Apache License, Version 2.0, included in the file
 # licenses/APL.txt.
 import typing
 import mgclient
 import pytest
 from gqlalchemy import Memgraph
 def execute_and_fetch_all(
    cursor: "mgclient.Cursor", query: str, params: typing.Optional[dict] = None
 ) -> typing.List[tuple]:
    """Run `query` on `cursor` and return every row it produces.

    Args:
        cursor: cursor to execute the query on.
        query: query text.
        params: query parameters; when omitted, a fresh empty dict is passed to the cursor.

    Returns:
        Whatever `cursor.fetchall()` returns for the executed query.
    """
    # A new dict per call avoids sharing one mutable default object between all invocations.
    cursor.execute(query, {} if params is None else params)
    return cursor.fetchall()
@pytest.fixture
def connect(**kwargs) -> mgclient.Connection:
    """Yield an autocommit connection to the local instance after resetting its state.

    Before the test runs, the fixture switches to the `memgraph` database, tries to drop the `clean` database and
    deletes all nodes. The connection is closed once the test has finished.
    """
    connection = mgclient.connect(host="localhost", port=7687, **kwargs)
    connection.autocommit = True
    cursor = connection.cursor()
    execute_and_fetch_all(cursor, "USE DATABASE memgraph")
    try:
        execute_and_fetch_all(cursor, "DROP DATABASE clean")
    except Exception:
        # Best effort: the database may simply not exist. Unlike a bare `except`, this still lets
        # KeyboardInterrupt and SystemExit propagate.
        pass
    execute_and_fetch_all(cursor, "MATCH (n) DETACH DELETE n")
    yield connection
    # Teardown: release the connection instead of leaking it after every test.
    connection.close()
@pytest.fixture
def memgraph(**kwargs) -> Memgraph:
    """Yield a `Memgraph` client; after the test, drop the database contents and then the indexes."""
    client = Memgraph()
    yield client
    client.drop_database()
    client.drop_indexes()
--- a/tests/e2e/index_hints/index_hints.py
+++ b/tests/e2e/index_hints/index_hints.py
@ -0,0 +1,479 @@
 # Copyright 2023 Memgraph Ltd.
 #
 # Use of this software is governed by the Business Source License
 # included in the file licenses/BSL.txt; by using this file, you agree to be bound by the terms of the Business Source
 # License, and you may not use this file except in compliance with the Business Source License.
 #
 # As of the Change Date specified in that file, in accordance with
 # the Business Source License, use of this software will be governed
 # by the Apache License, Version 2.0, included in the file
 # licenses/APL.txt.
 import sys
 import mgclient
 import pytest
 from common import memgraph
 def test_label_index_hint(memgraph):
    memgraph.execute("FOREACH (i IN range(1, 50) | CREATE (n:Label1:Label2 {id: i}));")
    memgraph.execute("FOREACH (i IN range(1, 10) | CREATE (n:Label2 {id: i+50}));")
    memgraph.execute("CREATE INDEX ON :Label1;")
    memgraph.execute("CREATE INDEX ON :Label2;")
    expected_explain_no_hint = [
        " * Produce {n}",
        " * Filter (n :Label1:Label2)",
        " * ScanAllByLabel (n :Label1)",
        " * Once",
    ]
    expected_explain_with_hint = [row.replace("(n :Label1)", "(n :Label2)") for row in expected_explain_no_hint]
    explain_no_hint = [
        row["QUERY PLAN"] for row in memgraph.execute_and_fetch("EXPLAIN MATCH (n:Label1:Label2) RETURN n;")
    ]
    explain_with_hint = [
        row["QUERY PLAN"]
        for row in memgraph.execute_and_fetch("EXPLAIN USING INDEX :Label2 MATCH (n:Label1:Label2) RETURN n;")
    ]
    assert explain_no_hint == expected_explain_no_hint and explain_with_hint == expected_explain_with_hint
 def test_label_index_hint_alternative_orderings(memgraph):
    memgraph.execute("FOREACH (i IN range(1, 50) | CREATE (n:Label1:Label2:Label3 {id: i}));")
    memgraph.execute("FOREACH (i IN range(1, 10) | CREATE (n:Label2 {id: i+50}));")
    memgraph.execute("CREATE INDEX ON :Label1;")
    memgraph.execute("CREATE INDEX ON :Label2;")
    expected_explain_with_hint = [
        " * Produce {n}",
        " * Filter (n :Label1:Label2)",
        " * ScanAllByLabel (n :Label2)",
        " * Once",
    ]
    expected_explain_with_hint_ordering_3 = expected_explain_with_hint[:]
    expected_explain_with_hint_ordering_3[1] = " * Filter (n :Label1:Label2:Label3)"  # since it matches 3 labels
    explain_with_hint_ordering_1 = [
        row["QUERY PLAN"]
        for row in memgraph.execute_and_fetch("EXPLAIN USING INDEX :Label2 MATCH (n:Label1:Label2) RETURN n;")
    ]
    explain_with_hint_ordering_2 = [
        row["QUERY PLAN"]
        for row in memgraph.execute_and_fetch("EXPLAIN USING INDEX :Label2 MATCH (n:Label2:Label1) RETURN n;")
    ]
    explain_with_hint_ordering_3 = [
        row["QUERY PLAN"]
        for row in memgraph.execute_and_fetch("EXPLAIN USING INDEX :Label2 MATCH (n:Label3:Label2:Label1) RETURN n;")
    ]
    assert (
        expected_explain_with_hint == explain_with_hint_ordering_1 == explain_with_hint_ordering_2
        and expected_explain_with_hint_ordering_3 == explain_with_hint_ordering_3
    )
 def test_multiple_label_index_hints(memgraph):
    memgraph.execute("FOREACH (i IN range(1, 50) | CREATE (n:Label1:Label2 {id: i}));")
    memgraph.execute("FOREACH (i IN range(1, 10) | CREATE (n:Label2 {id: i+50}));")
    memgraph.execute("CREATE INDEX ON :Label0;")
    memgraph.execute("CREATE INDEX ON :Label2;")
    expected_explain_with_hint = [
        " * Produce {n}",
        " * Filter (n :Label1:Label2)",
        " * ScanAllByLabel (n :Label2)",
        " * Once",
    ]
    explain_with_hint = [
        row["QUERY PLAN"]
        for row in memgraph.execute_and_fetch("EXPLAIN USING INDEX :Label0, :Label2 MATCH (n:Label1:Label2) RETURN n;")
    ]
    assert explain_with_hint == expected_explain_with_hint
 def test_multiple_applicable_label_index_hints(memgraph):
    # Out of all applicable index hints, the first one given in the query should be used
    memgraph.execute("FOREACH (i IN range(1, 50) | CREATE (n:Label1:Label2:Label3 {id: i}));")
    memgraph.execute("CREATE INDEX ON :Label1;")
    memgraph.execute("CREATE INDEX ON :Label2;")
    memgraph.execute("CREATE INDEX ON :Label3;")
    expected_explain_with_hint = [
        " * Produce {n}",
        " * Filter (n :Label2:Label3)",
        " * ScanAllByLabel (n :Label3)",
        " * Once",
    ]
    explain_with_hint = [
        row["QUERY PLAN"]
        for row in memgraph.execute_and_fetch("EXPLAIN USING INDEX :Label3, :Label2 MATCH (n:Label2:Label3) RETURN n;")
    ]
    assert explain_with_hint == expected_explain_with_hint
 def test_multiple_applicable_label_index_hints_alternative_orderings(memgraph):
    # Out of all applicable index hints, the first one given in the query should be used
    memgraph.execute("FOREACH (i IN range(1, 50) | CREATE (n:Label1:Label2:Label3 {id: i}));")
    memgraph.execute("CREATE INDEX ON :Label1;")
    memgraph.execute("CREATE INDEX ON :Label2;")
    memgraph.execute("CREATE INDEX ON :Label3;")
    expected_explain_with_hint_1 = [
        " * Produce {n}",
        " * Filter (n :Label2:Label3)",
        " * ScanAllByLabel (n :Label3)",
        " * Once",
    ]
    expected_explain_with_hint_2 = [row.replace("(n :Label3)", "(n :Label2)") for row in expected_explain_with_hint_1]
    explain_with_hint_ordering_1a = [
        row["QUERY PLAN"]
        for row in memgraph.execute_and_fetch("EXPLAIN USING INDEX :Label3, :Label2 MATCH (n:Label2:Label3) RETURN n;")
    ]
    explain_with_hint_ordering_1b = [
        row["QUERY PLAN"]
        for row in memgraph.execute_and_fetch("EXPLAIN USING INDEX :Label3, :Label2 MATCH (n:Label3:Label2) RETURN n;")
    ]
    explain_with_hint_ordering_2a = [
        row["QUERY PLAN"]
        for row in memgraph.execute_and_fetch("EXPLAIN USING INDEX :Label2, :Label3 MATCH (n:Label2:Label3) RETURN n;")
    ]
    explain_with_hint_ordering_2b = [
        row["QUERY PLAN"]
        for row in memgraph.execute_and_fetch("EXPLAIN USING INDEX :Label2, :Label3 MATCH (n:Label3:Label2) RETURN n;")
    ]
    assert (expected_explain_with_hint_1 == explain_with_hint_ordering_1a == explain_with_hint_ordering_1b) and (
        expected_explain_with_hint_2 == explain_with_hint_ordering_2a == explain_with_hint_ordering_2b
    )
 def test_label_property_index_hint(memgraph):
    memgraph.execute("FOREACH (i IN range(1, 100) | CREATE (n:Label {id1: i}));")
    memgraph.execute("FOREACH (i IN range(1, 50) | CREATE (n:Label {id2: i % 5}));")
    memgraph.execute("CREATE INDEX ON :Label(id1);")
    memgraph.execute("CREATE INDEX ON :Label(id2);")
    expected_explain_no_hint = [
        " * Produce {n}",
        " * Filter (n :Label), {n.id1}, {n.id2}",
        " * ScanAllByLabelPropertyValue (n :Label {id2})",
        " * Once",
    ]
    expected_explain_with_hint = [
        row.replace("(n :Label {id2})", "(n :Label {id1})") for row in expected_explain_no_hint
    ]
    explain_no_hint = [
        row["QUERY PLAN"]
        for row in memgraph.execute_and_fetch("EXPLAIN MATCH (n:Label) WHERE n.id2 = 3 AND n.id1 = 3 RETURN n;")
    ]
    explain_with_hint = [
        row["QUERY PLAN"]
        for row in memgraph.execute_and_fetch(
            "EXPLAIN USING INDEX :Label(id1) MATCH (n:Label) WHERE n.id2 = 3 AND n.id1 = 3 RETURN n;"
        )
    ]
    assert explain_no_hint == expected_explain_no_hint and explain_with_hint == expected_explain_with_hint
 def test_label_property_index_hint_alternative_orderings(memgraph):
    memgraph.execute("FOREACH (i IN range(1, 100) | CREATE (n:Label {id1: i}));")
    memgraph.execute("FOREACH (i IN range(1, 50) | CREATE (n:Label {id2: i % 5}));")
    memgraph.execute("CREATE INDEX ON :Label(id1);")
    memgraph.execute("CREATE INDEX ON :Label(id2);")
    expected_explain_with_hint = [
        " * Produce {n}",
        " * Filter (n :Label), {n.id1}, {n.id2}",
        " * ScanAllByLabelPropertyValue (n :Label {id1})",
        " * Once",
    ]
    explain_with_hint_ordering_1 = [
        row["QUERY PLAN"]
        for row in memgraph.execute_and_fetch(
            "EXPLAIN USING INDEX :Label(id1) MATCH (n:Label) WHERE n.id2 = 3 AND n.id1 = 3 RETURN n;"
        )
    ]
    explain_with_hint_ordering_2 = [
        row["QUERY PLAN"]
        for row in memgraph.execute_and_fetch(
            "EXPLAIN USING INDEX :Label(id1) MATCH (n:Label) WHERE n.id1 = 3 AND n.id2 = 3 RETURN n;"
        )
    ]
    assert expected_explain_with_hint == explain_with_hint_ordering_1 == explain_with_hint_ordering_2
 def test_multiple_label_property_index_hints(memgraph):
    memgraph.execute("FOREACH (i IN range(1, 100) | CREATE (n:Label {id1: i}));")
    memgraph.execute("FOREACH (i IN range(1, 50) | CREATE (n:Label {id2: i % 5}));")
    memgraph.execute("CREATE INDEX ON :Label(id0);")
    memgraph.execute("CREATE INDEX ON :Label(id1);")
    expected_explain_with_hint = [
        " * Produce {n}",
        " * Filter (n :Label), {n.id1}, {n.id2}",
        " * ScanAllByLabelPropertyValue (n :Label {id1})",
        " * Once",
    ]
    explain_with_hint = [
        row["QUERY PLAN"]
        for row in memgraph.execute_and_fetch(
            "EXPLAIN USING INDEX :Label(id0), :Label(id1) MATCH (n:Label) WHERE n.id2 = 3 AND n.id1 = 3 RETURN n;"
        )
    ]
    explain_with_hint_alternative_ordering = [
        row["QUERY PLAN"]
        for row in memgraph.execute_and_fetch(
            "EXPLAIN USING INDEX :Label(id0), :Label(id1) MATCH (n:Label) WHERE n.id1 = 3 AND n.id2 = 3 RETURN n;"
        )
    ]
    assert explain_with_hint == expected_explain_with_hint == explain_with_hint_alternative_ordering
 def test_multiple_applicable_label_property_index_hints(memgraph):
    # Out of all applicable index hints, the first one given in the query should be used
    memgraph.execute("FOREACH (i IN range(1, 100) | CREATE (n:Label {id1: i}));")
    memgraph.execute("FOREACH (i IN range(1, 50) | CREATE (n:Label {id2: i % 5}));")
    memgraph.execute("CREATE INDEX ON :Label(id1);")
    memgraph.execute("CREATE INDEX ON :Label(id2);")
    expected_explain_with_hint = [
        " * Produce {n}",
        " * Filter (n :Label), {n.id1}, {n.id2}",
        " * ScanAllByLabelPropertyValue (n :Label {id1})",
        " * Once",
    ]
    explain_with_hint = [
        row["QUERY PLAN"]
        for row in memgraph.execute_and_fetch(
            "EXPLAIN USING INDEX :Label(id1), :Label(id2) MATCH (n:Label) WHERE n.id2 = 3 AND n.id1 = 3 RETURN n;"
        )
    ]
    assert explain_with_hint == expected_explain_with_hint
 def test_multiple_applicable_label_property_index_hints_alternative_orderings(memgraph):
    # Out of all applicable index hints, the first one given in the query should be used
    memgraph.execute("FOREACH (i IN range(1, 100) | CREATE (n:Label {id1: i}));")
    memgraph.execute("FOREACH (i IN range(1, 50) | CREATE (n:Label {id2: i % 5}));")
    memgraph.execute("CREATE INDEX ON :Label(id1);")
    memgraph.execute("CREATE INDEX ON :Label(id2);")
    expected_explain_with_hint_1 = [
        " * Produce {n}",
        " * Filter (n :Label), {n.id1}, {n.id2}",
        " * ScanAllByLabelPropertyValue (n :Label {id1})",
        " * Once",
    ]
    expected_explain_with_hint_2 = [
        row.replace("(n :Label {id1})", "(n :Label {id2})") for row in expected_explain_with_hint_1
    ]
    explain_with_hint_ordering_1a = [
        row["QUERY PLAN"]
        for row in memgraph.execute_and_fetch(
            "EXPLAIN USING INDEX :Label(id1), :Label(id2) MATCH (n:Label) WHERE n.id2 = 3 AND n.id1 = 3 RETURN n;"
        )
    ]
    explain_with_hint_ordering_1b = [
        row["QUERY PLAN"]
        for row in memgraph.execute_and_fetch(
            "EXPLAIN USING INDEX :Label(id1), :Label(id2) MATCH (n:Label) WHERE n.id1 = 3 AND n.id2 = 3 RETURN n;"
        )
    ]
    explain_with_hint_ordering_2a = [
        row["QUERY PLAN"]
        for row in memgraph.execute_and_fetch(
            "EXPLAIN USING INDEX :Label(id2), :Label(id1) MATCH (n:Label) WHERE n.id2 = 3 AND n.id1 = 3 RETURN n;"
        )
    ]
    explain_with_hint_ordering_2b = [
        row["QUERY PLAN"]
        for row in memgraph.execute_and_fetch(
            "EXPLAIN USING INDEX :Label(id2), :Label(id1) MATCH (n:Label) WHERE n.id1 = 3 AND n.id2 = 3 RETURN n;"
        )
    ]
    assert (expected_explain_with_hint_1 == explain_with_hint_ordering_1a == explain_with_hint_ordering_1b) and (
        expected_explain_with_hint_2 == explain_with_hint_ordering_2a == explain_with_hint_ordering_2b
    )
 def test_union_applicable_in_left_branch(memgraph):
    memgraph.execute("FOREACH (i IN range(1, 50) | CREATE (n:Label1:Label2 {id: i}));")
    memgraph.execute("FOREACH (i IN range(1, 10) | CREATE (n:Label2 {id: i+50}));")
    memgraph.execute("CREATE INDEX ON :Label1;")
    memgraph.execute("CREATE INDEX ON :Label2;")
    expected_explain_with_hint = [
        " * Distinct",
        " * Union {n : n}",
        " |\\ ",
        " | * Produce {n}",
        " | * ScanAllByLabel (n :Label2)",
        " | * Once",
        " * Produce {n}",
        " * ScanAllByLabel (n :Label1)",
        " * Once",
    ]
    explain_with_hint = [
        row["QUERY PLAN"]
        for row in memgraph.execute_and_fetch(
            "EXPLAIN USING INDEX :Label1 MATCH (n:Label1) RETURN n UNION MATCH (n:Label2) RETURN n;"
        )
    ]
    assert explain_with_hint == expected_explain_with_hint
 def test_union_applicable_in_right_branch(memgraph):
    memgraph.execute("FOREACH (i IN range(1, 50) | CREATE (n:Label1:Label2 {id: i}));")
    memgraph.execute("FOREACH (i IN range(1, 10) | CREATE (n:Label2 {id: i+50}));")
    memgraph.execute("CREATE INDEX ON :Label1;")
    memgraph.execute("CREATE INDEX ON :Label2;")
    expected_explain_with_hint = [
        " * Distinct",
        " * Union {n : n}",
        " |\\ ",
        " | * Produce {n}",
        " | * ScanAllByLabel (n :Label1)",
        " | * Once",
        " * Produce {n}",
        " * ScanAllByLabel (n :Label2)",
        " * Once",
    ]
    explain_with_hint = [
        row["QUERY PLAN"]
        for row in memgraph.execute_and_fetch(
            "EXPLAIN USING INDEX :Label1 MATCH (n:Label2) RETURN n UNION MATCH (n:Label1) RETURN n;"
        )
    ]
    assert explain_with_hint == expected_explain_with_hint
 def test_union_applicable_in_both_branches(memgraph):
    memgraph.execute("FOREACH (i IN range(1, 50) | CREATE (n:Label1:Label2:Label3 {id: i}));")
    memgraph.execute("FOREACH (i IN range(1, 10) | CREATE (n:Label1:Label2 {id: i+50}));")
    memgraph.execute("CREATE INDEX ON :Label1;")
    memgraph.execute("CREATE INDEX ON :Label2;")
    memgraph.execute("CREATE INDEX ON :Label3;")
    expected_explain_with_hint = [
        " * Distinct",
        " * Union {n : n}",
        " |\\ ",
        " | * Produce {n}",
        " | * Filter (n :Label2:Label3)",
        " | * ScanAllByLabel (n :Label2)",
        " | * Once",
        " * Produce {n}",
        " * Filter (n :Label1:Label2)",
        " * ScanAllByLabel (n :Label1)",
        " * Once",
    ]
    explain_with_hint = [
        row["QUERY PLAN"]
        for row in memgraph.execute_and_fetch(
            "EXPLAIN USING INDEX :Label1, :Label2 MATCH (n:Label1:Label2) RETURN n UNION MATCH (n:Label2:Label3) RETURN n;"
        )
    ]
    assert explain_with_hint == expected_explain_with_hint
 def test_multiple_match_query(memgraph):
    memgraph.execute("FOREACH (i IN range(1, 50) | CREATE (n:Label1:Label2:Label3 {id: i}));")
    memgraph.execute("FOREACH (i IN range(1, 10) | CREATE (n:Label1:Label2 {id: i+50}));")
    memgraph.execute("CREATE INDEX ON :Label1;")
    memgraph.execute("CREATE INDEX ON :Label2;")
    memgraph.execute("CREATE INDEX ON :Label3;")
    expected_explain_with_hint = [
        " * Produce {n, m}",
        " * Cartesian {m : n}",
        " |\\ ",
        " | * Filter (n :Label1:Label2), {n.id}",
        " | * ScanAllByLabel (n :Label1)",
        " | * Once",
        " * Filter (m :Label2:Label3), (n :Label1:Label2), {n.id}",
        " * ScanAllByLabel (m :Label2)",
        " * Once",
    ]
    explain_with_hint = [
        row["QUERY PLAN"]
        for row in memgraph.execute_and_fetch(
            "EXPLAIN USING INDEX :Label1, :Label2  MATCH (n:Label1:Label2) WHERE n.id = 1 MATCH (m:Label2:Label3) return n, m;"
        )
    ]
    assert explain_with_hint == expected_explain_with_hint
 def test_nonexistent_label_index(memgraph):
    # In case of hinting at a nonexistent index, the query should execute without exceptions, and its output should be
    # the same as without that hint
    memgraph.execute("FOREACH (i IN range(1, 50) | CREATE (n:Label1:Label2 {id: i}));")
    memgraph.execute("FOREACH (i IN range(1, 10) | CREATE (n:Label2 {id: i+50}));")
    memgraph.execute("CREATE INDEX ON :Label1;")
    try:
        explain_no_hint = [
            row["QUERY PLAN"] for row in memgraph.execute_and_fetch("EXPLAIN MATCH (n:Label1:Label2) RETURN n;")
        ]
        explain_with_hint = [
            row["QUERY PLAN"]
            for row in memgraph.execute_and_fetch("EXPLAIN USING INDEX :Label2 MATCH (n:Label1:Label2) RETURN n;")
        ]
        assert explain_with_hint == explain_no_hint
    except mgclient.DatabaseError:
        assert False
 def test_nonexistent_label_property_index(memgraph):
    # In case of hinting at a nonexistent index, the query should execute without exceptions, and its output should be
    # the same as without that hint
    memgraph.execute("FOREACH (i IN range(1, 100) | CREATE (n:Label {id1: i}));")
    memgraph.execute("FOREACH (i IN range(1, 50) | CREATE (n:Label {id2: i % 5}));")
    memgraph.execute("CREATE INDEX ON :Label(id2);")
    try:
        explain_no_hint = [
            row["QUERY PLAN"] for row in memgraph.execute_and_fetch("EXPLAIN MATCH (n:Label1:Label2) RETURN n;")
        ]
        explain_with_hint = [
            row["QUERY PLAN"]
            for row in memgraph.execute_and_fetch("EXPLAIN USING INDEX :Label(id1) MATCH (n:Label1:Label2) RETURN n;")
        ]
        assert explain_with_hint == explain_no_hint
    except mgclient.DatabaseError:
        assert False
 if __name__ == "__main__":
    # When run directly, hand this file to pytest ("-rA" requests a summary covering every outcome) and use
    # pytest's result as the process exit status.
    pytest_status = pytest.main([__file__, "-rA"])
    sys.exit(pytest_status)
--- a/tests/e2e/index_hints/workloads.yaml
+++ b/tests/e2e/index_hints/workloads.yaml
@ -0,0 +1,13 @@
 # Cluster definition with a single "main" instance, reused by the workload below through the YAML anchor.
 index_hints_cluster: &index_hints_cluster
  cluster:
    main:
      args: ["--bolt-port", "7687", "--log-level=TRACE"]
      log_file: "index_hints.log"
      setup_queries: []
      validation_queries: []
 workloads:
  # Runs index_hints/index_hints.py through the pytest runner script. The name was previously
  # "Analyze graph for better indexing", which does not describe this suite.
  - name: "Index hints"
    binary: "tests/e2e/pytest_runner.sh"
    args: ["index_hints/index_hints.py"]
    <<: *index_hints_cluster
--- a/tests/unit/query_plan_operator_to_string.cpp
+++ b/tests/unit/query_plan_operator_to_string.cpp
@ -241,7 +241,7 @@ TYPED_TEST(OperatorToStringTest, Filter) {
                                     EQ(PROPERTY_LOOKUP(this->dba, "person", property), LITERAL(5)), filters);
  std::string expected_string{
-      "Filter Generic {person}, id(person), (person :Customer:Visitor), (:Customer:Visitor), {person.name}, Pattern"};
+      "Filter (:Customer:Visitor), (person :Customer:Visitor), Generic {person}, Pattern, id(person), {person.name}"};
  EXPECT_EQ(last_op->ToString(), expected_string);
 }