#include #include #include "communication/bolt/v1/value.hpp" #include "communication/result_stream_faker.hpp" #include "glue/communication.hpp" #include "gmock/gmock.h" #include "gtest/gtest.h" #include "query/config.hpp" #include "query/exceptions.hpp" #include "query/interpreter.hpp" #include "query/stream.hpp" #include "query/typed_value.hpp" #include "query_common.hpp" #include "storage/v2/isolation_level.hpp" #include "storage/v2/property_value.hpp" #include "utils/csv_parsing.hpp" #include "utils/logging.hpp" namespace { auto ToEdgeList(const communication::bolt::Value &v) { std::vector list; for (auto x : v.ValueList()) { list.push_back(x.ValueEdge()); } return list; }; struct InterpreterFaker { explicit InterpreterFaker(storage::Storage *db, const query::InterpreterConfig config, const std::filesystem::path &data_directory) : interpreter_context(db, config, data_directory, "not used bootstrap servers"), interpreter(&interpreter_context) {} auto Prepare(const std::string &query, const std::map ¶ms = {}) { ResultStreamFaker stream(interpreter_context.db); const auto [header, _, qid] = interpreter.Prepare(query, params); stream.Header(header); return std::make_pair(std::move(stream), qid); } void Pull(ResultStreamFaker *stream, std::optional n = {}, std::optional qid = {}) { const auto summary = interpreter.Pull(stream, n, qid); stream->Summary(summary); } /** * Execute the given query and commit the transaction. * * Return the query stream. */ auto Interpret(const std::string &query, const std::map ¶ms = {}) { auto prepare_result = Prepare(query, params); auto &stream = prepare_result.first; auto summary = interpreter.Pull(&stream, {}, prepare_result.second); stream.Summary(summary); return std::move(stream); } query::InterpreterContext interpreter_context; query::Interpreter interpreter; }; } // namespace // TODO: This is not a unit test, but tests/integration dir is chaotic at the // moment. After tests refactoring is done, move/rename this. 
class InterpreterTest : public ::testing::Test { protected: storage::Storage db_; std::filesystem::path data_directory{std::filesystem::temp_directory_path() / "MG_tests_unit_interpreter"}; InterpreterFaker default_interpreter{&db_, {}, data_directory}; auto Prepare(const std::string &query, const std::map ¶ms = {}) { return default_interpreter.Prepare(query, params); } void Pull(ResultStreamFaker *stream, std::optional n = {}, std::optional qid = {}) { default_interpreter.Pull(stream, n, qid); } auto Interpret(const std::string &query, const std::map ¶ms = {}) { return default_interpreter.Interpret(query, params); } }; TEST_F(InterpreterTest, MultiplePulls) { { auto [stream, qid] = Prepare("UNWIND [1,2,3,4,5] as n RETURN n"); ASSERT_EQ(stream.GetHeader().size(), 1U); EXPECT_EQ(stream.GetHeader()[0], "n"); Pull(&stream, 1); ASSERT_EQ(stream.GetSummary().count("has_more"), 1); ASSERT_TRUE(stream.GetSummary().at("has_more").ValueBool()); ASSERT_EQ(stream.GetResults()[0].size(), 1U); ASSERT_EQ(stream.GetResults()[0][0].ValueInt(), 1); Pull(&stream, 2); ASSERT_EQ(stream.GetSummary().count("has_more"), 1); ASSERT_TRUE(stream.GetSummary().at("has_more").ValueBool()); ASSERT_EQ(stream.GetResults().size(), 3U); ASSERT_EQ(stream.GetResults()[1][0].ValueInt(), 2); ASSERT_EQ(stream.GetResults()[2][0].ValueInt(), 3); Pull(&stream); ASSERT_EQ(stream.GetSummary().count("has_more"), 1); ASSERT_FALSE(stream.GetSummary().at("has_more").ValueBool()); ASSERT_EQ(stream.GetResults().size(), 5U); ASSERT_EQ(stream.GetResults()[3][0].ValueInt(), 4); ASSERT_EQ(stream.GetResults()[4][0].ValueInt(), 5); } } // Run query with different ast twice to see if query executes correctly when // ast is read from cache. 
TEST_F(InterpreterTest, AstCache) {
  {
    auto stream = Interpret("RETURN 2 + 3");
    ASSERT_EQ(stream.GetHeader().size(), 1U);
    EXPECT_EQ(stream.GetHeader()[0], "2 + 3");
    ASSERT_EQ(stream.GetResults().size(), 1U);
    ASSERT_EQ(stream.GetResults()[0].size(), 1U);
    ASSERT_EQ(stream.GetResults()[0][0].ValueInt(), 5);
  }
  {
    // Cached ast, different literals.
    auto stream = Interpret("RETURN 5 + 4");
    ASSERT_EQ(stream.GetResults().size(), 1U);
    ASSERT_EQ(stream.GetResults()[0].size(), 1U);
    ASSERT_EQ(stream.GetResults()[0][0].ValueInt(), 9);
  }
  {
    // Different ast (because of different types).
    auto stream = Interpret("RETURN 5.5 + 4");
    ASSERT_EQ(stream.GetResults().size(), 1U);
    ASSERT_EQ(stream.GetResults()[0].size(), 1U);
    ASSERT_EQ(stream.GetResults()[0][0].ValueDouble(), 9.5);
  }
  {
    // Cached ast, same literals.
    auto stream = Interpret("RETURN 2 + 3");
    ASSERT_EQ(stream.GetResults().size(), 1U);
    ASSERT_EQ(stream.GetResults()[0].size(), 1U);
    ASSERT_EQ(stream.GetResults()[0][0].ValueInt(), 5);
  }
  {
    // Cached ast, different literals.
    auto stream = Interpret("RETURN 10.5 + 1");
    ASSERT_EQ(stream.GetResults().size(), 1U);
    ASSERT_EQ(stream.GetResults()[0].size(), 1U);
    ASSERT_EQ(stream.GetResults()[0][0].ValueDouble(), 11.5);
  }
  {
    // Cached ast, same literals, different whitespaces.
    // The doubled space after RETURN is intentional: it is the only thing
    // that distinguishes this query text from the previous one.
    auto stream = Interpret("RETURN  10.5 + 1");
    ASSERT_EQ(stream.GetResults().size(), 1U);
    ASSERT_EQ(stream.GetResults()[0].size(), 1U);
    ASSERT_EQ(stream.GetResults()[0][0].ValueDouble(), 11.5);
  }
  {
    // Cached ast, same literals, different named header.
    auto stream = Interpret("RETURN 10.5+1");
    ASSERT_EQ(stream.GetHeader().size(), 1U);
    EXPECT_EQ(stream.GetHeader()[0], "10.5+1");
    ASSERT_EQ(stream.GetResults().size(), 1U);
    ASSERT_EQ(stream.GetResults()[0].size(), 1U);
    ASSERT_EQ(stream.GetResults()[0][0].ValueDouble(), 11.5);
  }
}

// Run query with same ast multiple times with different parameters.
TEST_F(InterpreterTest, Parameters) {
  {
    auto stream = Interpret("RETURN $2 + $`a b`",
                            {{"2", storage::PropertyValue(10)}, {"a b", storage::PropertyValue(15)}});
    ASSERT_EQ(stream.GetHeader().size(), 1U);
    EXPECT_EQ(stream.GetHeader()[0], "$2 + $`a b`");
    ASSERT_EQ(stream.GetResults().size(), 1U);
    ASSERT_EQ(stream.GetResults()[0].size(), 1U);
    ASSERT_EQ(stream.GetResults()[0][0].ValueInt(), 25);
  }
  {
    // Not needed parameter.
    auto stream = Interpret(
        "RETURN $2 + $`a b`",
        {{"2", storage::PropertyValue(10)}, {"a b", storage::PropertyValue(15)}, {"c", storage::PropertyValue(10)}});
    ASSERT_EQ(stream.GetHeader().size(), 1U);
    EXPECT_EQ(stream.GetHeader()[0], "$2 + $`a b`");
    ASSERT_EQ(stream.GetResults().size(), 1U);
    ASSERT_EQ(stream.GetResults()[0].size(), 1U);
    ASSERT_EQ(stream.GetResults()[0][0].ValueInt(), 25);
  }
  {
    // Cached ast, different parameters.
    auto stream = Interpret("RETURN $2 + $`a b`",
                            {{"2", storage::PropertyValue("da")}, {"a b", storage::PropertyValue("ne")}});
    ASSERT_EQ(stream.GetResults().size(), 1U);
    ASSERT_EQ(stream.GetResults()[0].size(), 1U);
    ASSERT_EQ(stream.GetResults()[0][0].ValueString(), "dane");
  }
  {
    // Non-primitive literal.
    // The element type is spelled out so the list parameter's type does not
    // depend on class template argument deduction.
    auto stream = Interpret(
        "RETURN $2",
        {{"2", storage::PropertyValue(std::vector<storage::PropertyValue>{
                   storage::PropertyValue(5), storage::PropertyValue(2), storage::PropertyValue(3)})}});
    ASSERT_EQ(stream.GetResults().size(), 1U);
    ASSERT_EQ(stream.GetResults()[0].size(), 1U);
    auto result = query::test_common::ToIntList(glue::ToTypedValue(stream.GetResults()[0][0]));
    ASSERT_THAT(result, testing::ElementsAre(5, 2, 3));
  }
  {
    // Cached ast, unprovided parameter.
    // The second key is "ab" (no space), so `a b` is left unprovided.
    ASSERT_THROW(Interpret("RETURN $2 + $`a b`",
                           {{"2", storage::PropertyValue("da")}, {"ab", storage::PropertyValue("ne")}}),
                 query::UnprovidedParameterError);
  }
}

// Test bfs end to end.
TEST_F(InterpreterTest, Bfs) {
  // Fixed seed keeps the randomly generated graph identical between runs.
  srand(0);
  const auto kNumLevels = 10;
  const auto kNumNodesPerLevel = 100;
  const auto kNumEdgesPerNode = 100;
  const auto kNumUnreachableNodes = 1000;
  const auto kNumUnreachableEdges = 100000;

  const auto kReachable = "reachable";
  const auto kId = "id";

  std::vector<std::vector<query::VertexAccessor>> levels(kNumLevels);
  int id = 0;

  // Set up.
  {
    auto storage_dba = db_.Access();
    query::DbAccessor dba(&storage_dba);

    // Inserts a vertex with the next sequential id and records it in `levels`.
    auto add_node = [&](int level, bool reachable) {
      auto node = dba.InsertVertex();
      MG_ASSERT(node.SetProperty(dba.NameToProperty(kId), storage::PropertyValue(id++)).HasValue());
      MG_ASSERT(node.SetProperty(dba.NameToProperty(kReachable), storage::PropertyValue(reachable)).HasValue());
      levels[level].push_back(node);
      return node;
    };

    // Inserts an "edge"-typed edge v1 -> v2 carrying the `reachable` flag.
    auto add_edge = [&](auto &v1, auto &v2, bool reachable) {
      auto edge = dba.InsertEdge(&v1, &v2, dba.NameToEdgeType("edge"));
      MG_ASSERT(edge->SetProperty(dba.NameToProperty(kReachable), storage::PropertyValue(reachable)).HasValue());
    };

    // Add source node.
    add_node(0, true);

    // Add reachable nodes.
    for (int i = 1; i < kNumLevels; ++i) {
      for (int j = 0; j < kNumNodesPerLevel; ++j) {
        auto node = add_node(i, true);
        for (int k = 0; k < kNumEdgesPerNode; ++k) {
          auto &node2 = levels[i - 1][rand() % levels[i - 1].size()];
          add_edge(node2, node, true);
        }
      }
    }

    // Add unreachable nodes.
    for (int i = 0; i < kNumUnreachableNodes; ++i) {
      auto node = add_node(rand() % kNumLevels,  // Not really important.
                           false);
      for (int j = 0; j < kNumEdgesPerNode; ++j) {
        auto &level = levels[rand() % kNumLevels];
        auto &node2 = level[rand() % level.size()];
        add_edge(node2, node, true);
        add_edge(node, node2, true);
      }
    }

    // Add unreachable edges.
    for (int i = 0; i < kNumUnreachableEdges; ++i) {
      auto &level1 = levels[rand() % kNumLevels];
      auto &node1 = level1[rand() % level1.size()];
      auto &level2 = levels[rand() % kNumLevels];
      auto &node2 = level2[rand() % level2.size()];
      add_edge(node1, node2, false);
    }

    ASSERT_FALSE(dba.Commit().HasError());
  }

  auto stream = Interpret(
      "MATCH (n {id: 0})-[r *bfs..5 (e, n | n.reachable and "
      "e.reachable)]->(m) RETURN n, r, m");

  ASSERT_EQ(stream.GetHeader().size(), 3U);
  EXPECT_EQ(stream.GetHeader()[0], "n");
  EXPECT_EQ(stream.GetHeader()[1], "r");
  EXPECT_EQ(stream.GetHeader()[2], "m");
  // The expansion is bounded to depth 5, hence five full levels of nodes.
  ASSERT_EQ(stream.GetResults().size(), static_cast<size_t>(5 * kNumNodesPerLevel));

  int expected_level = 1;
  int remaining_nodes_in_level = kNumNodesPerLevel;
  std::unordered_set<int64_t> matched_ids;

  for (const auto &result : stream.GetResults()) {
    const auto &begin = result[0].ValueVertex();
    const auto edges = ToEdgeList(result[1]);
    const auto &end = result[2].ValueVertex();

    // front()/back() below are undefined on an empty path, so fail loudly
    // instead.
    ASSERT_FALSE(edges.empty());

    // Check that path is of expected length. Returned paths should be from
    // shorter to longer ones.
    EXPECT_EQ(edges.size(), static_cast<size_t>(expected_level));
    // Check that starting node is correct.
    EXPECT_EQ(edges.front().from, begin.id);
    EXPECT_EQ(begin.properties.at(kId).ValueInt(), 0);
    for (size_t i = 1; i < edges.size(); ++i) {
      // Check that edges form a connected path.
      EXPECT_EQ(edges[i - 1].to.AsInt(), edges[i].from.AsInt());
    }
    auto matched_id = end.properties.at(kId).ValueInt();
    EXPECT_EQ(edges.back().to, end.id);
    // Check that we didn't match that node already.
    EXPECT_TRUE(matched_ids.insert(matched_id).second);
    // Check that shortest path was found.
    EXPECT_TRUE(matched_id > kNumNodesPerLevel * (expected_level - 1) &&
                matched_id <= kNumNodesPerLevel * expected_level);
    if (!--remaining_nodes_in_level) {
      remaining_nodes_in_level = kNumNodesPerLevel;
      ++expected_level;
    }
  }
}

// Test shortest path end to end.
TEST_F(InterpreterTest, ShortestPath) { Interpret( "CREATE (n:A {x: 1}), (m:B {x: 2}), (l:C {x: 1}), (n)-[:r1 {w: 1 " "}]->(m)-[:r2 {w: 2}]->(l), (n)-[:r3 {w: 4}]->(l)"); auto stream = Interpret("MATCH (n)-[e *wshortest 5 (e, n | e.w) ]->(m) return e"); ASSERT_EQ(stream.GetHeader().size(), 1U); EXPECT_EQ(stream.GetHeader()[0], "e"); ASSERT_EQ(stream.GetResults().size(), 3U); auto dba = db_.Access(); std::vector> expected_results{{"r1"}, {"r2"}, {"r1", "r2"}}; for (const auto &result : stream.GetResults()) { const auto &edges = ToEdgeList(result[0]); std::vector datum; datum.reserve(edges.size()); for (const auto &edge : edges) { datum.push_back(edge.type); } bool any_match = false; for (const auto &expected : expected_results) { if (expected == datum) { any_match = true; break; } } EXPECT_TRUE(any_match); } } TEST_F(InterpreterTest, CreateLabelIndexInMulticommandTransaction) { Interpret("BEGIN"); ASSERT_THROW(Interpret("CREATE INDEX ON :X"), query::IndexInMulticommandTxException); Interpret("ROLLBACK"); } TEST_F(InterpreterTest, CreateLabelPropertyIndexInMulticommandTransaction) { Interpret("BEGIN"); ASSERT_THROW(Interpret("CREATE INDEX ON :X(y)"), query::IndexInMulticommandTxException); Interpret("ROLLBACK"); } TEST_F(InterpreterTest, CreateExistenceConstraintInMulticommandTransaction) { Interpret("BEGIN"); ASSERT_THROW(Interpret("CREATE CONSTRAINT ON (n:A) ASSERT EXISTS (n.a)"), query::ConstraintInMulticommandTxException); Interpret("ROLLBACK"); } TEST_F(InterpreterTest, CreateUniqueConstraintInMulticommandTransaction) { Interpret("BEGIN"); ASSERT_THROW(Interpret("CREATE CONSTRAINT ON (n:A) ASSERT n.a, n.b IS UNIQUE"), query::ConstraintInMulticommandTxException); Interpret("ROLLBACK"); } TEST_F(InterpreterTest, ShowIndexInfoInMulticommandTransaction) { Interpret("BEGIN"); ASSERT_THROW(Interpret("SHOW INDEX INFO"), query::InfoInMulticommandTxException); Interpret("ROLLBACK"); } TEST_F(InterpreterTest, ShowConstraintInfoInMulticommandTransaction) { 
Interpret("BEGIN"); ASSERT_THROW(Interpret("SHOW CONSTRAINT INFO"), query::InfoInMulticommandTxException); Interpret("ROLLBACK"); } TEST_F(InterpreterTest, ShowStorageInfoInMulticommandTransaction) { Interpret("BEGIN"); ASSERT_THROW(Interpret("SHOW STORAGE INFO"), query::InfoInMulticommandTxException); Interpret("ROLLBACK"); } // NOLINTNEXTLINE(hicpp-special-member-functions) TEST_F(InterpreterTest, ExistenceConstraintTest) { Interpret("CREATE CONSTRAINT ON (n:A) ASSERT EXISTS (n.a);"); Interpret("CREATE (:A{a:1})"); Interpret("CREATE (:A{a:2})"); ASSERT_THROW(Interpret("CREATE (:A)"), query::QueryException); Interpret("MATCH (n:A{a:2}) SET n.a=3"); Interpret("CREATE (:A{a:2})"); Interpret("MATCH (n:A{a:2}) DETACH DELETE n"); Interpret("CREATE (n:A{a:2})"); ASSERT_THROW(Interpret("CREATE CONSTRAINT ON (n:A) ASSERT EXISTS (n.b);"), query::QueryRuntimeException); } TEST_F(InterpreterTest, UniqueConstraintTest) { // Empty property list should result with syntax exception. ASSERT_THROW(Interpret("CREATE CONSTRAINT ON (n:A) ASSERT IS UNIQUE;"), query::SyntaxException); ASSERT_THROW(Interpret("DROP CONSTRAINT ON (n:A) ASSERT IS UNIQUE;"), query::SyntaxException); // Too large list of properties should also result with syntax exception. { std::stringstream stream; stream << " ON (n:A) ASSERT "; for (size_t i = 0; i < 33; ++i) { if (i > 0) stream << ", "; stream << "n.prop" << i; } stream << " IS UNIQUE;"; std::string create_query = "CREATE CONSTRAINT" + stream.str(); std::string drop_query = "DROP CONSTRAINT" + stream.str(); ASSERT_THROW(Interpret(create_query), query::SyntaxException); ASSERT_THROW(Interpret(drop_query), query::SyntaxException); } // Providing property list with duplicates results with syntax exception. 
ASSERT_THROW(Interpret("CREATE CONSTRAINT ON (n:A) ASSERT n.a, n.b, n.a IS UNIQUE;"), query::SyntaxException); ASSERT_THROW(Interpret("DROP CONSTRAINT ON (n:A) ASSERT n.a, n.b, n.a IS UNIQUE;"), query::SyntaxException); // Commit of vertex should fail if a constraint is violated. Interpret("CREATE CONSTRAINT ON (n:A) ASSERT n.a, n.b IS UNIQUE;"); Interpret("CREATE (:A{a:1, b:2})"); Interpret("CREATE (:A{a:1, b:3})"); ASSERT_THROW(Interpret("CREATE (:A{a:1, b:2})"), query::QueryException); // Attempt to create a constraint should fail if it's violated. Interpret("CREATE (:A{a:1, c:2})"); Interpret("CREATE (:A{a:1, c:2})"); ASSERT_THROW(Interpret("CREATE CONSTRAINT ON (n:A) ASSERT n.a, n.c IS UNIQUE;"), query::QueryRuntimeException); Interpret("MATCH (n:A{a:2, b:2}) SET n.a=1"); Interpret("CREATE (:A{a:2})"); Interpret("MATCH (n:A{a:2}) DETACH DELETE n"); Interpret("CREATE (n:A{a:2})"); // Show constraint info. { auto stream = Interpret("SHOW CONSTRAINT INFO"); ASSERT_EQ(stream.GetHeader().size(), 3U); const auto &header = stream.GetHeader(); ASSERT_EQ(header[0], "constraint type"); ASSERT_EQ(header[1], "label"); ASSERT_EQ(header[2], "properties"); ASSERT_EQ(stream.GetResults().size(), 1U); const auto &result = stream.GetResults().front(); ASSERT_EQ(result.size(), 3U); ASSERT_EQ(result[0].ValueString(), "unique"); ASSERT_EQ(result[1].ValueString(), "A"); const auto &properties = result[2].ValueList(); ASSERT_EQ(properties.size(), 2U); ASSERT_EQ(properties[0].ValueString(), "a"); ASSERT_EQ(properties[1].ValueString(), "b"); } // Drop constraint. Interpret("DROP CONSTRAINT ON (n:A) ASSERT n.a, n.b IS UNIQUE;"); // Removing the same constraint twice should not throw any exception. 
Interpret("DROP CONSTRAINT ON (n:A) ASSERT n.a, n.b IS UNIQUE;"); } TEST_F(InterpreterTest, ExplainQuery) { const auto &interpreter_context = default_interpreter.interpreter_context; EXPECT_EQ(interpreter_context.plan_cache.size(), 0U); EXPECT_EQ(interpreter_context.ast_cache.size(), 0U); auto stream = Interpret("EXPLAIN MATCH (n) RETURN *;"); ASSERT_EQ(stream.GetHeader().size(), 1U); EXPECT_EQ(stream.GetHeader().front(), "QUERY PLAN"); std::vector expected_rows{" * Produce {n}", " * ScanAll (n)", " * Once"}; ASSERT_EQ(stream.GetResults().size(), expected_rows.size()); auto expected_it = expected_rows.begin(); for (const auto &row : stream.GetResults()) { ASSERT_EQ(row.size(), 1U); EXPECT_EQ(row.front().ValueString(), *expected_it); ++expected_it; } // We should have a plan cache for MATCH ... EXPECT_EQ(interpreter_context.plan_cache.size(), 1U); // We should have AST cache for EXPLAIN ... and for inner MATCH ... EXPECT_EQ(interpreter_context.ast_cache.size(), 2U); Interpret("MATCH (n) RETURN *;"); EXPECT_EQ(interpreter_context.plan_cache.size(), 1U); EXPECT_EQ(interpreter_context.ast_cache.size(), 2U); } TEST_F(InterpreterTest, ExplainQueryMultiplePulls) { const auto &interpreter_context = default_interpreter.interpreter_context; EXPECT_EQ(interpreter_context.plan_cache.size(), 0U); EXPECT_EQ(interpreter_context.ast_cache.size(), 0U); auto [stream, qid] = Prepare("EXPLAIN MATCH (n) RETURN *;"); ASSERT_EQ(stream.GetHeader().size(), 1U); EXPECT_EQ(stream.GetHeader().front(), "QUERY PLAN"); std::vector expected_rows{" * Produce {n}", " * ScanAll (n)", " * Once"}; Pull(&stream, 1); ASSERT_EQ(stream.GetResults().size(), 1); auto expected_it = expected_rows.begin(); ASSERT_EQ(stream.GetResults()[0].size(), 1U); EXPECT_EQ(stream.GetResults()[0].front().ValueString(), *expected_it); ++expected_it; Pull(&stream, 1); ASSERT_EQ(stream.GetResults().size(), 2); ASSERT_EQ(stream.GetResults()[1].size(), 1U); EXPECT_EQ(stream.GetResults()[1].front().ValueString(), *expected_it); 
++expected_it; Pull(&stream); ASSERT_EQ(stream.GetResults().size(), 3); ASSERT_EQ(stream.GetResults()[2].size(), 1U); EXPECT_EQ(stream.GetResults()[2].front().ValueString(), *expected_it); // We should have a plan cache for MATCH ... EXPECT_EQ(interpreter_context.plan_cache.size(), 1U); // We should have AST cache for EXPLAIN ... and for inner MATCH ... EXPECT_EQ(interpreter_context.ast_cache.size(), 2U); Interpret("MATCH (n) RETURN *;"); EXPECT_EQ(interpreter_context.plan_cache.size(), 1U); EXPECT_EQ(interpreter_context.ast_cache.size(), 2U); } TEST_F(InterpreterTest, ExplainQueryInMulticommandTransaction) { const auto &interpreter_context = default_interpreter.interpreter_context; EXPECT_EQ(interpreter_context.plan_cache.size(), 0U); EXPECT_EQ(interpreter_context.ast_cache.size(), 0U); Interpret("BEGIN"); auto stream = Interpret("EXPLAIN MATCH (n) RETURN *;"); Interpret("COMMIT"); ASSERT_EQ(stream.GetHeader().size(), 1U); EXPECT_EQ(stream.GetHeader().front(), "QUERY PLAN"); std::vector expected_rows{" * Produce {n}", " * ScanAll (n)", " * Once"}; ASSERT_EQ(stream.GetResults().size(), expected_rows.size()); auto expected_it = expected_rows.begin(); for (const auto &row : stream.GetResults()) { ASSERT_EQ(row.size(), 1U); EXPECT_EQ(row.front().ValueString(), *expected_it); ++expected_it; } // We should have a plan cache for MATCH ... EXPECT_EQ(interpreter_context.plan_cache.size(), 1U); // We should have AST cache for EXPLAIN ... and for inner MATCH ... 
EXPECT_EQ(interpreter_context.ast_cache.size(), 2U); Interpret("MATCH (n) RETURN *;"); EXPECT_EQ(interpreter_context.plan_cache.size(), 1U); EXPECT_EQ(interpreter_context.ast_cache.size(), 2U); } TEST_F(InterpreterTest, ExplainQueryWithParams) { const auto &interpreter_context = default_interpreter.interpreter_context; EXPECT_EQ(interpreter_context.plan_cache.size(), 0U); EXPECT_EQ(interpreter_context.ast_cache.size(), 0U); auto stream = Interpret("EXPLAIN MATCH (n) WHERE n.id = $id RETURN *;", {{"id", storage::PropertyValue(42)}}); ASSERT_EQ(stream.GetHeader().size(), 1U); EXPECT_EQ(stream.GetHeader().front(), "QUERY PLAN"); std::vector expected_rows{" * Produce {n}", " * Filter", " * ScanAll (n)", " * Once"}; ASSERT_EQ(stream.GetResults().size(), expected_rows.size()); auto expected_it = expected_rows.begin(); for (const auto &row : stream.GetResults()) { ASSERT_EQ(row.size(), 1U); EXPECT_EQ(row.front().ValueString(), *expected_it); ++expected_it; } // We should have a plan cache for MATCH ... EXPECT_EQ(interpreter_context.plan_cache.size(), 1U); // We should have AST cache for EXPLAIN ... and for inner MATCH ... 
EXPECT_EQ(interpreter_context.ast_cache.size(), 2U); Interpret("MATCH (n) WHERE n.id = $id RETURN *;", {{"id", storage::PropertyValue("something else")}}); EXPECT_EQ(interpreter_context.plan_cache.size(), 1U); EXPECT_EQ(interpreter_context.ast_cache.size(), 2U); } TEST_F(InterpreterTest, ProfileQuery) { const auto &interpreter_context = default_interpreter.interpreter_context; EXPECT_EQ(interpreter_context.plan_cache.size(), 0U); EXPECT_EQ(interpreter_context.ast_cache.size(), 0U); auto stream = Interpret("PROFILE MATCH (n) RETURN *;"); std::vector expected_header{"OPERATOR", "ACTUAL HITS", "RELATIVE TIME", "ABSOLUTE TIME"}; EXPECT_EQ(stream.GetHeader(), expected_header); std::vector expected_rows{"* Produce", "* ScanAll", "* Once"}; ASSERT_EQ(stream.GetResults().size(), expected_rows.size()); auto expected_it = expected_rows.begin(); for (const auto &row : stream.GetResults()) { ASSERT_EQ(row.size(), 4U); EXPECT_EQ(row.front().ValueString(), *expected_it); ++expected_it; } // We should have a plan cache for MATCH ... EXPECT_EQ(interpreter_context.plan_cache.size(), 1U); // We should have AST cache for PROFILE ... and for inner MATCH ... 
EXPECT_EQ(interpreter_context.ast_cache.size(), 2U); Interpret("MATCH (n) RETURN *;"); EXPECT_EQ(interpreter_context.plan_cache.size(), 1U); EXPECT_EQ(interpreter_context.ast_cache.size(), 2U); } TEST_F(InterpreterTest, ProfileQueryMultiplePulls) { const auto &interpreter_context = default_interpreter.interpreter_context; EXPECT_EQ(interpreter_context.plan_cache.size(), 0U); EXPECT_EQ(interpreter_context.ast_cache.size(), 0U); auto [stream, qid] = Prepare("PROFILE MATCH (n) RETURN *;"); std::vector expected_header{"OPERATOR", "ACTUAL HITS", "RELATIVE TIME", "ABSOLUTE TIME"}; EXPECT_EQ(stream.GetHeader(), expected_header); std::vector expected_rows{"* Produce", "* ScanAll", "* Once"}; auto expected_it = expected_rows.begin(); Pull(&stream, 1); ASSERT_EQ(stream.GetResults().size(), 1U); ASSERT_EQ(stream.GetResults()[0].size(), 4U); ASSERT_EQ(stream.GetResults()[0][0].ValueString(), *expected_it); ++expected_it; Pull(&stream, 1); ASSERT_EQ(stream.GetResults().size(), 2U); ASSERT_EQ(stream.GetResults()[1].size(), 4U); ASSERT_EQ(stream.GetResults()[1][0].ValueString(), *expected_it); ++expected_it; Pull(&stream); ASSERT_EQ(stream.GetResults().size(), 3U); ASSERT_EQ(stream.GetResults()[2].size(), 4U); ASSERT_EQ(stream.GetResults()[2][0].ValueString(), *expected_it); // We should have a plan cache for MATCH ... EXPECT_EQ(interpreter_context.plan_cache.size(), 1U); // We should have AST cache for PROFILE ... and for inner MATCH ... 
EXPECT_EQ(interpreter_context.ast_cache.size(), 2U); Interpret("MATCH (n) RETURN *;"); EXPECT_EQ(interpreter_context.plan_cache.size(), 1U); EXPECT_EQ(interpreter_context.ast_cache.size(), 2U); } TEST_F(InterpreterTest, ProfileQueryInMulticommandTransaction) { Interpret("BEGIN"); ASSERT_THROW(Interpret("PROFILE MATCH (n) RETURN *;"), query::ProfileInMulticommandTxException); Interpret("ROLLBACK"); } TEST_F(InterpreterTest, ProfileQueryWithParams) { const auto &interpreter_context = default_interpreter.interpreter_context; EXPECT_EQ(interpreter_context.plan_cache.size(), 0U); EXPECT_EQ(interpreter_context.ast_cache.size(), 0U); auto stream = Interpret("PROFILE MATCH (n) WHERE n.id = $id RETURN *;", {{"id", storage::PropertyValue(42)}}); std::vector expected_header{"OPERATOR", "ACTUAL HITS", "RELATIVE TIME", "ABSOLUTE TIME"}; EXPECT_EQ(stream.GetHeader(), expected_header); std::vector expected_rows{"* Produce", "* Filter", "* ScanAll", "* Once"}; ASSERT_EQ(stream.GetResults().size(), expected_rows.size()); auto expected_it = expected_rows.begin(); for (const auto &row : stream.GetResults()) { ASSERT_EQ(row.size(), 4U); EXPECT_EQ(row.front().ValueString(), *expected_it); ++expected_it; } // We should have a plan cache for MATCH ... EXPECT_EQ(interpreter_context.plan_cache.size(), 1U); // We should have AST cache for PROFILE ... and for inner MATCH ... 
EXPECT_EQ(interpreter_context.ast_cache.size(), 2U); Interpret("MATCH (n) WHERE n.id = $id RETURN *;", {{"id", storage::PropertyValue("something else")}}); EXPECT_EQ(interpreter_context.plan_cache.size(), 1U); EXPECT_EQ(interpreter_context.ast_cache.size(), 2U); } TEST_F(InterpreterTest, ProfileQueryWithLiterals) { const auto &interpreter_context = default_interpreter.interpreter_context; EXPECT_EQ(interpreter_context.plan_cache.size(), 0U); EXPECT_EQ(interpreter_context.ast_cache.size(), 0U); auto stream = Interpret("PROFILE UNWIND range(1, 1000) AS x CREATE (:Node {id: x});", {}); std::vector expected_header{"OPERATOR", "ACTUAL HITS", "RELATIVE TIME", "ABSOLUTE TIME"}; EXPECT_EQ(stream.GetHeader(), expected_header); std::vector expected_rows{"* CreateNode", "* Unwind", "* Once"}; ASSERT_EQ(stream.GetResults().size(), expected_rows.size()); auto expected_it = expected_rows.begin(); for (const auto &row : stream.GetResults()) { ASSERT_EQ(row.size(), 4U); EXPECT_EQ(row.front().ValueString(), *expected_it); ++expected_it; } // We should have a plan cache for UNWIND ... EXPECT_EQ(interpreter_context.plan_cache.size(), 1U); // We should have AST cache for PROFILE ... and for inner UNWIND ... 
EXPECT_EQ(interpreter_context.ast_cache.size(), 2U); Interpret("UNWIND range(42, 4242) AS x CREATE (:Node {id: x});", {}); EXPECT_EQ(interpreter_context.plan_cache.size(), 1U); EXPECT_EQ(interpreter_context.ast_cache.size(), 2U); } TEST_F(InterpreterTest, Transactions) { auto &interpreter = default_interpreter.interpreter; { ASSERT_THROW(interpreter.CommitTransaction(), query::ExplicitTransactionUsageException); ASSERT_THROW(interpreter.RollbackTransaction(), query::ExplicitTransactionUsageException); interpreter.BeginTransaction(); ASSERT_THROW(interpreter.BeginTransaction(), query::ExplicitTransactionUsageException); auto [stream, qid] = Prepare("RETURN 2"); ASSERT_EQ(stream.GetHeader().size(), 1U); EXPECT_EQ(stream.GetHeader()[0], "2"); Pull(&stream, 1); ASSERT_EQ(stream.GetSummary().count("has_more"), 1); ASSERT_FALSE(stream.GetSummary().at("has_more").ValueBool()); ASSERT_EQ(stream.GetResults()[0].size(), 1U); ASSERT_EQ(stream.GetResults()[0][0].ValueInt(), 2); interpreter.CommitTransaction(); } { interpreter.BeginTransaction(); auto [stream, qid] = Prepare("RETURN 2"); ASSERT_EQ(stream.GetHeader().size(), 1U); EXPECT_EQ(stream.GetHeader()[0], "2"); Pull(&stream, 1); ASSERT_EQ(stream.GetSummary().count("has_more"), 1); ASSERT_FALSE(stream.GetSummary().at("has_more").ValueBool()); ASSERT_EQ(stream.GetResults()[0].size(), 1U); ASSERT_EQ(stream.GetResults()[0][0].ValueInt(), 2); interpreter.RollbackTransaction(); } } TEST_F(InterpreterTest, Qid) { auto &interpreter = default_interpreter.interpreter; { interpreter.BeginTransaction(); auto [stream, qid] = Prepare("RETURN 2"); ASSERT_TRUE(qid); ASSERT_THROW(Pull(&stream, {}, *qid + 1), query::InvalidArgumentsException); interpreter.RollbackTransaction(); } { interpreter.BeginTransaction(); auto [stream1, qid1] = Prepare("UNWIND(range(1,3)) as n RETURN n"); ASSERT_TRUE(qid1); ASSERT_EQ(stream1.GetHeader().size(), 1U); EXPECT_EQ(stream1.GetHeader()[0], "n"); auto [stream2, qid2] = Prepare("UNWIND(range(4,6)) as n 
RETURN n"); ASSERT_TRUE(qid2); ASSERT_EQ(stream2.GetHeader().size(), 1U); EXPECT_EQ(stream2.GetHeader()[0], "n"); Pull(&stream1, 1, qid1); ASSERT_EQ(stream1.GetSummary().count("has_more"), 1); ASSERT_TRUE(stream1.GetSummary().at("has_more").ValueBool()); ASSERT_EQ(stream1.GetResults().size(), 1U); ASSERT_EQ(stream1.GetResults()[0].size(), 1U); ASSERT_EQ(stream1.GetResults()[0][0].ValueInt(), 1); auto [stream3, qid3] = Prepare("UNWIND(range(7,9)) as n RETURN n"); ASSERT_TRUE(qid3); ASSERT_EQ(stream3.GetHeader().size(), 1U); EXPECT_EQ(stream3.GetHeader()[0], "n"); Pull(&stream2, {}, qid2); ASSERT_EQ(stream2.GetSummary().count("has_more"), 1); ASSERT_FALSE(stream2.GetSummary().at("has_more").ValueBool()); ASSERT_EQ(stream2.GetResults().size(), 3U); ASSERT_EQ(stream2.GetResults()[0].size(), 1U); ASSERT_EQ(stream2.GetResults()[0][0].ValueInt(), 4); ASSERT_EQ(stream2.GetResults()[1][0].ValueInt(), 5); ASSERT_EQ(stream2.GetResults()[2][0].ValueInt(), 6); Pull(&stream3, 1, qid3); ASSERT_EQ(stream3.GetSummary().count("has_more"), 1); ASSERT_TRUE(stream3.GetSummary().at("has_more").ValueBool()); ASSERT_EQ(stream3.GetResults().size(), 1U); ASSERT_EQ(stream3.GetResults()[0].size(), 1U); ASSERT_EQ(stream3.GetResults()[0][0].ValueInt(), 7); Pull(&stream1, {}, qid1); ASSERT_EQ(stream1.GetSummary().count("has_more"), 1); ASSERT_FALSE(stream1.GetSummary().at("has_more").ValueBool()); ASSERT_EQ(stream1.GetResults().size(), 3U); ASSERT_EQ(stream1.GetResults()[1].size(), 1U); ASSERT_EQ(stream1.GetResults()[1][0].ValueInt(), 2); ASSERT_EQ(stream1.GetResults()[2][0].ValueInt(), 3); Pull(&stream3); ASSERT_EQ(stream3.GetSummary().count("has_more"), 1); ASSERT_FALSE(stream3.GetSummary().at("has_more").ValueBool()); ASSERT_EQ(stream3.GetResults().size(), 3U); ASSERT_EQ(stream3.GetResults()[1].size(), 1U); ASSERT_EQ(stream3.GetResults()[1][0].ValueInt(), 8); ASSERT_EQ(stream3.GetResults()[2][0].ValueInt(), 9); interpreter.CommitTransaction(); } } namespace { // copied from 
utils_csv_parsing.cpp - tmp dir management and csv file writer class TmpDirManager final { public: explicit TmpDirManager(const std::string_view directory) : tmp_dir_{std::filesystem::temp_directory_path() / directory} { CreateDir(); } ~TmpDirManager() { Clear(); } const std::filesystem::path &Path() const { return tmp_dir_; } private: std::filesystem::path tmp_dir_; void CreateDir() { if (!std::filesystem::exists(tmp_dir_)) { std::filesystem::create_directory(tmp_dir_); } } void Clear() { if (!std::filesystem::exists(tmp_dir_)) return; std::filesystem::remove_all(tmp_dir_); } }; class FileWriter { public: explicit FileWriter(const std::filesystem::path path) { stream_.open(path); } FileWriter(const FileWriter &) = delete; FileWriter &operator=(const FileWriter &) = delete; FileWriter(FileWriter &&) = delete; FileWriter &operator=(FileWriter &&) = delete; void Close() { stream_.close(); } size_t WriteLine(const std::string_view line) { if (!stream_.is_open()) { return 0; } stream_ << line << std::endl; // including the newline character return line.size() + 1; } private: std::ofstream stream_; }; std::string CreateRow(const std::vector &columns, const std::string_view delim) { return utils::Join(columns, delim); } } // namespace TEST_F(InterpreterTest, LoadCsvClause) { auto dir_manager = TmpDirManager("csv_directory"); const auto csv_path = dir_manager.Path() / "file.csv"; auto writer = FileWriter(csv_path); const std::string delimiter{"|"}; const std::vector header{"A", "B", "C"}; writer.WriteLine(CreateRow(header, delimiter)); const std::vector good_columns_1{"a", "b", "c"}; writer.WriteLine(CreateRow(good_columns_1, delimiter)); const std::vector bad_columns{"\"\"1", "2", "3"}; writer.WriteLine(CreateRow(bad_columns, delimiter)); const std::vector good_columns_2{"d", "e", "f"}; writer.WriteLine(CreateRow(good_columns_2, delimiter)); writer.Close(); { const std::string query = fmt::format(R"(LOAD CSV FROM "{}" WITH HEADER IGNORE BAD DELIMITER "{}" AS x RETURN 
x.A)", csv_path.string(), delimiter); auto [stream, qid] = Prepare(query); ASSERT_EQ(stream.GetHeader().size(), 1U); EXPECT_EQ(stream.GetHeader()[0], "x.A"); Pull(&stream, 1); ASSERT_EQ(stream.GetSummary().count("has_more"), 1); ASSERT_TRUE(stream.GetSummary().at("has_more").ValueBool()); ASSERT_EQ(stream.GetResults().size(), 1U); ASSERT_EQ(stream.GetResults()[0][0].ValueString(), "a"); Pull(&stream, 1); ASSERT_EQ(stream.GetSummary().count("has_more"), 1); ASSERT_FALSE(stream.GetSummary().at("has_more").ValueBool()); ASSERT_EQ(stream.GetResults().size(), 2U); ASSERT_EQ(stream.GetResults()[1][0].ValueString(), "d"); } { const std::string query = fmt::format(R"(LOAD CSV FROM "{}" WITH HEADER IGNORE BAD DELIMITER "{}" AS x RETURN x.C)", csv_path.string(), delimiter); auto [stream, qid] = Prepare(query); ASSERT_EQ(stream.GetHeader().size(), 1U); EXPECT_EQ(stream.GetHeader()[0], "x.C"); Pull(&stream); ASSERT_EQ(stream.GetSummary().count("has_more"), 1); ASSERT_FALSE(stream.GetSummary().at("has_more").ValueBool()); ASSERT_EQ(stream.GetResults().size(), 2U); ASSERT_EQ(stream.GetResults()[0][0].ValueString(), "c"); ASSERT_EQ(stream.GetResults()[1][0].ValueString(), "f"); } } TEST_F(InterpreterTest, CacheableQueries) { const auto &interpreter_context = default_interpreter.interpreter_context; // This should be cached { SCOPED_TRACE("Cacheable query"); Interpret("RETURN 1"); EXPECT_EQ(interpreter_context.ast_cache.size(), 1U); EXPECT_EQ(interpreter_context.plan_cache.size(), 1U); } { SCOPED_TRACE("Uncacheable query"); // Queries which are calling procedure should not be cached because the // result signature could be changed Interpret("CALL mg.load_all()"); EXPECT_EQ(interpreter_context.ast_cache.size(), 1U); EXPECT_EQ(interpreter_context.plan_cache.size(), 1U); } } TEST_F(InterpreterTest, AllowLoadCsvConfig) { const auto check_load_csv_queries = [&](const bool allow_load_csv) { TmpDirManager directory_manager{"allow_load_csv"}; const auto csv_path = directory_manager.Path() 
/ "file.csv"; auto writer = FileWriter(csv_path); const std::vector data{"A", "B", "C"}; writer.WriteLine(CreateRow(data, ",")); writer.Close(); const std::array queries = { fmt::format("LOAD CSV FROM \"{}\" WITH HEADER AS row RETURN row", csv_path.string()), "CREATE TRIGGER trigger ON CREATE BEFORE COMMIT EXECUTE LOAD CSV FROM 'file.csv' WITH HEADER AS row RETURN " "row"}; InterpreterFaker interpreter_faker{&db_, {.query = {.allow_load_csv = allow_load_csv}}, directory_manager.Path()}; for (const auto &query : queries) { if (allow_load_csv) { SCOPED_TRACE(fmt::format("'{}' should not throw because LOAD CSV is allowed", query)); ASSERT_NO_THROW(interpreter_faker.Interpret(query)); } else { SCOPED_TRACE(fmt::format("'{}' should throw becuase LOAD CSV is not allowed", query)); ASSERT_THROW(interpreter_faker.Interpret(query), utils::BasicException); } SCOPED_TRACE(fmt::format("Normal query should not throw (allow_load_csv: {})", allow_load_csv)); ASSERT_NO_THROW(interpreter_faker.Interpret("RETURN 1")); } }; check_load_csv_queries(true); check_load_csv_queries(false); }