#include #include #include #include #include "gtest/gtest.h" #include "database/graph_db.hpp" #include "distributed/coordination.hpp" #include "distributed/coordination_master.hpp" #include "distributed/coordination_worker.hpp" #include "distributed/plan_consumer.hpp" #include "distributed/plan_dispatcher.hpp" #include "distributed/remote_data_rpc_clients.hpp" #include "distributed/remote_data_rpc_server.hpp" #include "distributed/remote_pull_rpc_clients.hpp" #include "io/network/endpoint.hpp" #include "query/frontend/ast/ast.hpp" #include "query/frontend/ast/cypher_main_visitor.hpp" #include "query/frontend/semantic/symbol_generator.hpp" #include "query/frontend/semantic/symbol_table.hpp" #include "query/plan/planner.hpp" #include "query_plan_common.hpp" #include "transactions/engine_master.hpp" #include "query_common.hpp" #include "query_plan_common.hpp" template using optional = std::experimental::optional; using namespace distributed; class DistributedGraphDbTest : public ::testing::Test { const std::string kLocal = "127.0.0.1"; class WorkerInThread { public: WorkerInThread(database::Config config) : worker_(config) { thread_ = std::thread([this, config] { worker_.WaitForShutdown(); }); } ~WorkerInThread() { if (thread_.joinable()) thread_.join(); } database::Worker worker_; std::thread thread_; }; protected: void SetUp() override { const auto kInitTime = 200ms; database::Config master_config; master_config.master_endpoint = {kLocal, 0}; master_.emplace(master_config); std::this_thread::sleep_for(kInitTime); auto worker_config = [this](int worker_id) { database::Config config; config.worker_id = worker_id; config.master_endpoint = master_->endpoint(); config.worker_endpoint = {kLocal, 0}; return config; }; worker1_.emplace(worker_config(1)); std::this_thread::sleep_for(kInitTime); worker2_.emplace(worker_config(2)); std::this_thread::sleep_for(kInitTime); } void TearDown() override { // Kill master first because it will expect a shutdown response from the // workers. master_ = std::experimental::nullopt; worker2_ = std::experimental::nullopt; worker1_ = std::experimental::nullopt; } database::Master &master() { return *master_; } auto &master_tx_engine() { return dynamic_cast(master_->tx_engine()); } database::Worker &worker1() { return worker1_->worker_; } database::Worker &worker2() { return worker2_->worker_; } private: optional master_; optional worker1_; optional worker2_; }; TEST_F(DistributedGraphDbTest, Coordination) { EXPECT_NE(master().endpoint().port(), 0); EXPECT_NE(worker1().endpoint().port(), 0); EXPECT_NE(worker2().endpoint().port(), 0); EXPECT_EQ(master().GetEndpoint(1), worker1().endpoint()); EXPECT_EQ(master().GetEndpoint(2), worker2().endpoint()); EXPECT_EQ(worker1().GetEndpoint(0), master().endpoint()); EXPECT_EQ(worker1().GetEndpoint(2), worker2().endpoint()); EXPECT_EQ(worker2().GetEndpoint(0), master().endpoint()); EXPECT_EQ(worker2().GetEndpoint(1), worker1().endpoint()); } TEST_F(DistributedGraphDbTest, TxEngine) { auto *tx1 = master_tx_engine().Begin(); auto *tx2 = master_tx_engine().Begin(); EXPECT_EQ(tx2->snapshot().size(), 1); EXPECT_EQ( worker1().tx_engine().RunningTransaction(tx1->id_)->snapshot().size(), 0); EXPECT_EQ(worker2().tx_engine().RunningTransaction(tx2->id_)->snapshot(), tx2->snapshot()); ::testing::FLAGS_gtest_death_test_style = "threadsafe"; EXPECT_DEATH(worker2().tx_engine().RunningTransaction(123), ""); } template using mapper_vec = std::vector>>; TEST_F(DistributedGraphDbTest, StorageTypes) { auto test_mappers = [](auto mappers, auto ids) { for (size_t i = 0; i < mappers.size(); ++i) { ids.emplace_back( mappers[i].get().value_to_id("value" + std::to_string(i))); } EXPECT_GT(ids.size(), 0); for (size_t i = 0; i < mappers.size(); ++i) { for (size_t j = 0; j < ids.size(); ++j) { EXPECT_EQ(mappers[i].get().id_to_value(ids[j]), "value" + std::to_string(j)); } } }; test_mappers(mapper_vec{master().label_mapper(), worker1().label_mapper(), worker2().label_mapper()}, std::vector{}); test_mappers(mapper_vec{master().edge_type_mapper(), worker1().edge_type_mapper(), worker2().edge_type_mapper()}, std::vector{}); test_mappers(mapper_vec{master().property_mapper(), worker1().property_mapper(), worker2().property_mapper()}, std::vector{}); } TEST_F(DistributedGraphDbTest, Counters) { EXPECT_EQ(master().counters().Get("a"), 0); EXPECT_EQ(worker1().counters().Get("a"), 1); EXPECT_EQ(worker2().counters().Get("a"), 2); EXPECT_EQ(worker1().counters().Get("b"), 0); EXPECT_EQ(worker2().counters().Get("b"), 1); EXPECT_EQ(master().counters().Get("b"), 2); } TEST_F(DistributedGraphDbTest, RemoteDataGetting) { using GraphDbAccessor = database::GraphDbAccessor; // Only old data is visible remotely, so create and commit some data. gid::Gid v1_id, v2_id, e1_id; { GraphDbAccessor dba{master()}; auto v1 = dba.InsertVertex(); auto v2 = dba.InsertVertex(); auto e1 = dba.InsertEdge(v1, v2, dba.EdgeType("et")); // Set some data so we see we're getting the right stuff. v1.PropsSet(dba.Property("p1"), 42); v1.add_label(dba.Label("label")); v2.PropsSet(dba.Property("p2"), "value"); e1.PropsSet(dba.Property("p3"), true); v1_id = v1.gid(); v2_id = v2.gid(); e1_id = e1.gid(); dba.Commit(); } // The master must start a transaction before workers can work in it. database::GraphDbAccessor master_dba{master()}; { database::GraphDbAccessor w1_dba{worker1(), master_dba.transaction_id()}; VertexAccessor v1_in_w1{{v1_id, 0}, w1_dba}; EXPECT_NE(v1_in_w1.GetOld(), nullptr); EXPECT_EQ(v1_in_w1.GetNew(), nullptr); EXPECT_EQ(v1_in_w1.PropsAt(w1_dba.Property("p1")).Value(), 42); EXPECT_TRUE(v1_in_w1.has_label(w1_dba.Label("label"))); } { database::GraphDbAccessor w2_dba{worker2(), master_dba.transaction_id()}; VertexAccessor v2_in_w2{{v2_id, 0}, w2_dba}; EXPECT_NE(v2_in_w2.GetOld(), nullptr); EXPECT_EQ(v2_in_w2.GetNew(), nullptr); EXPECT_EQ(v2_in_w2.PropsAt(w2_dba.Property("p2")).Value(), "value"); EXPECT_FALSE(v2_in_w2.has_label(w2_dba.Label("label"))); VertexAccessor v1_in_w2{{v1_id, 0}, w2_dba}; EdgeAccessor e1_in_w2{{e1_id, 0}, w2_dba}; EXPECT_EQ(e1_in_w2.from(), v1_in_w2); EXPECT_EQ(e1_in_w2.to(), v2_in_w2); EXPECT_EQ(e1_in_w2.EdgeType(), w2_dba.EdgeType("et")); EXPECT_EQ(e1_in_w2.PropsAt(w2_dba.Property("p3")).Value(), true); } } TEST_F(DistributedGraphDbTest, DispatchPlan) { auto kRPCWaitTime = 600ms; int64_t plan_id = 5; SymbolTable symbol_table; AstTreeStorage storage; auto scan_all = MakeScanAll(storage, symbol_table, "n"); master().plan_dispatcher().DispatchPlan(plan_id, scan_all.op_, symbol_table); std::this_thread::sleep_for(kRPCWaitTime); auto check_for_worker = [plan_id, &symbol_table](auto &worker) { auto &cached = worker.plan_consumer().PlanForId(plan_id); EXPECT_NE(dynamic_cast(cached.plan.get()), nullptr); EXPECT_EQ(cached.symbol_table.max_position(), symbol_table.max_position()); EXPECT_EQ(cached.symbol_table.table(), symbol_table.table()); }; check_for_worker(worker1()); check_for_worker(worker2()); } TEST_F(DistributedGraphDbTest, RemotePullProduceRpc) { database::GraphDbAccessor dba{master()}; Context ctx{dba}; SymbolGenerator symbol_generator{ctx.symbol_table_}; AstTreeStorage storage; // Query plan for: UNWIND [42, true, "bla", 1, 2] as x RETURN x using namespace query; auto list = LIST(LITERAL(42), LITERAL(true), LITERAL("bla"), LITERAL(1), LITERAL(2)); auto x = ctx.symbol_table_.CreateSymbol("x", true); auto unwind = std::make_shared(nullptr, list, x); auto x_expr = IDENT("x"); ctx.symbol_table_[*x_expr] = x; auto x_ne = NEXPR("x", x_expr); ctx.symbol_table_[*x_ne] = ctx.symbol_table_.CreateSymbol("x_ne", true); auto produce = MakeProduce(unwind, x_ne); // Test that the plan works locally. auto results = CollectProduce(produce.get(), ctx.symbol_table_, dba); ASSERT_EQ(results.size(), 5); const int plan_id = 42; master().plan_dispatcher().DispatchPlan(plan_id, produce, ctx.symbol_table_); Parameters params; std::vector symbols{ctx.symbol_table_[*x_ne]}; auto remote_pull = [this, plan_id, ¶ms, &symbols]( database::GraphDbAccessor &dba, int worker_id) { return master().remote_pull_clients().RemotePull(dba, worker_id, plan_id, params, symbols, 3); }; auto expect_first_batch = [](auto &batch) { EXPECT_EQ(batch.pull_state, distributed::RemotePullState::CURSOR_IN_PROGRESS); ASSERT_EQ(batch.frames.size(), 3); ASSERT_EQ(batch.frames[0].size(), 1); EXPECT_EQ(batch.frames[0][0].ValueInt(), 42); EXPECT_EQ(batch.frames[1][0].ValueBool(), true); EXPECT_EQ(batch.frames[2][0].ValueString(), "bla"); }; auto expect_second_batch = [](auto &batch) { EXPECT_EQ(batch.pull_state, distributed::RemotePullState::CURSOR_EXHAUSTED); ASSERT_EQ(batch.frames.size(), 2); ASSERT_EQ(batch.frames[0].size(), 1); EXPECT_EQ(batch.frames[0][0].ValueInt(), 1); EXPECT_EQ(batch.frames[1][0].ValueInt(), 2); }; database::GraphDbAccessor dba_1{master()}; database::GraphDbAccessor dba_2{master()}; for (int worker_id : {1, 2}) { // TODO flor, proper test async here. auto tx1_batch1 = remote_pull(dba_1, worker_id).get(); expect_first_batch(tx1_batch1); auto tx2_batch1 = remote_pull(dba_2, worker_id).get(); expect_first_batch(tx2_batch1); auto tx2_batch2 = remote_pull(dba_2, worker_id).get(); expect_second_batch(tx2_batch2); auto tx1_batch2 = remote_pull(dba_1, worker_id).get(); expect_second_batch(tx1_batch2); } master().remote_pull_clients().EndAllRemotePulls(dba_1.transaction_id(), plan_id); master().remote_pull_clients().EndAllRemotePulls(dba_2.transaction_id(), plan_id); } TEST_F(DistributedGraphDbTest, RemotePullProduceRpcWithGraphElements) { // Create some data on the master and both workers. Eeach edge (3 of them) and // vertex (6 of them) will be uniquely identified with their worker id and // sequence ID, so we can check we retrieved all. storage::Property prop; { database::GraphDbAccessor dba{master()}; prop = dba.Property("prop"); auto create_data = [prop](database::GraphDbAccessor &dba, int worker_id) { auto v1 = dba.InsertVertex(); v1.PropsSet(prop, worker_id * 10); auto v2 = dba.InsertVertex(); v2.PropsSet(prop, worker_id * 10 + 1); auto e12 = dba.InsertEdge(v1, v2, dba.EdgeType("et")); e12.PropsSet(prop, worker_id * 10 + 2); }; create_data(dba, 0); database::GraphDbAccessor dba_w1{worker1(), dba.transaction_id()}; create_data(dba_w1, 1); database::GraphDbAccessor dba_w2{worker2(), dba.transaction_id()}; create_data(dba_w2, 2); dba.Commit(); } database::GraphDbAccessor dba{master()}; Context ctx{dba}; SymbolGenerator symbol_generator{ctx.symbol_table_}; AstTreeStorage storage; // Query plan for: MATCH p = (n)-[r]->(m) return [n, r], m, p // Use this query to test graph elements are transferred correctly in // collections too. auto n = MakeScanAll(storage, ctx.symbol_table_, "n"); auto r_m = MakeExpand(storage, ctx.symbol_table_, n.op_, n.sym_, "r", EdgeAtom::Direction::OUT, {}, "m", false, GraphView::OLD); auto p_sym = ctx.symbol_table_.CreateSymbol("p", true); auto p = std::make_shared( r_m.op_, p_sym, std::vector{n.sym_, r_m.edge_sym_, r_m.node_sym_}); auto return_n = IDENT("n"); ctx.symbol_table_[*return_n] = n.sym_; auto return_r = IDENT("r"); ctx.symbol_table_[*return_r] = r_m.edge_sym_; auto return_n_r = NEXPR("[n, r]", LIST(return_n, return_r)); ctx.symbol_table_[*return_n_r] = ctx.symbol_table_.CreateSymbol("", true); auto return_m = NEXPR("m", IDENT("m")); ctx.symbol_table_[*return_m->expression_] = r_m.node_sym_; ctx.symbol_table_[*return_m] = ctx.symbol_table_.CreateSymbol("", true); auto return_p = NEXPR("p", IDENT("p")); ctx.symbol_table_[*return_p->expression_] = p_sym; ctx.symbol_table_[*return_p] = ctx.symbol_table_.CreateSymbol("", true); auto produce = MakeProduce(p, return_n_r, return_m, return_p); auto check_result = [prop]( int worker_id, const std::vector> &frames) { int offset = worker_id * 10; ASSERT_EQ(frames.size(), 1); auto &row = frames[0]; ASSERT_EQ(row.size(), 3); auto &list = row[0].ValueList(); ASSERT_EQ(list.size(), 2); ASSERT_EQ(list[0].ValueVertex().PropsAt(prop).Value(), offset); ASSERT_EQ(list[1].ValueEdge().PropsAt(prop).Value(), offset + 2); ASSERT_EQ(row[1].ValueVertex().PropsAt(prop).Value(), offset + 1); auto &path = row[2].ValuePath(); ASSERT_EQ(path.size(), 1); ASSERT_EQ(path.vertices()[0].PropsAt(prop).Value(), offset); ASSERT_EQ(path.edges()[0].PropsAt(prop).Value(), offset + 2); ASSERT_EQ(path.vertices()[1].PropsAt(prop).Value(), offset + 1); }; // Test that the plan works locally. auto results = CollectProduce(produce.get(), ctx.symbol_table_, dba); check_result(0, results); const int plan_id = 42; master().plan_dispatcher().DispatchPlan(plan_id, produce, ctx.symbol_table_); Parameters params; std::vector symbols{ctx.symbol_table_[*return_n_r], ctx.symbol_table_[*return_m], p_sym}; auto remote_pull = [this, plan_id, ¶ms, &symbols]( database::GraphDbAccessor &dba, int worker_id) { return master().remote_pull_clients().RemotePull(dba, worker_id, plan_id, params, symbols, 3); }; auto future_w1_results = remote_pull(dba, 1); auto future_w2_results = remote_pull(dba, 2); check_result(1, future_w1_results.get().frames); check_result(2, future_w2_results.get().frames); master().remote_pull_clients().EndAllRemotePulls(dba.transaction_id(), plan_id); } TEST_F(DistributedGraphDbTest, BuildIndexDistributed) { using GraphDbAccessor = database::GraphDbAccessor; storage::Label label; storage::Property property; { GraphDbAccessor dba0{master()}; label = dba0.Label("label"); property = dba0.Property("property"); auto tx_id = dba0.transaction_id(); GraphDbAccessor dba1{worker1(), tx_id}; GraphDbAccessor dba2{worker2(), tx_id}; auto add_vertex = [label, property](GraphDbAccessor &dba) { auto vertex = dba.InsertVertex(); vertex.add_label(label); vertex.PropsSet(property, 1); }; for (int i = 0; i < 100; ++i) add_vertex(dba0); for (int i = 0; i < 50; ++i) add_vertex(dba1); for (int i = 0; i < 300; ++i) add_vertex(dba2); dba0.Commit(); } { GraphDbAccessor dba{master()}; dba.BuildIndex(label, property); EXPECT_TRUE(dba.LabelPropertyIndexExists(label, property)); EXPECT_EQ(CountIterable(dba.Vertices(label, property, false)), 100); } GraphDbAccessor dba_master{master()}; { GraphDbAccessor dba{worker1(), dba_master.transaction_id()}; EXPECT_TRUE(dba.LabelPropertyIndexExists(label, property)); EXPECT_EQ(CountIterable(dba.Vertices(label, property, false)), 50); } { GraphDbAccessor dba{worker2(), dba_master.transaction_id()}; EXPECT_TRUE(dba.LabelPropertyIndexExists(label, property)); EXPECT_EQ(CountIterable(dba.Vertices(label, property, false)), 300); } }