Make Distributed Memgraph Stub
Summary: * main file (copied distributed_test.cpp), start_main.py, config Made a dedicated client and memgraph file (stubs) + code structure changes Reviewers: sasa.stanko Reviewed By: sasa.stanko Subscribers: pullbot, lion, buda Differential Revision: https://phabricator.memgraph.io/D709
This commit is contained in:
parent
9d1265f41f
commit
a6b8d6b4cf
@ -27,21 +27,34 @@ include_directories(SYSTEM ${CMAKE_BINARY_DIR}/libs/gflags/include)
|
||||
file(GLOB_RECURSE src_files ${src_dir}/*.cpp)
|
||||
add_library(distributed_lib STATIC ${src_files})
|
||||
|
||||
## executable
|
||||
#### HACK: there is temporarily no working main file as the API is changing
|
||||
# set(executable_name distributed)
|
||||
# add_executable(${executable_name} ${PROJECT_SOURCE_DIR}/main.cpp)
|
||||
# target_link_libraries(${executable_name} distributed_lib)
|
||||
# target_link_libraries(${executable_name} memgraph_lib)
|
||||
# target_link_libraries(${executable_name} ${MEMGRAPH_ALL_LIBS})
|
||||
## distributed Memgraph executable
|
||||
set(executable_name main)
|
||||
add_executable(${executable_name} ${PROJECT_SOURCE_DIR}/main.cpp)
|
||||
target_link_libraries(${executable_name} distributed_lib)
|
||||
target_link_libraries(${executable_name} memgraph_lib)
|
||||
target_link_libraries(${executable_name} ${MEMGRAPH_ALL_LIBS})
|
||||
|
||||
## dummy distributed Memgraph client
|
||||
set(executable_name main-client)
|
||||
add_executable(${executable_name} ${PROJECT_SOURCE_DIR}/main-client.cpp)
|
||||
target_link_libraries(${executable_name} distributed_lib)
|
||||
target_link_libraries(${executable_name} memgraph_lib)
|
||||
target_link_libraries(${executable_name} ${MEMGRAPH_ALL_LIBS})
|
||||
|
||||
# tests
|
||||
add_subdirectory(${PROJECT_SOURCE_DIR}/tests)
|
||||
|
||||
# copy test scripts into the build/ directory
|
||||
# copy test scripts into the build/ directory (for distributed tests)
|
||||
configure_file(${PROJECT_SOURCE_DIR}/tests/start_distributed.py
|
||||
${PROJECT_BINARY_DIR}/tests/start_distributed.py COPYONLY)
|
||||
|
||||
configure_file(${PROJECT_SOURCE_DIR}/tests/config
|
||||
${PROJECT_BINARY_DIR}/tests/config COPYONLY)
|
||||
|
||||
# copy main scripts into build/ directory (for distributed Memgraph)
|
||||
configure_file(${PROJECT_SOURCE_DIR}/start_main.py
|
||||
${PROJECT_BINARY_DIR}/start_main.py COPYONLY)
|
||||
|
||||
configure_file(${PROJECT_SOURCE_DIR}/config
|
||||
${PROJECT_BINARY_DIR}/config COPYONLY)
|
||||
|
||||
|
3
experimental/distributed/config
Normal file
3
experimental/distributed/config
Normal file
@ -0,0 +1,3 @@
|
||||
0 127.0.0.1 10010
|
||||
1 127.0.0.1 10011
|
||||
2 127.0.0.1 10012
|
41
experimental/distributed/main-client.cpp
Normal file
41
experimental/distributed/main-client.cpp
Normal file
@ -0,0 +1,41 @@
|
||||
#include "memgraph_distributed.hpp"
|
||||
#include "memgraph_config.hpp"
|
||||
|
||||
#include "reactors_distributed.hpp"
|
||||
|
||||
#include <iostream>
|
||||
#include <fstream>
|
||||
|
||||
#include <gflags/gflags.h>
|
||||
#include <glog/logging.h>
|
||||
|
||||
/**
|
||||
* This is the client that issues some hard-coded queries.
|
||||
*/
|
||||
class Client : public Reactor {
|
||||
public:
|
||||
Client(std::string name) : Reactor(name) {
|
||||
}
|
||||
|
||||
virtual void Run() {
|
||||
|
||||
}
|
||||
};
|
||||
|
||||
int main(int argc, char *argv[]) {
|
||||
google::InitGoogleLogging(argv[0]);
|
||||
gflags::ParseCommandLineFlags(&argc, &argv, true);
|
||||
|
||||
System &system = System::GetInstance();
|
||||
Distributed &distributed = Distributed::GetInstance();
|
||||
MemgraphDistributed& memgraph = MemgraphDistributed::GetInstance();
|
||||
memgraph.RegisterConfig(ParseConfig());
|
||||
distributed.StartServices();
|
||||
|
||||
system.Spawn<Client>("client");
|
||||
|
||||
system.AwaitShutdown();
|
||||
distributed.StopServices();
|
||||
|
||||
return 0;
|
||||
}
|
134
experimental/distributed/main.cpp
Normal file
134
experimental/distributed/main.cpp
Normal file
@ -0,0 +1,134 @@
|
||||
#include "memgraph_distributed.hpp"
|
||||
#include "memgraph_config.hpp"
|
||||
|
||||
#include "reactors_distributed.hpp"
|
||||
|
||||
#include <iostream>
|
||||
#include <fstream>
|
||||
|
||||
#include <glog/logging.h>
|
||||
|
||||
DEFINE_uint64(my_mnid, -1, "Memgraph node id"); // TODO(zuza): this should be assigned by the leader once in the future
|
||||
|
||||
/**
|
||||
* Sends a text message and has a return address.
|
||||
*/
|
||||
class TextMessage : public ReturnAddressMsg {
|
||||
public:
|
||||
TextMessage(std::string reactor, std::string channel, std::string s)
|
||||
: ReturnAddressMsg(reactor, channel), text(s) {}
|
||||
|
||||
template <class Archive>
|
||||
void serialize(Archive &archive) {
|
||||
archive(cereal::virtual_base_class<ReturnAddressMsg>(this), text);
|
||||
}
|
||||
|
||||
std::string text;
|
||||
|
||||
protected:
|
||||
friend class cereal::access;
|
||||
TextMessage() {} // Cereal needs access to a default constructor.
|
||||
};
|
||||
CEREAL_REGISTER_TYPE(TextMessage);
|
||||
|
||||
class Master : public Reactor {
|
||||
public:
|
||||
Master(std::string name, MnidT mnid)
|
||||
: Reactor(name), mnid_(mnid) {
|
||||
worker_mnids_ = MemgraphDistributed::GetInstance().GetAllMnids();
|
||||
worker_mnids_.erase(worker_mnids_.begin()); // remove the master from the beginning
|
||||
}
|
||||
|
||||
virtual void Run() {
|
||||
MemgraphDistributed &memgraph = MemgraphDistributed::GetInstance();
|
||||
Distributed &distributed = Distributed::GetInstance();
|
||||
|
||||
std::cout << "Master (" << mnid_ << ") @ " << distributed.network().Address()
|
||||
<< ":" << distributed.network().Port() << std::endl;
|
||||
|
||||
auto stream = main_.first;
|
||||
|
||||
// wait until every worker sends a ReturnAddressMsg back, then close
|
||||
stream->OnEvent<TextMessage>([this](const TextMessage &msg,
|
||||
const Subscription &subscription) {
|
||||
std::cout << "Message from " << msg.Address() << ":" << msg.Port() << " .. " << msg.text << "\n";
|
||||
++workers_seen;
|
||||
if (workers_seen == worker_mnids_.size()) {
|
||||
subscription.Unsubscribe();
|
||||
// Sleep for a while so we can read output in the terminal.
|
||||
// (start_distributed.py runs each process in a new tab which is
|
||||
// closed immediately after process has finished)
|
||||
std::this_thread::sleep_for(std::chrono::seconds(4));
|
||||
CloseChannel("main");
|
||||
}
|
||||
});
|
||||
|
||||
// send a TextMessage to each worker
|
||||
for (auto wmnid : worker_mnids_) {
|
||||
std::cout << "wmnid_ = " << wmnid << std::endl;
|
||||
|
||||
auto stream = memgraph.FindChannel(wmnid, "worker", "main");
|
||||
stream->OnEventOnce()
|
||||
.ChainOnce<ChannelResolvedMessage>([this, stream](const ChannelResolvedMessage &msg, const Subscription&){
|
||||
msg.channelWriter()->Send<TextMessage>("master", "main", "hi from master");
|
||||
stream->Close();
|
||||
});
|
||||
}
|
||||
}
|
||||
|
||||
protected:
|
||||
MnidT workers_seen = 0;
|
||||
const MnidT mnid_;
|
||||
std::vector<MnidT> worker_mnids_;
|
||||
};
|
||||
|
||||
class Worker : public Reactor {
|
||||
public:
|
||||
Worker(std::string name, MnidT mnid)
|
||||
: Reactor(name), mnid_(mnid) {}
|
||||
|
||||
virtual void Run() {
|
||||
Distributed &distributed = Distributed::GetInstance();
|
||||
|
||||
std::cout << "Worker (" << mnid_ << ") @ " << distributed.network().Address()
|
||||
<< ":" << distributed.network().Port() << std::endl;
|
||||
|
||||
auto stream = main_.first;
|
||||
// wait until master sends us a TextMessage, then reply back and close
|
||||
stream->OnEventOnce()
|
||||
.ChainOnce<TextMessage>([this](const TextMessage &msg, const Subscription&) {
|
||||
std::cout << "Message from " << msg.Address() << ":" << msg.Port() << " .. " << msg.text << "\n";
|
||||
|
||||
msg.GetReturnChannelWriter()
|
||||
->Send<TextMessage>("worker", "main", "hi from worker");
|
||||
|
||||
// Sleep for a while so we can read output in the terminal.
|
||||
std::this_thread::sleep_for(std::chrono::seconds(4));
|
||||
CloseChannel("main");
|
||||
});
|
||||
}
|
||||
|
||||
protected:
|
||||
const MnidT mnid_;
|
||||
};
|
||||
|
||||
int main(int argc, char *argv[]) {
|
||||
google::InitGoogleLogging(argv[0]);
|
||||
gflags::ParseCommandLineFlags(&argc, &argv, true);
|
||||
|
||||
System &system = System::GetInstance();
|
||||
Distributed& distributed = Distributed::GetInstance();
|
||||
MemgraphDistributed& memgraph = MemgraphDistributed::GetInstance();
|
||||
memgraph.RegisterConfig(ParseConfig());
|
||||
distributed.StartServices();
|
||||
|
||||
if (FLAGS_my_mnid == memgraph.LeaderMnid()) {
|
||||
system.Spawn<Master>("master", FLAGS_my_mnid);
|
||||
} else {
|
||||
system.Spawn<Worker>("worker", FLAGS_my_mnid);
|
||||
}
|
||||
system.AwaitShutdown();
|
||||
distributed.StopServices();
|
||||
|
||||
return 0;
|
||||
}
|
25
experimental/distributed/src/memgraph_config.cpp
Normal file
25
experimental/distributed/src/memgraph_config.cpp
Normal file
@ -0,0 +1,25 @@
|
||||
#include "memgraph_config.hpp"
|
||||
|
||||
DEFINE_string(config_filename, "", "File containing list of all processes");
|
||||
|
||||
Config ParseConfig(const std::string &filename) {
|
||||
std::ifstream file(filename, std::ifstream::in);
|
||||
assert(file.good());
|
||||
|
||||
Config config;
|
||||
|
||||
while (file.good()) {
|
||||
MnidT mnid;
|
||||
std::string address;
|
||||
uint16_t port;
|
||||
|
||||
file >> mnid >> address >> port;
|
||||
if (file.eof())
|
||||
break;
|
||||
|
||||
config.nodes.push_back(Config::NodeConfig{mnid, address, port});
|
||||
}
|
||||
|
||||
file.close();
|
||||
return config;
|
||||
}
|
39
experimental/distributed/src/memgraph_config.hpp
Normal file
39
experimental/distributed/src/memgraph_config.hpp
Normal file
@ -0,0 +1,39 @@
|
||||
#pragma once
|
||||
|
||||
#include <cstdint>
|
||||
#include <cassert>
|
||||
#include <fstream>
|
||||
#include <utility>
|
||||
#include <vector>
|
||||
#include <string>
|
||||
|
||||
#include <gflags/gflags.h>
|
||||
|
||||
/**
|
||||
* About config file
|
||||
*
|
||||
* Each line contains three strings:
|
||||
* memgraph node id, ip address of the worker, and port of the worker
|
||||
* Data on the first line is used to start master.
|
||||
* Data on the remaining lines is used to start workers.
|
||||
*/
|
||||
DECLARE_string(config_filename);
|
||||
|
||||
using MnidT = uint64_t;
|
||||
|
||||
struct Config {
|
||||
struct NodeConfig {
|
||||
MnidT mnid;
|
||||
std::string address;
|
||||
uint16_t port;
|
||||
};
|
||||
|
||||
std::vector<NodeConfig> nodes;
|
||||
};
|
||||
|
||||
/**
|
||||
* Parse config file.
|
||||
*
|
||||
* @return config object.
|
||||
*/
|
||||
Config ParseConfig(const std::string &filename = FLAGS_config_filename);
|
77
experimental/distributed/src/memgraph_distributed.hpp
Normal file
77
experimental/distributed/src/memgraph_distributed.hpp
Normal file
@ -0,0 +1,77 @@
|
||||
#pragma once
|
||||
|
||||
#include "memgraph_config.hpp"
|
||||
|
||||
#include "reactors_distributed.hpp"
|
||||
|
||||
#include <unordered_map>
|
||||
#include <mutex>
|
||||
#include <string>
|
||||
#include <utility>
|
||||
#include <vector>
|
||||
|
||||
class MemgraphDistributed {
|
||||
private:
|
||||
using Location = std::pair<std::string, uint16_t>;
|
||||
|
||||
public:
|
||||
/**
|
||||
* Get the (singleton) instance of MemgraphDistributed.
|
||||
*
|
||||
* More info: https://stackoverflow.com/questions/1008019/c-singleton-design-pattern
|
||||
*/
|
||||
static MemgraphDistributed &GetInstance() {
|
||||
static MemgraphDistributed memgraph; // guaranteed to be destroyed, initialized on first use
|
||||
return memgraph;
|
||||
}
|
||||
|
||||
EventStream* FindChannel(MnidT mnid,
|
||||
const std::string &reactor,
|
||||
const std::string &channel) {
|
||||
std::unique_lock<std::recursive_mutex> lock(mutex_);
|
||||
const auto &location = mnodes_.at(mnid);
|
||||
return Distributed::GetInstance().FindChannel(location.first, location.second, reactor, channel);
|
||||
}
|
||||
|
||||
void RegisterConfig(const Config &config) {
|
||||
config_ = config;
|
||||
for (auto &node : config_.nodes) {
|
||||
RegisterMemgraphNode(node.mnid, node.address, node.port);
|
||||
}
|
||||
}
|
||||
|
||||
std::vector<MnidT> GetAllMnids() {
|
||||
std::vector<MnidT> mnids;
|
||||
for (auto &node : config_.nodes) {
|
||||
mnids.push_back(node.mnid);
|
||||
}
|
||||
return mnids;
|
||||
}
|
||||
|
||||
/**
|
||||
* The leader is currently the first node in the config.
|
||||
*/
|
||||
MnidT LeaderMnid() {
|
||||
return config_.nodes.front().mnid;
|
||||
}
|
||||
|
||||
protected:
|
||||
MemgraphDistributed() {}
|
||||
|
||||
/** Register memgraph node id to the given location. */
|
||||
void RegisterMemgraphNode(MnidT mnid, const std::string &address, uint16_t port) {
|
||||
std::unique_lock<std::recursive_mutex> lock(mutex_);
|
||||
mnodes_[mnid] = Location(address, port);
|
||||
}
|
||||
|
||||
private:
|
||||
Config config_;
|
||||
|
||||
std::recursive_mutex mutex_;
|
||||
std::unordered_map<MnidT, Location> mnodes_;
|
||||
|
||||
MemgraphDistributed(const MemgraphDistributed &) = delete;
|
||||
MemgraphDistributed(MemgraphDistributed &&) = delete;
|
||||
MemgraphDistributed &operator=(const MemgraphDistributed &) = delete;
|
||||
MemgraphDistributed &operator=(MemgraphDistributed &&) = delete;
|
||||
};
|
36
experimental/distributed/start_main.py
Normal file
36
experimental/distributed/start_main.py
Normal file
@ -0,0 +1,36 @@
|
||||
#!/usr/bin/env python3
|
||||
# Automatically copied to the build/ directory during Makefile (configured by cmake)
|
||||
|
||||
import os
|
||||
|
||||
command = 'gnome-terminal'
|
||||
config_filename = 'config'
|
||||
glog_flags = '-alsologtostderr --minloglevel=2'
|
||||
|
||||
|
||||
def GetMainCall(my_mnid, address, port):
|
||||
return "./main {} --my_mnid {} --address {} --port {} --config_filename={}".format(
|
||||
glog_flags, my_mnid, address, port, config_filename)
|
||||
|
||||
|
||||
def GetClientCall():
|
||||
return "./main-client {} --address 127.0.0.1 --port 10000 --config_filename={}".format(
|
||||
glog_flags, config_filename)
|
||||
|
||||
|
||||
def NamedGnomeTab(name, command):
|
||||
return " --tab -e \"bash -c 'printf \\\"\\033]0;{}\\007\\\"; {}'\" ".format(name, command)
|
||||
|
||||
|
||||
if __name__ == "__main__":
|
||||
f = open(config_filename, 'r')
|
||||
for line in f:
|
||||
data = line.strip().split(' ')
|
||||
my_mnid = data[0]
|
||||
address = data[1]
|
||||
port = data[2]
|
||||
command += NamedGnomeTab("mnid={}".format(my_mnid), GetMainCall(my_mnid, address, port))
|
||||
|
||||
command += NamedGnomeTab("client", GetClientCall())
|
||||
print(command)
|
||||
os.system(command)
|
@ -1,5 +1,4 @@
|
||||
# Unfortunately I don't know how to force CMake to copy this script to
|
||||
# the test folder so for now you will have to do it yourself.
|
||||
# Automatically copied to the build/ directory during Makefile (configured by cmake)
|
||||
|
||||
import os
|
||||
|
||||
|
Loading…
Reference in New Issue
Block a user