#include "query/plan/operator.hpp" #include #include #include #include #include #include #include "boost/archive/binary_iarchive.hpp" #include "boost/archive/binary_oarchive.hpp" #include "boost/serialization/export.hpp" #include "glog/logging.h" #include "database/graph_db_accessor.hpp" #include "distributed/remote_pull_rpc_clients.hpp" #include "distributed/remote_updates_rpc_clients.hpp" #include "distributed/remote_updates_rpc_server.hpp" #include "query/context.hpp" #include "query/exceptions.hpp" #include "query/frontend/ast/ast.hpp" #include "query/frontend/semantic/symbol_table.hpp" #include "query/interpret/eval.hpp" #include "query/path.hpp" #include "utils/exceptions.hpp" DEFINE_HIDDEN_int32(remote_pull_sleep, 2, "Sleep between remote result pulling in milliseconds"); // macro for the default implementation of LogicalOperator::Accept // that accepts the visitor and visits it's input_ operator #define ACCEPT_WITH_INPUT(class_name) \ bool class_name::Accept(HierarchicalLogicalOperatorVisitor &visitor) { \ if (visitor.PreVisit(*this)) { \ input_->Accept(visitor); \ } \ return visitor.PostVisit(*this); \ } namespace query::plan { namespace { // Sets a property on a record accessor from a TypedValue. In cases when the // TypedValue cannot be converted to PropertyValue, // QueryRuntimeException is raised. template void PropsSetChecked(TRecordAccessor &record, storage::Property key, TypedValue value) { try { record.PropsSet(key, value); } catch (const TypedValueException &) { throw QueryRuntimeException("'{}' cannot be used as a property value.", value.type()); } catch (const RecordDeletedError &) { throw QueryRuntimeException( "Trying to set properties on a deleted graph element."); } } // Checks if the given value of the symbol has the expected type. If not, raises // QueryRuntimeException. void ExpectType(Symbol symbol, TypedValue value, TypedValue::Type expected) { if (value.type() != expected) throw QueryRuntimeException("Expected a {} for '{}', but got {}.", expected, symbol.name(), value.type()); } // Returns boolean result of evaluating filter expression. Null is treated as // false. Other non boolean values raise a QueryRuntimeException. bool EvaluateFilter(ExpressionEvaluator &evaluator, Expression *filter) { TypedValue result = filter->Accept(evaluator); // Null is treated like false. if (result.IsNull()) return false; if (result.type() != TypedValue::Type::Bool) throw QueryRuntimeException( "Filter expression must be a bool or null, but got {}.", result.type()); return result.Value(); } } // namespace bool Once::OnceCursor::Pull(Frame &, Context &) { if (!did_pull_) { did_pull_ = true; return true; } return false; } std::unique_ptr Once::MakeCursor(database::GraphDbAccessor &) const { return std::make_unique(); } void Once::OnceCursor::Reset() { did_pull_ = false; } CreateNode::CreateNode(NodeAtom *node_atom, const std::shared_ptr &input) : node_atom_(node_atom), input_(input ? input : std::make_shared()) {} ACCEPT_WITH_INPUT(CreateNode) std::unique_ptr CreateNode::MakeCursor( database::GraphDbAccessor &db) const { return std::make_unique(*this, db); } std::vector CreateNode::ModifiedSymbols( const SymbolTable &table) const { auto symbols = input_->ModifiedSymbols(table); symbols.emplace_back(table.at(*node_atom_->identifier_)); return symbols; } CreateNode::CreateNodeCursor::CreateNodeCursor(const CreateNode &self, database::GraphDbAccessor &db) : self_(self), db_(db), input_cursor_(self.input_->MakeCursor(db)) {} bool CreateNode::CreateNodeCursor::Pull(Frame &frame, Context &context) { if (input_cursor_->Pull(frame, context)) { Create(frame, context); return true; } return false; } void CreateNode::CreateNodeCursor::Reset() { input_cursor_->Reset(); } void CreateNode::CreateNodeCursor::Create(Frame &frame, Context &context) { auto new_node = db_.InsertVertex(); for (auto label : self_.node_atom_->labels_) new_node.add_label(label); // Evaluator should use the latest accessors, as modified in this query, when // setting properties on new nodes. ExpressionEvaluator evaluator(frame, context.parameters_, context.symbol_table_, db_, GraphView::NEW); for (auto &kv : self_.node_atom_->properties_) PropsSetChecked(new_node, kv.first.second, kv.second->Accept(evaluator)); frame[context.symbol_table_.at(*self_.node_atom_->identifier_)] = new_node; } CreateExpand::CreateExpand(NodeAtom *node_atom, EdgeAtom *edge_atom, const std::shared_ptr &input, Symbol input_symbol, bool existing_node) : node_atom_(node_atom), edge_atom_(edge_atom), input_(input ? input : std::make_shared()), input_symbol_(input_symbol), existing_node_(existing_node) {} ACCEPT_WITH_INPUT(CreateExpand) std::unique_ptr CreateExpand::MakeCursor( database::GraphDbAccessor &db) const { return std::make_unique(*this, db); } std::vector CreateExpand::ModifiedSymbols( const SymbolTable &table) const { auto symbols = input_->ModifiedSymbols(table); symbols.emplace_back(table.at(*node_atom_->identifier_)); symbols.emplace_back(table.at(*edge_atom_->identifier_)); return symbols; } CreateExpand::CreateExpandCursor::CreateExpandCursor( const CreateExpand &self, database::GraphDbAccessor &db) : self_(self), db_(db), input_cursor_(self.input_->MakeCursor(db)) {} bool CreateExpand::CreateExpandCursor::Pull(Frame &frame, Context &context) { if (!input_cursor_->Pull(frame, context)) return false; // get the origin vertex TypedValue &vertex_value = frame[self_.input_symbol_]; ExpectType(self_.input_symbol_, vertex_value, TypedValue::Type::Vertex); auto &v1 = vertex_value.Value(); // Similarly to CreateNode, newly created edges and nodes should use the // latest accesors. ExpressionEvaluator evaluator(frame, context.parameters_, context.symbol_table_, db_, GraphView::NEW); // E.g. we pickup new properties: `CREATE (n {p: 42}) -[:r {ep: n.p}]-> ()` v1.SwitchNew(); // get the destination vertex (possibly an existing node) auto &v2 = OtherVertex(frame, context.symbol_table_, evaluator); v2.SwitchNew(); // create an edge between the two nodes switch (self_.edge_atom_->direction_) { case EdgeAtom::Direction::IN: CreateEdge(v2, v1, frame, context.symbol_table_, evaluator); break; case EdgeAtom::Direction::OUT: CreateEdge(v1, v2, frame, context.symbol_table_, evaluator); break; case EdgeAtom::Direction::BOTH: // in the case of an undirected CreateExpand we choose an arbitrary // direction. this is used in the MERGE clause // it is not allowed in the CREATE clause, and the semantic // checker needs to ensure it doesn't reach this point CreateEdge(v1, v2, frame, context.symbol_table_, evaluator); } return true; } void CreateExpand::CreateExpandCursor::Reset() { input_cursor_->Reset(); } VertexAccessor &CreateExpand::CreateExpandCursor::OtherVertex( Frame &frame, const SymbolTable &symbol_table, ExpressionEvaluator &evaluator) { if (self_.existing_node_) { const auto &dest_node_symbol = symbol_table.at(*self_.node_atom_->identifier_); TypedValue &dest_node_value = frame[dest_node_symbol]; ExpectType(dest_node_symbol, dest_node_value, TypedValue::Type::Vertex); return dest_node_value.Value(); } else { // the node does not exist, it needs to be created auto node = db_.InsertVertex(); for (auto label : self_.node_atom_->labels_) node.add_label(label); for (auto kv : self_.node_atom_->properties_) PropsSetChecked(node, kv.first.second, kv.second->Accept(evaluator)); auto symbol = symbol_table.at(*self_.node_atom_->identifier_); frame[symbol] = node; return frame[symbol].Value(); } } void CreateExpand::CreateExpandCursor::CreateEdge( VertexAccessor &from, VertexAccessor &to, Frame &frame, const SymbolTable &symbol_table, ExpressionEvaluator &evaluator) { EdgeAccessor edge = db_.InsertEdge(from, to, self_.edge_atom_->edge_types_[0]); for (auto kv : self_.edge_atom_->properties_) PropsSetChecked(edge, kv.first.second, kv.second->Accept(evaluator)); frame[symbol_table.at(*self_.edge_atom_->identifier_)] = edge; } template class ScanAllCursor : public Cursor { public: explicit ScanAllCursor(Symbol output_symbol, std::unique_ptr &&input_cursor, TVerticesFun &&get_vertices, database::GraphDbAccessor &db) : output_symbol_(output_symbol), input_cursor_(std::move(input_cursor)), get_vertices_(std::move(get_vertices)), db_(db) {} bool Pull(Frame &frame, Context &context) override { if (db_.should_abort()) throw HintedAbortError(); if (!vertices_ || vertices_it_.value() == vertices_.value().end()) { if (!input_cursor_->Pull(frame, context)) return false; // We need a getter function, because in case of exhausting a lazy // iterable, we cannot simply reset it by calling begin(). vertices_.emplace(get_vertices_(frame, context)); vertices_it_.emplace(vertices_.value().begin()); } // if vertices_ is empty then we are done even though we have just // reinitialized vertices_it_ if (vertices_it_.value() == vertices_.value().end()) return false; frame[output_symbol_] = *vertices_it_.value()++; return true; } void Reset() override { input_cursor_->Reset(); vertices_ = std::experimental::nullopt; vertices_it_ = std::experimental::nullopt; } private: const Symbol output_symbol_; const std::unique_ptr input_cursor_; TVerticesFun get_vertices_; std::experimental::optional< typename std::result_of::type> vertices_; std::experimental::optional vertices_it_; database::GraphDbAccessor &db_; }; ScanAll::ScanAll(const std::shared_ptr &input, Symbol output_symbol, GraphView graph_view) : input_(input ? input : std::make_shared()), output_symbol_(output_symbol), graph_view_(graph_view) { CHECK(graph_view != GraphView::AS_IS) << "ScanAll must have explicitly defined GraphView"; } ACCEPT_WITH_INPUT(ScanAll) std::unique_ptr ScanAll::MakeCursor( database::GraphDbAccessor &db) const { auto vertices = [this, &db](Frame &, Context &) { return db.Vertices(graph_view_ == GraphView::NEW); }; return std::make_unique>( output_symbol_, input_->MakeCursor(db), std::move(vertices), db); } std::vector ScanAll::ModifiedSymbols(const SymbolTable &table) const { auto symbols = input_->ModifiedSymbols(table); symbols.emplace_back(output_symbol_); return symbols; } ScanAllByLabel::ScanAllByLabel(const std::shared_ptr &input, Symbol output_symbol, storage::Label label, GraphView graph_view) : ScanAll(input, output_symbol, graph_view), label_(label) {} ACCEPT_WITH_INPUT(ScanAllByLabel) std::unique_ptr ScanAllByLabel::MakeCursor( database::GraphDbAccessor &db) const { auto vertices = [this, &db](Frame &, Context &) { return db.Vertices(label_, graph_view_ == GraphView::NEW); }; return std::make_unique>( output_symbol_, input_->MakeCursor(db), std::move(vertices), db); } ScanAllByLabelPropertyRange::ScanAllByLabelPropertyRange( const std::shared_ptr &input, Symbol output_symbol, storage::Label label, storage::Property property, std::experimental::optional lower_bound, std::experimental::optional upper_bound, GraphView graph_view) : ScanAll(input, output_symbol, graph_view), label_(label), property_(property), lower_bound_(lower_bound), upper_bound_(upper_bound) { DCHECK(lower_bound_ || upper_bound_) << "Only one bound can be left out"; } ACCEPT_WITH_INPUT(ScanAllByLabelPropertyRange) std::unique_ptr ScanAllByLabelPropertyRange::MakeCursor( database::GraphDbAccessor &db) const { auto vertices = [this, &db](Frame &frame, Context &context) { ExpressionEvaluator evaluator(frame, context.parameters_, context.symbol_table_, db, graph_view_); auto convert = [&evaluator](const auto &bound) -> std::experimental::optional> { if (!bound) return std::experimental::nullopt; return std::experimental::make_optional(utils::Bound( bound.value().value()->Accept(evaluator), bound.value().type())); }; return db.Vertices(label_, property_, convert(lower_bound()), convert(upper_bound()), graph_view_ == GraphView::NEW); }; return std::make_unique>( output_symbol_, input_->MakeCursor(db), std::move(vertices), db); } ScanAllByLabelPropertyValue::ScanAllByLabelPropertyValue( const std::shared_ptr &input, Symbol output_symbol, storage::Label label, storage::Property property, Expression *expression, GraphView graph_view) : ScanAll(input, output_symbol, graph_view), label_(label), property_(property), expression_(expression) { DCHECK(expression) << "Expression is not optional."; } ACCEPT_WITH_INPUT(ScanAllByLabelPropertyValue) class ScanAllByLabelPropertyValueCursor : public Cursor { public: ScanAllByLabelPropertyValueCursor(const ScanAllByLabelPropertyValue &self, database::GraphDbAccessor &db) : self_(self), db_(db), input_cursor_(self_.input()->MakeCursor(db_)) {} bool Pull(Frame &frame, Context &context) override { if (db_.should_abort()) throw HintedAbortError(); if (!vertices_ || vertices_it_.value() == vertices_.value().end()) { if (!input_cursor_->Pull(frame, context)) return false; ExpressionEvaluator evaluator(frame, context.parameters_, context.symbol_table_, db_, self_.graph_view()); TypedValue value = self_.expression()->Accept(evaluator); if (value.IsNull()) return Pull(frame, context); try { vertices_.emplace(db_.Vertices(self_.label(), self_.property(), value, self_.graph_view() == GraphView::NEW)); } catch (const TypedValueException &) { throw QueryRuntimeException("'{}' cannot be used as a property value.", value.type()); } vertices_it_.emplace(vertices_.value().begin()); } // if vertices_ is empty then we are done even though we have just // reinitialized vertices_it_ if (vertices_it_.value() == vertices_.value().end()) return false; frame[self_.output_symbol()] = *vertices_it_.value()++; return true; } void Reset() override { input_cursor_->Reset(); vertices_ = std::experimental::nullopt; vertices_it_ = std::experimental::nullopt; } private: const ScanAllByLabelPropertyValue &self_; database::GraphDbAccessor &db_; const std::unique_ptr input_cursor_; std::experimental::optional vertices_; std::experimental::optional vertices_it_; }; std::unique_ptr ScanAllByLabelPropertyValue::MakeCursor( database::GraphDbAccessor &db) const { return std::make_unique(*this, db); } ExpandCommon::ExpandCommon(Symbol node_symbol, Symbol edge_symbol, EdgeAtom::Direction direction, const std::vector &edge_types, const std::shared_ptr &input, Symbol input_symbol, bool existing_node, GraphView graph_view) : node_symbol_(node_symbol), edge_symbol_(edge_symbol), direction_(direction), edge_types_(edge_types), input_(input ? input : std::make_shared()), input_symbol_(input_symbol), existing_node_(existing_node), graph_view_(graph_view) {} bool ExpandCommon::HandleExistingNode(const VertexAccessor &new_node, Frame &frame) const { if (existing_node_) { TypedValue &old_node_value = frame[node_symbol_]; // old_node_value may be Null when using optional matching if (old_node_value.IsNull()) return false; ExpectType(node_symbol_, old_node_value, TypedValue::Type::Vertex); return old_node_value.Value() == new_node; } else { frame[node_symbol_] = new_node; return true; } } ACCEPT_WITH_INPUT(Expand) std::unique_ptr Expand::MakeCursor( database::GraphDbAccessor &db) const { return std::make_unique(*this, db); } std::vector Expand::ModifiedSymbols(const SymbolTable &table) const { auto symbols = input_->ModifiedSymbols(table); symbols.emplace_back(node_symbol()); symbols.emplace_back(edge_symbol()); return symbols; } Expand::ExpandCursor::ExpandCursor(const Expand &self, database::GraphDbAccessor &db) : self_(self), input_cursor_(self.input_->MakeCursor(db)), db_(db) {} bool Expand::ExpandCursor::Pull(Frame &frame, Context &context) { // A helper function for expanding a node from an edge. auto pull_node = [this, &frame](const EdgeAccessor &new_edge, EdgeAtom::Direction direction) { if (self_.existing_node_) return; switch (direction) { case EdgeAtom::Direction::IN: frame[self_.node_symbol_] = new_edge.from(); break; case EdgeAtom::Direction::OUT: frame[self_.node_symbol_] = new_edge.to(); break; case EdgeAtom::Direction::BOTH: LOG(FATAL) << "Must indicate exact expansion direction here"; } }; while (true) { if (db_.should_abort()) throw HintedAbortError(); // attempt to get a value from the incoming edges if (in_edges_ && *in_edges_it_ != in_edges_->end()) { EdgeAccessor edge = *(*in_edges_it_)++; frame[self_.edge_symbol_] = edge; pull_node(edge, EdgeAtom::Direction::IN); return true; } // attempt to get a value from the outgoing edges if (out_edges_ && *out_edges_it_ != out_edges_->end()) { EdgeAccessor edge = *(*out_edges_it_)++; // when expanding in EdgeAtom::Direction::BOTH directions // we should do only one expansion for cycles, and it was // already done in the block above if (self_.direction_ == EdgeAtom::Direction::BOTH && edge.is_cycle()) continue; frame[self_.edge_symbol_] = edge; pull_node(edge, EdgeAtom::Direction::OUT); return true; } // if we are here, either the edges have not been initialized, // or they have been exhausted. attempt to initialize the edges, // if the input is exhausted if (!InitEdges(frame, context)) return false; // we have re-initialized the edges, continue with the loop } } void Expand::ExpandCursor::Reset() { input_cursor_->Reset(); in_edges_ = std::experimental::nullopt; in_edges_it_ = std::experimental::nullopt; out_edges_ = std::experimental::nullopt; out_edges_it_ = std::experimental::nullopt; } namespace { // Switch the given [Vertex/Edge]Accessor to the desired state. template void SwitchAccessor(TAccessor &accessor, GraphView graph_view) { switch (graph_view) { case GraphView::NEW: accessor.SwitchNew(); break; case GraphView::OLD: accessor.SwitchOld(); break; case GraphView::AS_IS: break; } } } // namespace bool Expand::ExpandCursor::InitEdges(Frame &frame, Context &context) { // Input Vertex could be null if it is created by a failed optional match. In // those cases we skip that input pull and continue with the next. while (true) { if (!input_cursor_->Pull(frame, context)) return false; TypedValue &vertex_value = frame[self_.input_symbol_]; // Null check due to possible failed optional match. if (vertex_value.IsNull()) continue; ExpectType(self_.input_symbol_, vertex_value, TypedValue::Type::Vertex); auto &vertex = vertex_value.Value(); SwitchAccessor(vertex, self_.graph_view_); auto direction = self_.direction_; if (direction == EdgeAtom::Direction::IN || direction == EdgeAtom::Direction::BOTH) { if (self_.existing_node_) { TypedValue &existing_node = frame[self_.node_symbol_]; // old_node_value may be Null when using optional matching if (!existing_node.IsNull()) { ExpectType(self_.node_symbol_, existing_node, TypedValue::Type::Vertex); in_edges_.emplace( vertex.in(existing_node.ValueVertex(), &self_.edge_types())); } } else { in_edges_.emplace(vertex.in(&self_.edge_types())); } in_edges_it_.emplace(in_edges_->begin()); } if (direction == EdgeAtom::Direction::OUT || direction == EdgeAtom::Direction::BOTH) { if (self_.existing_node_) { TypedValue &existing_node = frame[self_.node_symbol_]; // old_node_value may be Null when using optional matching if (!existing_node.IsNull()) { ExpectType(self_.node_symbol_, existing_node, TypedValue::Type::Vertex); out_edges_.emplace( vertex.out(existing_node.ValueVertex(), &self_.edge_types())); } } else { out_edges_.emplace(vertex.out(&self_.edge_types())); } out_edges_it_.emplace(out_edges_->begin()); } return true; } } ExpandVariable::ExpandVariable( Symbol node_symbol, Symbol edge_symbol, EdgeAtom::Type type, EdgeAtom::Direction direction, const std::vector &edge_types, bool is_reverse, Expression *lower_bound, Expression *upper_bound, const std::shared_ptr &input, Symbol input_symbol, bool existing_node, Lambda filter_lambda, std::experimental::optional weight_lambda, std::experimental::optional total_weight, GraphView graph_view) : ExpandCommon(node_symbol, edge_symbol, direction, edge_types, input, input_symbol, existing_node, graph_view), type_(type), is_reverse_(is_reverse), lower_bound_(lower_bound), upper_bound_(upper_bound), filter_lambda_(filter_lambda), weight_lambda_(weight_lambda), total_weight_(total_weight) { DCHECK(type_ == EdgeAtom::Type::DEPTH_FIRST || type_ == EdgeAtom::Type::BREADTH_FIRST || type_ == EdgeAtom::Type::WEIGHTED_SHORTEST_PATH) << "ExpandVariable can only be used with breadth first, depth first or " "weighted shortest path type"; DCHECK(!(type_ == EdgeAtom::Type::BREADTH_FIRST && is_reverse)) << "Breadth first expansion can't be reversed"; } ACCEPT_WITH_INPUT(ExpandVariable) std::vector ExpandVariable::ModifiedSymbols( const SymbolTable &table) const { auto symbols = input_->ModifiedSymbols(table); symbols.emplace_back(node_symbol()); symbols.emplace_back(edge_symbol()); return symbols; } namespace { /** * Helper function that returns an iterable over * pairs * for the given params. * * @param vertex - The vertex to expand from. * @param direction - Expansion direction. All directions (IN, OUT, BOTH) * are supported. * @return See above. */ auto ExpandFromVertex(const VertexAccessor &vertex, EdgeAtom::Direction direction, const std::vector &edge_types) { // wraps an EdgeAccessor into a pair auto wrapper = [](EdgeAtom::Direction direction, auto &&vertices) { return iter::imap( [direction](const EdgeAccessor &edge) { return std::make_pair(edge, direction); }, std::move(vertices)); }; // prepare a vector of elements we'll pass to the itertools std::vector chain_elements; if (direction != EdgeAtom::Direction::OUT && vertex.in_degree() > 0) { auto edges = vertex.in(&edge_types); if (edges.begin() != edges.end()) { chain_elements.emplace_back( wrapper(EdgeAtom::Direction::IN, std::move(edges))); } } if (direction != EdgeAtom::Direction::IN && vertex.out_degree() > 0) { auto edges = vertex.out(&edge_types); if (edges.begin() != edges.end()) { chain_elements.emplace_back( wrapper(EdgeAtom::Direction::OUT, std::move(edges))); } } return iter::chain.from_iterable(std::move(chain_elements)); } /** A helper function for evaluating an expression that's an int. * * @param evaluator * @param expr * @param what - Name of what's getting evaluated. Used for user * feedback (via exception) when the evaluated value is not an int. */ int64_t EvaluateInt(ExpressionEvaluator &evaluator, Expression *expr, const std::string &what) { TypedValue value = expr->Accept(evaluator); try { return value.Value(); } catch (TypedValueException &e) { throw QueryRuntimeException(what + " must be an int"); } } } // namespace class ExpandVariableCursor : public Cursor { public: ExpandVariableCursor(const ExpandVariable &self, database::GraphDbAccessor &db) : self_(self), db_(db), input_cursor_(self.input_->MakeCursor(db)) {} bool Pull(Frame &frame, Context &context) override { ExpressionEvaluator evaluator(frame, context.parameters_, context.symbol_table_, db_, self_.graph_view_); while (true) { if (Expand(frame, context)) return true; if (PullInput(frame, context)) { // if lower bound is zero we also yield empty paths if (lower_bound_ == 0) { auto &start_vertex = frame[self_.input_symbol_].Value(); if (self_.HandleExistingNode(start_vertex, frame)) { return true; } } // if lower bound is not zero, we just continue, the next // loop iteration will attempt to expand and we're good } else return false; // else continue with the loop, try to expand again // because we succesfully pulled from the input } } void Reset() override { input_cursor_->Reset(); edges_.clear(); edges_it_.clear(); } private: const ExpandVariable &self_; database::GraphDbAccessor &db_; const std::unique_ptr input_cursor_; // bounds. in the cursor they are not optional but set to // default values if missing in the ExpandVariable operator // initialize to arbitrary values, they should only be used // after a successful pull from the input int64_t upper_bound_{-1}; int64_t lower_bound_{-1}; // a stack of edge iterables corresponding to the level/depth of // the expansion currently being Pulled std::vector(), EdgeAtom::Direction::IN, self_.edge_types_))> edges_; // an iterator indicating the possition in the corresponding edges_ // element std::vectorbegin())> edges_it_; /** * Helper function that Pulls from the input vertex and * makes iteration over it's edges possible. * * @return If the Pull succeeded. If not, this VariableExpandCursor * is exhausted. */ bool PullInput(Frame &frame, Context &context) { // Input Vertex could be null if it is created by a failed optional // match. // In those cases we skip that input pull and continue with the next. while (true) { if (!input_cursor_->Pull(frame, context)) return false; TypedValue &vertex_value = frame[self_.input_symbol_]; // Null check due to possible failed optional match. if (vertex_value.IsNull()) continue; ExpectType(self_.input_symbol_, vertex_value, TypedValue::Type::Vertex); auto &vertex = vertex_value.Value(); SwitchAccessor(vertex, self_.graph_view_); // Evaluate the upper and lower bounds. ExpressionEvaluator evaluator(frame, context.parameters_, context.symbol_table_, db_); auto calc_bound = [&evaluator](auto &bound) { auto value = EvaluateInt(evaluator, bound, "Variable expansion bound"); if (value < 0) throw QueryRuntimeException( "Variable expansion bound must be positive or zero"); return value; }; lower_bound_ = self_.lower_bound_ ? calc_bound(self_.lower_bound_) : 1; upper_bound_ = self_.upper_bound_ ? calc_bound(self_.upper_bound_) : std::numeric_limits::max(); if (upper_bound_ > 0) { SwitchAccessor(vertex, self_.graph_view_); edges_.emplace_back( ExpandFromVertex(vertex, self_.direction_, self_.edge_types_)); edges_it_.emplace_back(edges_.back().begin()); } // reset the frame value to an empty edge list frame[self_.edge_symbol_] = std::vector(); return true; } } // Helper function for appending an edge to the list on the frame. void AppendEdge(const EdgeAccessor &new_edge, std::vector &edges_on_frame) { // We are placing an edge on the frame. It is possible that there already // exists an edge on the frame for this level. If so first remove it. DCHECK(edges_.size() > 0) << "Edges are empty"; if (self_.is_reverse_) { // TODO: This is innefficient, we should look into replacing // vector with something else for TypedValue::List. size_t diff = edges_on_frame.size() - std::min(edges_on_frame.size(), edges_.size() - 1U); if (diff > 0U) edges_on_frame.erase(edges_on_frame.begin(), edges_on_frame.begin() + diff); edges_on_frame.insert(edges_on_frame.begin(), new_edge); } else { edges_on_frame.resize( std::min(edges_on_frame.size(), edges_.size() - 1U)); edges_on_frame.emplace_back(new_edge); } } /** * Performs a single expansion for the current state of this * VariableExpansionCursor. * * @return True if the expansion was a success and this Cursor's * consumer can consume it. False if the expansion failed. In that * case no more expansions are available from the current input * vertex and another Pull from the input cursor should be performed. */ bool Expand(Frame &frame, Context &context) { ExpressionEvaluator evaluator(frame, context.parameters_, context.symbol_table_, db_, self_.graph_view_); // Some expansions might not be valid due to edge uniqueness and // existing_node criterions, so expand in a loop until either the input // vertex is exhausted or a valid variable-length expansion is available. while (true) { // pop from the stack while there is stuff to pop and the current // level is exhausted while (!edges_.empty() && edges_it_.back() == edges_.back().end()) { edges_.pop_back(); edges_it_.pop_back(); } // check if we exhausted everything, if so return false if (edges_.empty()) return false; // we use this a lot std::vector &edges_on_frame = frame[self_.edge_symbol_].Value>(); // it is possible that edges_on_frame does not contain as many // elements as edges_ due to edge-uniqueness (when a whole layer // gets exhausted but no edges are valid). for that reason only // pop from edges_on_frame if they contain enough elements if (self_.is_reverse_) { auto diff = edges_on_frame.size() - std::min(edges_on_frame.size(), edges_.size()); if (diff > 0) { edges_on_frame.erase(edges_on_frame.begin(), edges_on_frame.begin() + diff); } } else { edges_on_frame.resize(std::min(edges_on_frame.size(), edges_.size())); } // if we are here, we have a valid stack, // get the edge, increase the relevant iterator std::pair current_edge = *edges_it_.back()++; // Check edge-uniqueness. bool found_existing = std::any_of(edges_on_frame.begin(), edges_on_frame.end(), [¤t_edge](const TypedValue &edge) { return current_edge.first == edge.Value(); }); if (found_existing) continue; AppendEdge(current_edge.first, edges_on_frame); VertexAccessor current_vertex = current_edge.second == EdgeAtom::Direction::IN ? current_edge.first.from() : current_edge.first.to(); if (!self_.HandleExistingNode(current_vertex, frame)) continue; // Skip expanding out of filtered expansion. frame[self_.filter_lambda_.inner_edge_symbol] = current_edge.first; frame[self_.filter_lambda_.inner_node_symbol] = current_vertex; if (self_.filter_lambda_.expression && !EvaluateFilter(evaluator, self_.filter_lambda_.expression)) continue; // we are doing depth-first search, so place the current // edge's expansions onto the stack, if we should continue to expand if (upper_bound_ > static_cast(edges_.size())) { SwitchAccessor(current_vertex, self_.graph_view_); edges_.emplace_back(ExpandFromVertex(current_vertex, self_.direction_, self_.edge_types_)); edges_it_.emplace_back(edges_.back().begin()); } // We only yield true if we satisfy the lower bound. if (static_cast(edges_on_frame.size()) >= lower_bound_) return true; else continue; } } }; class ExpandBreadthFirstCursor : public query::plan::Cursor { public: ExpandBreadthFirstCursor(const ExpandVariable &self, database::GraphDbAccessor &db) : self_(self), db_(db), input_cursor_(self_.input_->MakeCursor(db)) {} bool Pull(Frame &frame, Context &context) override { // evaulator for the filtering condition ExpressionEvaluator evaluator(frame, context.parameters_, context.symbol_table_, db_, self_.graph_view_); // for the given (edge, vertex) pair checks if they satisfy the // "where" condition. if so, places them in the to_visit_ structure. auto expand_pair = [this, &evaluator, &frame](EdgeAccessor edge, VertexAccessor vertex) { // if we already processed the given vertex it doesn't get expanded if (processed_.find(vertex) != processed_.end()) return; SwitchAccessor(edge, self_.graph_view_); SwitchAccessor(vertex, self_.graph_view_); frame[self_.filter_lambda_.inner_edge_symbol] = edge; frame[self_.filter_lambda_.inner_node_symbol] = vertex; if (self_.filter_lambda_.expression) { TypedValue result = self_.filter_lambda_.expression->Accept(evaluator); switch (result.type()) { case TypedValue::Type::Null: return; case TypedValue::Type::Bool: if (!result.Value()) return; break; default: throw QueryRuntimeException( "Expansion condition must be boolean or null"); } } to_visit_next_.emplace_back(edge, vertex); processed_.emplace(vertex, edge); }; // populates the to_visit_next_ structure with expansions // from the given vertex. skips expansions that don't satisfy // the "where" condition. auto expand_from_vertex = [this, &expand_pair](VertexAccessor &vertex) { if (self_.direction_ != EdgeAtom::Direction::IN) { for (const EdgeAccessor &edge : vertex.out(&self_.edge_types_)) expand_pair(edge, edge.to()); } if (self_.direction_ != EdgeAtom::Direction::OUT) { for (const EdgeAccessor &edge : vertex.in(&self_.edge_types_)) expand_pair(edge, edge.from()); } }; // do it all in a loop because we skip some elements while (true) { // if we have nothing to visit on the current depth, switch to next if (to_visit_current_.empty()) to_visit_current_.swap(to_visit_next_); // if current is still empty, it means both are empty, so pull from // input if (to_visit_current_.empty()) { if (!input_cursor_->Pull(frame, context)) return false; processed_.clear(); auto vertex_value = frame[self_.input_symbol_]; // it is possible that the vertex is Null due to optional matching if (vertex_value.IsNull()) continue; auto vertex = vertex_value.Value(); SwitchAccessor(vertex, self_.graph_view_); processed_.emplace(vertex, std::experimental::nullopt); expand_from_vertex(vertex); lower_bound_ = self_.lower_bound_ ? EvaluateInt(evaluator, self_.lower_bound_, "Min depth in breadth-first expansion") : 1; upper_bound_ = self_.upper_bound_ ? EvaluateInt(evaluator, self_.upper_bound_, "Max depth in breadth-first expansion") : std::numeric_limits::max(); if (upper_bound_ < 1) throw QueryRuntimeException( "Max depth in breadth-first expansion must be greater then " "zero"); // go back to loop start and see if we expanded anything continue; } // take the next expansion from the queue std::pair expansion = to_visit_current_.front(); to_visit_current_.pop_front(); // create the frame value for the edges std::vector edge_list{expansion.first}; auto last_vertex = expansion.second; while (true) { const EdgeAccessor &last_edge = edge_list.back().Value(); last_vertex = last_edge.from() == last_vertex ? last_edge.to() : last_edge.from(); // origin_vertex must be in processed const auto &previous_edge = processed_.find(last_vertex)->second; if (!previous_edge) break; edge_list.push_back(previous_edge.value()); } // expand only if what we've just expanded is less then max depth if (static_cast(edge_list.size()) < upper_bound_) expand_from_vertex(expansion.second); if (static_cast(edge_list.size()) < lower_bound_) continue; // place destination node on the frame, handle existence flag if (self_.existing_node_) { TypedValue &node = frame[self_.node_symbol_]; // due to optional matching the existing node could be null if (node.IsNull() || (node != expansion.second).Value()) continue; } else frame[self_.node_symbol_] = expansion.second; // place edges on the frame in the correct order std::reverse(edge_list.begin(), edge_list.end()); frame[self_.edge_symbol_] = std::move(edge_list); return true; } } void Reset() override { input_cursor_->Reset(); processed_.clear(); to_visit_next_.clear(); to_visit_current_.clear(); } private: const ExpandVariable &self_; database::GraphDbAccessor &db_; const std::unique_ptr input_cursor_; // Depth bounds. Calculated on each pull from the input, the initial value is // irrelevant. int lower_bound_{-1}; int upper_bound_{-1}; // maps vertices to the edge they got expanded from. it is an optional // edge because the root does not get expanded from anything. // contains visited vertices as well as those scheduled to be visited. std::unordered_map> processed_; // edge/vertex pairs we have yet to visit, for current and next depth std::deque> to_visit_current_; std::deque> to_visit_next_; }; class ExpandWeightedShortestPathCursor : public query::plan::Cursor { public: ExpandWeightedShortestPathCursor(const ExpandVariable &self, database::GraphDbAccessor &db) : self_(self), db_(db), input_cursor_(self_.input_->MakeCursor(db)) {} bool Pull(Frame &frame, Context &context) override { ExpressionEvaluator evaluator(frame, context.parameters_, context.symbol_table_, db_, self_.graph_view_); // For the given (vertex, edge, vertex) tuple checks if they satisfy the // "where" condition. if so, places them in the priority queue. auto expand_pair = [this, &evaluator, &frame]( VertexAccessor from, EdgeAccessor edge, VertexAccessor vertex) { SwitchAccessor(edge, self_.graph_view_); SwitchAccessor(vertex, self_.graph_view_); if (self_.filter_lambda_.expression) { frame[self_.filter_lambda_.inner_edge_symbol] = edge; frame[self_.filter_lambda_.inner_node_symbol] = vertex; if (!EvaluateFilter(evaluator, self_.filter_lambda_.expression)) return; } frame[self_.weight_lambda_->inner_edge_symbol] = edge; frame[self_.weight_lambda_->inner_node_symbol] = vertex; TypedValue typed_weight = self_.weight_lambda_->expression->Accept(evaluator); if (!typed_weight.IsNumeric()) { throw QueryRuntimeException("Calculated weight must be numeric, got {}", typed_weight.type()); } if ((typed_weight < 0).Value()) { throw QueryRuntimeException("Calculated weight can't be negative!"); } auto total_weight = weights_[from] + typed_weight; auto found_it = weights_.find(vertex); if (found_it != weights_.end() && found_it->second.Value() <= total_weight.Value()) return; pq_.push(std::make_pair(std::make_pair(vertex, edge), total_weight.Value())); }; // Populates the priority queue structure with expansions // from the given vertex. skips expansions that don't satisfy // the "where" condition. auto expand_from_vertex = [this, &expand_pair](VertexAccessor &vertex) { if (self_.direction_ != EdgeAtom::Direction::IN) { for (const EdgeAccessor &edge : vertex.out(&self_.edge_types_)) { expand_pair(vertex, edge, edge.to()); } } if (self_.direction_ != EdgeAtom::Direction::OUT) { for (const EdgeAccessor &edge : vertex.in(&self_.edge_types_)) { expand_pair(vertex, edge, edge.from()); } } }; while (true) { if (pq_.empty()) { if (!input_cursor_->Pull(frame, context)) return false; auto vertex_value = frame[self_.input_symbol_]; if (vertex_value.IsNull()) continue; auto vertex = vertex_value.Value(); if (self_.existing_node_) { TypedValue &node = frame[self_.node_symbol_]; // Due to optional matching the existing node could be null. // Skip expansion for such nodes. if (node.IsNull()) continue; } SwitchAccessor(vertex, self_.graph_view_); upper_bound_ = self_.upper_bound_ ? EvaluateInt(evaluator, self_.upper_bound_, "Max depth in weighted shortest path expansion") : std::numeric_limits::max(); if (upper_bound_ < 1) throw QueryRuntimeException( "Max depth in weighted shortest path expansion must be greater " "than zero"); // Clear existing data structures. previous_.clear(); weights_.clear(); pq_.push(std::make_pair( std::make_pair(vertex, std::experimental::nullopt), 0.0)); } while (!pq_.empty()) { auto current = pq_.top(); pq_.pop(); // Check if the edge has already been processed. if (weights_.find(current.first.first) != weights_.end()) { continue; } previous_.emplace(current.first.first, current.first.second); weights_.emplace(current.first.first, current.second); // Reconstruct the path. auto last_vertex = current.first.first; std::vector edge_list{}; while (true) { // Origin_vertex must be in previous. const auto &previous_edge = previous_.find(last_vertex)->second; if (!previous_edge) break; last_vertex = previous_edge->from() == last_vertex ? previous_edge->to() : previous_edge->from(); edge_list.push_back(previous_edge.value()); } // Expand only if what we've just expanded is less then max depth. if (static_cast(edge_list.size()) < upper_bound_) expand_from_vertex(current.first.first); if (edge_list.empty()) continue; // Place destination node on the frame, handle existence flag. if (self_.existing_node_) { TypedValue &node = frame[self_.node_symbol_]; if ((node != current.first.first).Value()) continue; else // Prevent expanding other paths, because we found the // shortest to existing node. ClearQueue(); } else { frame[self_.node_symbol_] = current.first.first; } if (!self_.is_reverse_) { // Place edges on the frame in the correct order. std::reverse(edge_list.begin(), edge_list.end()); } frame[self_.edge_symbol_] = std::move(edge_list); frame[self_.total_weight_.value()] = current.second; return true; } } } void Reset() override { input_cursor_->Reset(); previous_.clear(); weights_.clear(); ClearQueue(); } private: const ExpandVariable &self_; database::GraphDbAccessor &db_; const std::unique_ptr input_cursor_; // Upper bound on the path length. int upper_bound_{-1}; // Maps vertices to weights they got in expansion. std::unordered_map weights_; // Maps vertices to edges used to reach them. std::unordered_map> previous_; // Priority queue comparator. Keep lowest weight on top of the queue. class PriorityQueueComparator { public: bool operator()( const std::pair>, double> &lhs, const std::pair>, double> &rhs) { return lhs.second > rhs.second; } }; std::priority_queue< std::pair< std::pair>, double>, std::vector>, double>>, PriorityQueueComparator> pq_; void ClearQueue() { while (!pq_.empty()) pq_.pop(); } }; std::unique_ptr ExpandVariable::MakeCursor( database::GraphDbAccessor &db) const { if (type_ == EdgeAtom::Type::BREADTH_FIRST) return std::make_unique(*this, db); else if (type_ == EdgeAtom::Type::WEIGHTED_SHORTEST_PATH) return std::make_unique(*this, db); else return std::make_unique(*this, db); } class ConstructNamedPathCursor : public Cursor { public: ConstructNamedPathCursor(const ConstructNamedPath &self, database::GraphDbAccessor &db) : self_(self), input_cursor_(self_.input()->MakeCursor(db)) {} bool Pull(Frame &frame, Context &context) override { if (!input_cursor_->Pull(frame, context)) return false; auto symbol_it = self_.path_elements().begin(); DCHECK(symbol_it != self_.path_elements().end()) << "Named path must contain at least one node"; TypedValue start_vertex = frame[*symbol_it++]; // In an OPTIONAL MATCH everything could be Null. if (start_vertex.IsNull()) { frame[self_.path_symbol()] = TypedValue::Null; return true; } DCHECK(start_vertex.IsVertex()) << "First named path element must be a vertex"; query::Path path(start_vertex.ValueVertex()); // If the last path element symbol was for an edge list, then // the next symbol is a vertex and it should not append to the path // because // expansion already did it. bool last_was_edge_list = false; for (; symbol_it != self_.path_elements().end(); symbol_it++) { TypedValue expansion = frame[*symbol_it]; // We can have Null (OPTIONAL MATCH), a vertex, an edge, or an edge // list (variable expand or BFS). switch (expansion.type()) { case TypedValue::Type::Null: frame[self_.path_symbol()] = TypedValue::Null; return true; case TypedValue::Type::Vertex: if (!last_was_edge_list) path.Expand(expansion.ValueVertex()); last_was_edge_list = false; break; case TypedValue::Type::Edge: path.Expand(expansion.ValueEdge()); break; case TypedValue::Type::List: { last_was_edge_list = true; // We need to expand all edges in the list and intermediary // vertices. const std::vector &edges = expansion.ValueList(); for (const auto &edge_value : edges) { const EdgeAccessor &edge = edge_value.ValueEdge(); const VertexAccessor from = edge.from(); if (path.vertices().back() == from) path.Expand(edge, edge.to()); else path.Expand(edge, from); } break; } default: LOG(FATAL) << "Unsupported type in named path construction"; break; } } frame[self_.path_symbol()] = path; return true; } void Reset() override { input_cursor_->Reset(); } private: const ConstructNamedPath self_; const std::unique_ptr input_cursor_; }; ACCEPT_WITH_INPUT(ConstructNamedPath) std::unique_ptr ConstructNamedPath::MakeCursor( database::GraphDbAccessor &db) const { return std::make_unique(*this, db); } std::vector ConstructNamedPath::ModifiedSymbols( const SymbolTable &table) const { auto symbols = input_->ModifiedSymbols(table); symbols.emplace_back(path_symbol_); return symbols; } Filter::Filter(const std::shared_ptr &input, Expression *expression) : input_(input ? input : std::make_shared()), expression_(expression) {} ACCEPT_WITH_INPUT(Filter) std::unique_ptr Filter::MakeCursor( database::GraphDbAccessor &db) const { return std::make_unique(*this, db); } std::vector Filter::ModifiedSymbols(const SymbolTable &table) const { return input_->ModifiedSymbols(table); } Filter::FilterCursor::FilterCursor(const Filter &self, database::GraphDbAccessor &db) : self_(self), db_(db), input_cursor_(self_.input_->MakeCursor(db)) {} bool Filter::FilterCursor::Pull(Frame &frame, Context &context) { // Like all filters, newly set values should not affect filtering of old // nodes and edges. ExpressionEvaluator evaluator(frame, context.parameters_, context.symbol_table_, db_, GraphView::OLD); while (input_cursor_->Pull(frame, context)) { if (EvaluateFilter(evaluator, self_.expression_)) return true; } return false; } void Filter::FilterCursor::Reset() { input_cursor_->Reset(); } Produce::Produce(const std::shared_ptr &input, const std::vector &named_expressions) : input_(input ? input : std::make_shared()), named_expressions_(named_expressions) {} ACCEPT_WITH_INPUT(Produce) std::unique_ptr Produce::MakeCursor( database::GraphDbAccessor &db) const { return std::make_unique(*this, db); } std::vector Produce::OutputSymbols( const SymbolTable &symbol_table) const { std::vector symbols; for (const auto &named_expr : named_expressions_) { symbols.emplace_back(symbol_table.at(*named_expr)); } return symbols; } std::vector Produce::ModifiedSymbols(const SymbolTable &table) const { return OutputSymbols(table); } const std::vector &Produce::named_expressions() { return named_expressions_; } Produce::ProduceCursor::ProduceCursor(const Produce &self, database::GraphDbAccessor &db) : self_(self), db_(db), input_cursor_(self_.input_->MakeCursor(db)) {} bool Produce::ProduceCursor::Pull(Frame &frame, Context &context) { if (input_cursor_->Pull(frame, context)) { // Produce should always yield the latest results. ExpressionEvaluator evaluator(frame, context.parameters_, context.symbol_table_, db_, GraphView::NEW); for (auto named_expr : self_.named_expressions_) named_expr->Accept(evaluator); return true; } return false; } void Produce::ProduceCursor::Reset() { input_cursor_->Reset(); } Delete::Delete(const std::shared_ptr &input_, const std::vector &expressions, bool detach_) : input_(input_), expressions_(expressions), detach_(detach_) {} ACCEPT_WITH_INPUT(Delete) std::unique_ptr Delete::MakeCursor( database::GraphDbAccessor &db) const { return std::make_unique(*this, db); } std::vector Delete::ModifiedSymbols(const SymbolTable &table) const { return input_->ModifiedSymbols(table); } Delete::DeleteCursor::DeleteCursor(const Delete &self, database::GraphDbAccessor &db) : self_(self), db_(db), input_cursor_(self_.input_->MakeCursor(db)) {} bool Delete::DeleteCursor::Pull(Frame &frame, Context &context) { if (!input_cursor_->Pull(frame, context)) return false; // Delete should get the latest information, this way it is also possible // to // delete newly added nodes and edges. ExpressionEvaluator evaluator(frame, context.parameters_, context.symbol_table_, db_, GraphView::NEW); // collect expressions results so edges can get deleted before vertices // this is necessary because an edge that gets deleted could block vertex // deletion std::vector expression_results; expression_results.reserve(self_.expressions_.size()); for (Expression *expression : self_.expressions_) { expression_results.emplace_back(expression->Accept(evaluator)); } // delete edges first for (TypedValue &expression_result : expression_results) if (expression_result.type() == TypedValue::Type::Edge) db_.RemoveEdge(expression_result.Value()); // delete vertices for (TypedValue &expression_result : expression_results) switch (expression_result.type()) { case TypedValue::Type::Vertex: { VertexAccessor &va = expression_result.Value(); va.SwitchNew(); // necessary because an edge deletion could have // updated if (self_.detach_) db_.DetachRemoveVertex(va); else if (!db_.RemoveVertex(va)) throw QueryRuntimeException( "Failed to remove vertex because of it's existing " "connections. Consider using DETACH DELETE."); break; } // skip Edges (already deleted) and Nulls (can occur in optional // match) case TypedValue::Type::Edge: case TypedValue::Type::Null: break; // check we're not trying to delete anything except vertices and edges default: throw QueryRuntimeException("Can only delete edges and vertices"); } return true; } void Delete::DeleteCursor::Reset() { input_cursor_->Reset(); } SetProperty::SetProperty(const std::shared_ptr &input, PropertyLookup *lhs, Expression *rhs) : input_(input), lhs_(lhs), rhs_(rhs) {} ACCEPT_WITH_INPUT(SetProperty) std::unique_ptr SetProperty::MakeCursor( database::GraphDbAccessor &db) const { return std::make_unique(*this, db); } std::vector SetProperty::ModifiedSymbols( const SymbolTable &table) const { return input_->ModifiedSymbols(table); } SetProperty::SetPropertyCursor::SetPropertyCursor(const SetProperty &self, database::GraphDbAccessor &db) : self_(self), db_(db), input_cursor_(self.input_->MakeCursor(db)) {} bool SetProperty::SetPropertyCursor::Pull(Frame &frame, Context &context) { if (!input_cursor_->Pull(frame, context)) return false; // Set, just like Create needs to see the latest changes. ExpressionEvaluator evaluator(frame, context.parameters_, context.symbol_table_, db_, GraphView::NEW); TypedValue lhs = self_.lhs_->expression_->Accept(evaluator); TypedValue rhs = self_.rhs_->Accept(evaluator); switch (lhs.type()) { case TypedValue::Type::Vertex: PropsSetChecked(lhs.Value(), self_.lhs_->property_, rhs); break; case TypedValue::Type::Edge: PropsSetChecked(lhs.Value(), self_.lhs_->property_, rhs); break; case TypedValue::Type::Null: // Skip setting properties on Null (can occur in optional match). break; case TypedValue::Type::Map: // Semantically modifying a map makes sense, but it's not supported due // to // all the copying we do (when PropertyValue -> TypedValue and in // ExpressionEvaluator). So even though we set a map property here, that // is never visible to the user and it's not stored. // TODO: fix above described bug default: throw QueryRuntimeException( "Properties can only be set on Vertices and Edges"); } return true; } void SetProperty::SetPropertyCursor::Reset() { input_cursor_->Reset(); } SetProperties::SetProperties(const std::shared_ptr &input, Symbol input_symbol, Expression *rhs, Op op) : input_(input), input_symbol_(input_symbol), rhs_(rhs), op_(op) {} ACCEPT_WITH_INPUT(SetProperties) std::unique_ptr SetProperties::MakeCursor( database::GraphDbAccessor &db) const { return std::make_unique(*this, db); } std::vector SetProperties::ModifiedSymbols( const SymbolTable &table) const { return input_->ModifiedSymbols(table); } SetProperties::SetPropertiesCursor::SetPropertiesCursor( const SetProperties &self, database::GraphDbAccessor &db) : self_(self), db_(db), input_cursor_(self.input_->MakeCursor(db)) {} bool SetProperties::SetPropertiesCursor::Pull(Frame &frame, Context &context) { if (!input_cursor_->Pull(frame, context)) return false; TypedValue &lhs = frame[self_.input_symbol_]; // Set, just like Create needs to see the latest changes. ExpressionEvaluator evaluator(frame, context.parameters_, context.symbol_table_, db_, GraphView::NEW); TypedValue rhs = self_.rhs_->Accept(evaluator); switch (lhs.type()) { case TypedValue::Type::Vertex: Set(lhs.Value(), rhs); break; case TypedValue::Type::Edge: Set(lhs.Value(), rhs); break; case TypedValue::Type::Null: // Skip setting properties on Null (can occur in optional match). break; default: throw QueryRuntimeException( "Properties can only be set on Vertices and Edges"); } return true; } void SetProperties::SetPropertiesCursor::Reset() { input_cursor_->Reset(); } template void SetProperties::SetPropertiesCursor::Set(TRecordAccessor &record, const TypedValue &rhs) const { record.SwitchNew(); if (self_.op_ == Op::REPLACE) { try { record.PropsClear(); } catch (const RecordDeletedError &) { throw QueryRuntimeException( "Trying to set properties on a deleted graph element."); } } auto set_props = [&record](const auto &properties) { try { for (const auto &kv : properties) record.PropsSet(kv.first, kv.second); } catch (const RecordDeletedError &) { throw QueryRuntimeException( "Trying to set properties on a deleted graph element."); } }; switch (rhs.type()) { case TypedValue::Type::Edge: set_props(rhs.Value().Properties()); break; case TypedValue::Type::Vertex: set_props(rhs.Value().Properties()); break; case TypedValue::Type::Map: { for (const auto &kv : rhs.Value>()) PropsSetChecked(record, db_.Property(kv.first), kv.second); break; } default: throw QueryRuntimeException( "Can only set Vertices, Edges and maps as properties"); } } // instantiate the SetProperties function with concrete TRecordAccessor // types template void SetProperties::SetPropertiesCursor::Set( RecordAccessor &record, const TypedValue &rhs) const; template void SetProperties::SetPropertiesCursor::Set( RecordAccessor &record, const TypedValue &rhs) const; SetLabels::SetLabels(const std::shared_ptr &input, Symbol input_symbol, const std::vector &labels) : input_(input), input_symbol_(input_symbol), labels_(labels) {} ACCEPT_WITH_INPUT(SetLabels) std::unique_ptr SetLabels::MakeCursor( database::GraphDbAccessor &db) const { return std::make_unique(*this, db); } std::vector SetLabels::ModifiedSymbols(const SymbolTable &table) const { return input_->ModifiedSymbols(table); } SetLabels::SetLabelsCursor::SetLabelsCursor(const SetLabels &self, database::GraphDbAccessor &db) : self_(self), input_cursor_(self.input_->MakeCursor(db)) {} bool SetLabels::SetLabelsCursor::Pull(Frame &frame, Context &context) { if (!input_cursor_->Pull(frame, context)) return false; TypedValue &vertex_value = frame[self_.input_symbol_]; // Skip setting labels on Null (can occur in optional match). if (vertex_value.IsNull()) return true; ExpectType(self_.input_symbol_, vertex_value, TypedValue::Type::Vertex); auto &vertex = vertex_value.Value(); vertex.SwitchNew(); try { for (auto label : self_.labels_) vertex.add_label(label); } catch (const RecordDeletedError &) { throw QueryRuntimeException("Trying to set labels on a deleted Vertex"); } return true; } void SetLabels::SetLabelsCursor::Reset() { input_cursor_->Reset(); } RemoveProperty::RemoveProperty(const std::shared_ptr &input, PropertyLookup *lhs) : input_(input), lhs_(lhs) {} ACCEPT_WITH_INPUT(RemoveProperty) std::unique_ptr RemoveProperty::MakeCursor( database::GraphDbAccessor &db) const { return std::make_unique(*this, db); } std::vector RemoveProperty::ModifiedSymbols( const SymbolTable &table) const { return input_->ModifiedSymbols(table); } RemoveProperty::RemovePropertyCursor::RemovePropertyCursor( const RemoveProperty &self, database::GraphDbAccessor &db) : self_(self), db_(db), input_cursor_(self.input_->MakeCursor(db)) {} bool RemoveProperty::RemovePropertyCursor::Pull(Frame &frame, Context &context) { if (!input_cursor_->Pull(frame, context)) return false; // Remove, just like Delete needs to see the latest changes. ExpressionEvaluator evaluator(frame, context.parameters_, context.symbol_table_, db_, GraphView::NEW); TypedValue lhs = self_.lhs_->expression_->Accept(evaluator); switch (lhs.type()) { case TypedValue::Type::Vertex: try { lhs.Value().PropsErase(self_.lhs_->property_); } catch (const RecordDeletedError &) { throw QueryRuntimeException( "Trying to remove properties from a deleted Vertex"); } break; case TypedValue::Type::Edge: try { lhs.Value().PropsErase(self_.lhs_->property_); } catch (const RecordDeletedError &) { throw QueryRuntimeException( "Trying to remove properties from a deleted Edge"); } break; case TypedValue::Type::Null: // Skip removing properties on Null (can occur in optional match). break; default: throw QueryRuntimeException( "Properties can only be removed on Vertices and Edges"); } return true; } void RemoveProperty::RemovePropertyCursor::Reset() { input_cursor_->Reset(); } RemoveLabels::RemoveLabels(const std::shared_ptr &input, Symbol input_symbol, const std::vector &labels) : input_(input), input_symbol_(input_symbol), labels_(labels) {} ACCEPT_WITH_INPUT(RemoveLabels) std::unique_ptr RemoveLabels::MakeCursor( database::GraphDbAccessor &db) const { return std::make_unique(*this, db); } std::vector RemoveLabels::ModifiedSymbols( const SymbolTable &table) const { return input_->ModifiedSymbols(table); } RemoveLabels::RemoveLabelsCursor::RemoveLabelsCursor( const RemoveLabels &self, database::GraphDbAccessor &db) : self_(self), input_cursor_(self.input_->MakeCursor(db)) {} bool RemoveLabels::RemoveLabelsCursor::Pull(Frame &frame, Context &context) { if (!input_cursor_->Pull(frame, context)) return false; TypedValue &vertex_value = frame[self_.input_symbol_]; // Skip removing labels on Null (can occur in optional match). if (vertex_value.IsNull()) return true; ExpectType(self_.input_symbol_, vertex_value, TypedValue::Type::Vertex); auto &vertex = vertex_value.Value(); vertex.SwitchNew(); try { for (auto label : self_.labels_) vertex.remove_label(label); } catch (const RecordDeletedError &) { throw QueryRuntimeException( "Trying to remove labels from a deleted Vertex"); } return true; } void RemoveLabels::RemoveLabelsCursor::Reset() { input_cursor_->Reset(); } template ExpandUniquenessFilter::ExpandUniquenessFilter( const std::shared_ptr &input, Symbol expand_symbol, const std::vector &previous_symbols) : input_(input), expand_symbol_(expand_symbol), previous_symbols_(previous_symbols) {} template ACCEPT_WITH_INPUT(ExpandUniquenessFilter) template std::unique_ptr ExpandUniquenessFilter::MakeCursor( database::GraphDbAccessor &db) const { return std::make_unique(*this, db); } template std::vector ExpandUniquenessFilter::ModifiedSymbols( const SymbolTable &table) const { return input_->ModifiedSymbols(table); } template ExpandUniquenessFilter::ExpandUniquenessFilterCursor:: ExpandUniquenessFilterCursor(const ExpandUniquenessFilter &self, database::GraphDbAccessor &db) : self_(self), input_cursor_(self.input_->MakeCursor(db)) {} namespace { /** * Returns true if: * - a and b are vertex values and are the same * - a and b are either edge or edge-list values, and there * is at least one matching edge in the two values */ template bool ContainsSame(const TypedValue &a, const TypedValue &b); template <> bool ContainsSame(const TypedValue &a, const TypedValue &b) { return a.Value() == b.Value(); } template <> bool ContainsSame(const TypedValue &a, const TypedValue &b) { auto compare_to_list = [](const TypedValue &list, const TypedValue &other) { for (const TypedValue &list_elem : list.Value>()) if (ContainsSame(list_elem, other)) return true; return false; }; if (a.type() == TypedValue::Type::List) return compare_to_list(a, b); if (b.type() == TypedValue::Type::List) return compare_to_list(b, a); return a.Value() == b.Value(); } } // namespace template bool ExpandUniquenessFilter::ExpandUniquenessFilterCursor::Pull( Frame &frame, Context &context) { auto expansion_ok = [&]() { TypedValue &expand_value = frame[self_.expand_symbol_]; for (const auto &previous_symbol : self_.previous_symbols_) { TypedValue &previous_value = frame[previous_symbol]; // This shouldn't raise a TypedValueException, because the planner // makes sure these are all of the expected type. In case they are not, // an error should be raised long before this code is executed. if (ContainsSame(previous_value, expand_value)) return false; } return true; }; while (input_cursor_->Pull(frame, context)) if (expansion_ok()) return true; return false; } template void ExpandUniquenessFilter::ExpandUniquenessFilterCursor::Reset() { input_cursor_->Reset(); } // instantiations of the ExpandUniquenessFilter template class // we only ever need these two template class ExpandUniquenessFilter; template class ExpandUniquenessFilter; Accumulate::Accumulate(const std::shared_ptr &input, const std::vector &symbols, bool advance_command) : input_(input), symbols_(symbols), advance_command_(advance_command) {} ACCEPT_WITH_INPUT(Accumulate) std::unique_ptr Accumulate::MakeCursor( database::GraphDbAccessor &db) const { return std::make_unique(*this, db); } std::vector Accumulate::ModifiedSymbols(const SymbolTable &) const { return symbols_; } Accumulate::AccumulateCursor::AccumulateCursor(const Accumulate &self, database::GraphDbAccessor &db) : self_(self), db_(db), input_cursor_(self.input_->MakeCursor(db)) {} bool Accumulate::AccumulateCursor::Pull(Frame &frame, Context &context) { // cache all the input if (!pulled_all_input_) { while (input_cursor_->Pull(frame, context)) { std::vector row; row.reserve(self_.symbols_.size()); for (const Symbol &symbol : self_.symbols_) row.emplace_back(frame[symbol]); cache_.emplace_back(std::move(row)); } pulled_all_input_ = true; cache_it_ = cache_.begin(); if (self_.advance_command_) { db_.AdvanceCommand(); for (auto &row : cache_) for (auto &col : row) query::ReconstructTypedValue(col); } } if (cache_it_ == cache_.end()) return false; auto row_it = (cache_it_++)->begin(); for (const Symbol &symbol : self_.symbols_) frame[symbol] = *row_it++; return true; } void Accumulate::AccumulateCursor::Reset() { input_cursor_->Reset(); cache_.clear(); cache_it_ = cache_.begin(); pulled_all_input_ = false; } Aggregate::Aggregate(const std::shared_ptr &input, const std::vector &aggregations, const std::vector &group_by, const std::vector &remember) : input_(input ? input : std::make_shared()), aggregations_(aggregations), group_by_(group_by), remember_(remember) {} ACCEPT_WITH_INPUT(Aggregate) std::unique_ptr Aggregate::MakeCursor( database::GraphDbAccessor &db) const { return std::make_unique(*this, db); } std::vector Aggregate::ModifiedSymbols(const SymbolTable &) const { auto symbols = remember_; for (const auto &elem : aggregations_) symbols.push_back(elem.output_sym); return symbols; } Aggregate::AggregateCursor::AggregateCursor(const Aggregate &self, database::GraphDbAccessor &db) : self_(self), db_(db), input_cursor_(self_.input_->MakeCursor(db)) {} namespace { /** Returns the default TypedValue for an Aggregation element. * This value is valid both for returning when where are no inputs * to the aggregation op, and for initializing an aggregation result * when there are */ TypedValue DefaultAggregationOpValue(const Aggregate::Element &element) { switch (element.op) { case Aggregation::Op::COUNT: return TypedValue(0); case Aggregation::Op::SUM: case Aggregation::Op::MIN: case Aggregation::Op::MAX: case Aggregation::Op::AVG: return TypedValue::Null; case Aggregation::Op::COLLECT_LIST: return TypedValue(std::vector()); case Aggregation::Op::COLLECT_MAP: return TypedValue(std::map()); } } } // namespace bool Aggregate::AggregateCursor::Pull(Frame &frame, Context &context) { if (!pulled_all_input_) { ProcessAll(frame, context); pulled_all_input_ = true; aggregation_it_ = aggregation_.begin(); // in case there is no input and no group_bys we need to return true // just this once if (aggregation_.empty() && self_.group_by_.empty()) { // place default aggregation values on the frame for (const auto &elem : self_.aggregations_) frame[elem.output_sym] = DefaultAggregationOpValue(elem); // place null as remember values on the frame for (const Symbol &remember_sym : self_.remember_) frame[remember_sym] = TypedValue::Null; return true; } } if (aggregation_it_ == aggregation_.end()) return false; // place aggregation values on the frame auto aggregation_values_it = aggregation_it_->second.values_.begin(); for (const auto &aggregation_elem : self_.aggregations_) frame[aggregation_elem.output_sym] = *aggregation_values_it++; // place remember values on the frame auto remember_values_it = aggregation_it_->second.remember_.begin(); for (const Symbol &remember_sym : self_.remember_) frame[remember_sym] = *remember_values_it++; aggregation_it_++; return true; } void Aggregate::AggregateCursor::ProcessAll(Frame &frame, Context &context) { ExpressionEvaluator evaluator(frame, context.parameters_, context.symbol_table_, db_, GraphView::NEW); while (input_cursor_->Pull(frame, context)) ProcessOne(frame, context.symbol_table_, evaluator); // calculate AVG aggregations (so far they have only been summed) for (int pos = 0; pos < static_cast(self_.aggregations_.size()); ++pos) { if (self_.aggregations_[pos].op != Aggregation::Op::AVG) continue; for (auto &kv : aggregation_) { AggregationValue &agg_value = kv.second; int count = agg_value.counts_[pos]; if (count > 0) agg_value.values_[pos] = agg_value.values_[pos] / (double)count; } } } void Aggregate::AggregateCursor::ProcessOne(Frame &frame, const SymbolTable &symbol_table, ExpressionEvaluator &evaluator) { std::vector group_by; group_by.reserve(self_.group_by_.size()); for (Expression *expression : self_.group_by_) { group_by.emplace_back(expression->Accept(evaluator)); } AggregationValue &agg_value = aggregation_[group_by]; EnsureInitialized(frame, agg_value); Update(frame, symbol_table, evaluator, agg_value); } void Aggregate::AggregateCursor::EnsureInitialized( Frame &frame, Aggregate::AggregateCursor::AggregationValue &agg_value) const { if (agg_value.values_.size() > 0) return; for (const auto &agg_elem : self_.aggregations_) agg_value.values_.emplace_back(DefaultAggregationOpValue(agg_elem)); agg_value.counts_.resize(self_.aggregations_.size(), 0); for (const Symbol &remember_sym : self_.remember_) agg_value.remember_.push_back(frame[remember_sym]); } void Aggregate::AggregateCursor::Update( Frame &, const SymbolTable &, ExpressionEvaluator &evaluator, Aggregate::AggregateCursor::AggregationValue &agg_value) { DCHECK(self_.aggregations_.size() == agg_value.values_.size()) << "Expected as much AggregationValue.values_ as there are " "aggregations."; DCHECK(self_.aggregations_.size() == agg_value.counts_.size()) << "Expected as much AggregationValue.counts_ as there are " "aggregations."; // we iterate over counts, values and aggregation info at the same time auto count_it = agg_value.counts_.begin(); auto value_it = agg_value.values_.begin(); auto agg_elem_it = self_.aggregations_.begin(); for (; count_it < agg_value.counts_.end(); count_it++, value_it++, agg_elem_it++) { // COUNT(*) is the only case where input expression is optional // handle it here auto input_expr_ptr = agg_elem_it->value; if (!input_expr_ptr) { *count_it += 1; *value_it = *count_it; continue; } TypedValue input_value = input_expr_ptr->Accept(evaluator); // Aggregations skip Null input values. if (input_value.IsNull()) continue; const auto &agg_op = agg_elem_it->op; *count_it += 1; if (*count_it == 1) { // first value, nothing to aggregate. check type, set and continue. switch (agg_op) { case Aggregation::Op::MIN: case Aggregation::Op::MAX: *value_it = input_value; EnsureOkForMinMax(input_value); break; case Aggregation::Op::SUM: case Aggregation::Op::AVG: *value_it = input_value; EnsureOkForAvgSum(input_value); break; case Aggregation::Op::COUNT: *value_it = 1; break; case Aggregation::Op::COLLECT_LIST: value_it->Value>().push_back(input_value); break; case Aggregation::Op::COLLECT_MAP: auto key = agg_elem_it->key->Accept(evaluator); if (key.type() != TypedValue::Type::String) throw QueryRuntimeException("Map key must be a string"); value_it->Value>().emplace( key.Value(), input_value); break; } continue; } // aggregation of existing values switch (agg_op) { case Aggregation::Op::COUNT: *value_it = *count_it; break; case Aggregation::Op::MIN: { EnsureOkForMinMax(input_value); try { TypedValue comparison_result = input_value < *value_it; // since we skip nulls we either have a valid comparison, or // an exception was just thrown above // safe to assume a bool TypedValue if (comparison_result.Value()) *value_it = input_value; } catch (const TypedValueException &) { throw QueryRuntimeException("Unable to get MIN of '{}' and '{}'", input_value.type(), value_it->type()); } break; } case Aggregation::Op::MAX: { // all comments as for Op::Min EnsureOkForMinMax(input_value); try { TypedValue comparison_result = input_value > *value_it; if (comparison_result.Value()) *value_it = input_value; } catch (const TypedValueException &) { throw QueryRuntimeException("Unable to get MAX of '{}' and '{}'", input_value.type(), value_it->type()); } break; } case Aggregation::Op::AVG: // for averaging we sum first and divide by count once all // the input has been processed case Aggregation::Op::SUM: EnsureOkForAvgSum(input_value); *value_it = *value_it + input_value; break; case Aggregation::Op::COLLECT_LIST: value_it->Value>().push_back(input_value); break; case Aggregation::Op::COLLECT_MAP: auto key = agg_elem_it->key->Accept(evaluator); if (key.type() != TypedValue::Type::String) throw QueryRuntimeException("Map key must be a string"); value_it->Value>().emplace( key.Value(), input_value); break; } // end switch over Aggregation::Op enum } // end loop over all aggregations } void Aggregate::AggregateCursor::Reset() { input_cursor_->Reset(); aggregation_.clear(); aggregation_it_ = aggregation_.begin(); pulled_all_input_ = false; } void Aggregate::AggregateCursor::EnsureOkForMinMax( const TypedValue &value) const { switch (value.type()) { case TypedValue::Type::Bool: case TypedValue::Type::Int: case TypedValue::Type::Double: case TypedValue::Type::String: return; default: throw QueryRuntimeException( "Only Bool, Int, Double and String values are allowed in " "MIN and MAX aggregations"); } } void Aggregate::AggregateCursor::EnsureOkForAvgSum( const TypedValue &value) const { switch (value.type()) { case TypedValue::Type::Int: case TypedValue::Type::Double: return; default: throw QueryRuntimeException( "Only numeric values allowed in SUM and AVG aggregations"); } } bool TypedValueVectorEqual::operator()( const std::vector &left, const std::vector &right) const { DCHECK(left.size() == right.size()) << "TypedValueVector comparison should only be done over vectors " "of the same size"; return std::equal(left.begin(), left.end(), right.begin(), TypedValue::BoolEqual{}); } Skip::Skip(const std::shared_ptr &input, Expression *expression) : input_(input), expression_(expression) {} ACCEPT_WITH_INPUT(Skip) std::unique_ptr Skip::MakeCursor(database::GraphDbAccessor &db) const { return std::make_unique(*this, db); } std::vector Skip::OutputSymbols(const SymbolTable &symbol_table) const { // Propagate this to potential Produce. return input_->OutputSymbols(symbol_table); } std::vector Skip::ModifiedSymbols(const SymbolTable &table) const { return input_->ModifiedSymbols(table); } Skip::SkipCursor::SkipCursor(const Skip &self, database::GraphDbAccessor &db) : self_(self), db_(db), input_cursor_(self_.input_->MakeCursor(db)) {} bool Skip::SkipCursor::Pull(Frame &frame, Context &context) { while (input_cursor_->Pull(frame, context)) { if (to_skip_ == -1) { // first successful pull from the input // evaluate the skip expression ExpressionEvaluator evaluator(frame, context.parameters_, context.symbol_table_, db_); TypedValue to_skip = self_.expression_->Accept(evaluator); if (to_skip.type() != TypedValue::Type::Int) throw QueryRuntimeException("Result of SKIP expression must be an int"); to_skip_ = to_skip.Value(); if (to_skip_ < 0) throw QueryRuntimeException( "Result of SKIP expression must be greater or equal to zero"); } if (skipped_++ < to_skip_) continue; return true; } return false; } void Skip::SkipCursor::Reset() { input_cursor_->Reset(); to_skip_ = -1; skipped_ = 0; } Limit::Limit(const std::shared_ptr &input, Expression *expression) : input_(input), expression_(expression) {} ACCEPT_WITH_INPUT(Limit) std::unique_ptr Limit::MakeCursor(database::GraphDbAccessor &db) const { return std::make_unique(*this, db); } std::vector Limit::OutputSymbols( const SymbolTable &symbol_table) const { // Propagate this to potential Produce. return input_->OutputSymbols(symbol_table); } std::vector Limit::ModifiedSymbols(const SymbolTable &table) const { return input_->ModifiedSymbols(table); } Limit::LimitCursor::LimitCursor(const Limit &self, database::GraphDbAccessor &db) : self_(self), db_(db), input_cursor_(self_.input_->MakeCursor(db)) {} bool Limit::LimitCursor::Pull(Frame &frame, Context &context) { // we need to evaluate the limit expression before the first input Pull // because it might be 0 and thereby we shouldn't Pull from input at all // we can do this before Pulling from the input because the limit // expression is not allowed to contain any identifiers if (limit_ == -1) { ExpressionEvaluator evaluator(frame, context.parameters_, context.symbol_table_, db_); TypedValue limit = self_.expression_->Accept(evaluator); if (limit.type() != TypedValue::Type::Int) throw QueryRuntimeException("Result of LIMIT expression must be an int"); limit_ = limit.Value(); if (limit_ < 0) throw QueryRuntimeException( "Result of LIMIT expression must be greater or equal to zero"); } // check we have not exceeded the limit before pulling if (pulled_++ >= limit_) return false; return input_cursor_->Pull(frame, context); } void Limit::LimitCursor::Reset() { input_cursor_->Reset(); limit_ = -1; pulled_ = 0; } OrderBy::OrderBy(const std::shared_ptr &input, const std::vector> &order_by, const std::vector &output_symbols) : input_(input), output_symbols_(output_symbols) { // split the order_by vector into two vectors of orderings and expressions std::vector ordering; ordering.reserve(order_by.size()); order_by_.reserve(order_by.size()); for (const auto &ordering_expression_pair : order_by) { ordering.emplace_back(ordering_expression_pair.first); order_by_.emplace_back(ordering_expression_pair.second); } compare_ = TypedValueVectorCompare(ordering); } ACCEPT_WITH_INPUT(OrderBy) std::unique_ptr OrderBy::MakeCursor( database::GraphDbAccessor &db) const { return std::make_unique(*this, db); } std::vector OrderBy::OutputSymbols( const SymbolTable &symbol_table) const { // Propagate this to potential Produce. return input_->OutputSymbols(symbol_table); } std::vector OrderBy::ModifiedSymbols(const SymbolTable &table) const { return input_->ModifiedSymbols(table); } OrderBy::OrderByCursor::OrderByCursor(const OrderBy &self, database::GraphDbAccessor &db) : self_(self), db_(db), input_cursor_(self_.input_->MakeCursor(db)) {} bool OrderBy::OrderByCursor::Pull(Frame &frame, Context &context) { if (!did_pull_all_) { ExpressionEvaluator evaluator(frame, context.parameters_, context.symbol_table_, db_); while (input_cursor_->Pull(frame, context)) { // collect the order_by elements std::vector order_by; order_by.reserve(self_.order_by_.size()); for (auto expression_ptr : self_.order_by_) { order_by.emplace_back(expression_ptr->Accept(evaluator)); } // collect the output elements std::vector output; output.reserve(self_.output_symbols_.size()); for (const Symbol &output_sym : self_.output_symbols_) output.emplace_back(frame[output_sym]); cache_.emplace_back(std::move(order_by), std::move(output)); } std::sort(cache_.begin(), cache_.end(), [this](const auto &pair1, const auto &pair2) { return self_.compare_(pair1.first, pair2.first); }); did_pull_all_ = true; cache_it_ = cache_.begin(); } if (cache_it_ == cache_.end()) return false; // place the output values on the frame DCHECK(self_.output_symbols_.size() == cache_it_->second.size()) << "Number of values does not match the number of output symbols " "in OrderBy"; auto output_sym_it = self_.output_symbols_.begin(); for (const TypedValue &output : cache_it_->second) frame[*output_sym_it++] = output; cache_it_++; return true; } void OrderBy::OrderByCursor::Reset() { input_cursor_->Reset(); did_pull_all_ = false; cache_.clear(); cache_it_ = cache_.begin(); } bool OrderBy::TypedValueCompare(const TypedValue &a, const TypedValue &b) { // in ordering null comes after everything else // at the same time Null is not less that null // first deal with Null < Whatever case if (a.IsNull()) return false; // now deal with NotNull < Null case if (b.IsNull()) return true; // comparisons are from this point legal only between values of // the same type, or int+float combinations if ((a.type() != b.type() && !(a.IsNumeric() && b.IsNumeric()))) throw QueryRuntimeException( "Can't compare value of type {} to value of type {}", a.type(), b.type()); switch (a.type()) { case TypedValue::Type::Bool: return !a.Value() && b.Value(); case TypedValue::Type::Int: if (b.type() == TypedValue::Type::Double) return a.Value() < b.Value(); else return a.Value() < b.Value(); case TypedValue::Type::Double: if (b.type() == TypedValue::Type::Int) return a.Value() < b.Value(); else return a.Value() < b.Value(); case TypedValue::Type::String: return a.Value() < b.Value(); case TypedValue::Type::List: case TypedValue::Type::Map: case TypedValue::Type::Vertex: case TypedValue::Type::Edge: case TypedValue::Type::Path: throw QueryRuntimeException( "Comparison is not defined for values of type {}", a.type()); default: LOG(FATAL) << "Unhandled comparison for types"; } } bool OrderBy::TypedValueVectorCompare::operator()( const std::vector &c1, const std::vector &c2) const { // ordering is invalid if there are more elements in the collections // then there are in the ordering_ vector DCHECK(c1.size() <= ordering_.size() && c2.size() <= ordering_.size()) << "Collections contain more elements then there are orderings"; auto c1_it = c1.begin(); auto c2_it = c2.begin(); auto ordering_it = ordering_.begin(); for (; c1_it != c1.end() && c2_it != c2.end(); c1_it++, c2_it++, ordering_it++) { if (OrderBy::TypedValueCompare(*c1_it, *c2_it)) return *ordering_it == Ordering::ASC; if (OrderBy::TypedValueCompare(*c2_it, *c1_it)) return *ordering_it == Ordering::DESC; } // at least one collection is exhausted // c1 is less then c2 iff c1 reached the end but c2 didn't return (c1_it == c1.end()) && (c2_it != c2.end()); } Merge::Merge(const std::shared_ptr &input, const std::shared_ptr &merge_match, const std::shared_ptr &merge_create) : input_(input ? input : std::make_shared()), merge_match_(merge_match), merge_create_(merge_create) {} bool Merge::Accept(HierarchicalLogicalOperatorVisitor &visitor) { if (visitor.PreVisit(*this)) { input_->Accept(visitor) && merge_match_->Accept(visitor) && merge_create_->Accept(visitor); } return visitor.PostVisit(*this); } std::unique_ptr Merge::MakeCursor(database::GraphDbAccessor &db) const { return std::make_unique(*this, db); } std::vector Merge::ModifiedSymbols(const SymbolTable &table) const { auto symbols = input_->ModifiedSymbols(table); // Match and create branches should have the same symbols, so just take one of // them. auto my_symbols = merge_match_->OutputSymbols(table); symbols.insert(symbols.end(), my_symbols.begin(), my_symbols.end()); return symbols; } Merge::MergeCursor::MergeCursor(const Merge &self, database::GraphDbAccessor &db) : input_cursor_(self.input_->MakeCursor(db)), merge_match_cursor_(self.merge_match_->MakeCursor(db)), merge_create_cursor_(self.merge_create_->MakeCursor(db)) {} bool Merge::MergeCursor::Pull(Frame &frame, Context &context) { if (pull_input_) { if (input_cursor_->Pull(frame, context)) { // after a successful input from the input // reset merge_match (it's expand iterators maintain state) // and merge_create (could have a Once at the beginning) merge_match_cursor_->Reset(); merge_create_cursor_->Reset(); } else // input is exhausted, we're done return false; } // pull from the merge_match cursor if (merge_match_cursor_->Pull(frame, context)) { // if successful, next Pull from this should not pull_input_ pull_input_ = false; return true; } else { // failed to Pull from the merge_match cursor if (pull_input_) { // if we have just now pulled from the input // and failed to pull from merge_match, we should create __attribute__((unused)) bool merge_create_pull_result = merge_create_cursor_->Pull(frame, context); DCHECK(merge_create_pull_result) << "MergeCreate must never fail"; return true; } // we have exhausted merge_match_cursor_ after 1 or more successful // Pulls // attempt next input_cursor_ pull pull_input_ = true; return Pull(frame, context); } } void Merge::MergeCursor::Reset() { input_cursor_->Reset(); merge_match_cursor_->Reset(); merge_create_cursor_->Reset(); pull_input_ = true; } Optional::Optional(const std::shared_ptr &input, const std::shared_ptr &optional, const std::vector &optional_symbols) : input_(input ? input : std::make_shared()), optional_(optional), optional_symbols_(optional_symbols) {} bool Optional::Accept(HierarchicalLogicalOperatorVisitor &visitor) { if (visitor.PreVisit(*this)) { input_->Accept(visitor) && optional_->Accept(visitor); } return visitor.PostVisit(*this); } std::unique_ptr Optional::MakeCursor( database::GraphDbAccessor &db) const { return std::make_unique(*this, db); } std::vector Optional::ModifiedSymbols(const SymbolTable &table) const { auto symbols = input_->ModifiedSymbols(table); auto my_symbols = optional_->ModifiedSymbols(table); symbols.insert(symbols.end(), my_symbols.begin(), my_symbols.end()); return symbols; } Optional::OptionalCursor::OptionalCursor(const Optional &self, database::GraphDbAccessor &db) : self_(self), input_cursor_(self.input_->MakeCursor(db)), optional_cursor_(self.optional_->MakeCursor(db)) {} bool Optional::OptionalCursor::Pull(Frame &frame, Context &context) { if (pull_input_) { if (input_cursor_->Pull(frame, context)) { // after a successful input from the input // reset optional_ (it's expand iterators maintain state) optional_cursor_->Reset(); } else // input is exhausted, we're done return false; } // pull from the optional_ cursor if (optional_cursor_->Pull(frame, context)) { // if successful, next Pull from this should not pull_input_ pull_input_ = false; return true; } else { // failed to Pull from the merge_match cursor if (pull_input_) { // if we have just now pulled from the input // and failed to pull from optional_ so set the // optional symbols to Null, ensure next time the // input gets pulled and return true for (const Symbol &sym : self_.optional_symbols_) frame[sym] = TypedValue::Null; pull_input_ = true; return true; } // we have exhausted optional_cursor_ after 1 or more successful Pulls // attempt next input_cursor_ pull pull_input_ = true; return Pull(frame, context); } } void Optional::OptionalCursor::Reset() { input_cursor_->Reset(); optional_cursor_->Reset(); pull_input_ = true; } Unwind::Unwind(const std::shared_ptr &input, Expression *input_expression, Symbol output_symbol) : input_(input ? input : std::make_shared()), input_expression_(input_expression), output_symbol_(output_symbol) {} ACCEPT_WITH_INPUT(Unwind) std::unique_ptr Unwind::MakeCursor( database::GraphDbAccessor &db) const { return std::make_unique(*this, db); } std::vector Unwind::ModifiedSymbols(const SymbolTable &table) const { auto symbols = input_->ModifiedSymbols(table); symbols.emplace_back(output_symbol_); return symbols; } Unwind::UnwindCursor::UnwindCursor(const Unwind &self, database::GraphDbAccessor &db) : self_(self), db_(db), input_cursor_(self.input_->MakeCursor(db)) {} bool Unwind::UnwindCursor::Pull(Frame &frame, Context &context) { if (db_.should_abort()) throw HintedAbortError(); // if we reached the end of our list of values // pull from the input if (input_value_it_ == input_value_.end()) { if (!input_cursor_->Pull(frame, context)) return false; // successful pull from input, initialize value and iterator ExpressionEvaluator evaluator(frame, context.parameters_, context.symbol_table_, db_); TypedValue input_value = self_.input_expression_->Accept(evaluator); if (input_value.type() != TypedValue::Type::List) throw QueryRuntimeException("UNWIND only accepts list values, got '{}'", input_value.type()); input_value_ = input_value.Value>(); input_value_it_ = input_value_.begin(); } // if we reached the end of our list of values goto back to top if (input_value_it_ == input_value_.end()) return Pull(frame, context); frame[self_.output_symbol_] = *input_value_it_++; return true; } void Unwind::UnwindCursor::Reset() { input_cursor_->Reset(); input_value_.clear(); input_value_it_ = input_value_.end(); } Distinct::Distinct(const std::shared_ptr &input, const std::vector &value_symbols) : input_(input ? input : std::make_shared()), value_symbols_(value_symbols) {} ACCEPT_WITH_INPUT(Distinct) std::unique_ptr Distinct::MakeCursor( database::GraphDbAccessor &db) const { return std::make_unique(*this, db); } std::vector Distinct::OutputSymbols( const SymbolTable &symbol_table) const { // Propagate this to potential Produce. return input_->OutputSymbols(symbol_table); } std::vector Distinct::ModifiedSymbols(const SymbolTable &table) const { return input_->ModifiedSymbols(table); } Distinct::DistinctCursor::DistinctCursor(const Distinct &self, database::GraphDbAccessor &db) : self_(self), input_cursor_(self.input_->MakeCursor(db)) {} bool Distinct::DistinctCursor::Pull(Frame &frame, Context &context) { while (true) { if (!input_cursor_->Pull(frame, context)) return false; std::vector row; row.reserve(self_.value_symbols_.size()); for (const auto &symbol : self_.value_symbols_) row.emplace_back(frame[symbol]); if (seen_rows_.insert(std::move(row)).second) return true; } } void Distinct::DistinctCursor::Reset() { input_cursor_->Reset(); seen_rows_.clear(); } CreateIndex::CreateIndex(storage::Label label, storage::Property property) : label_(label), property_(property) {} bool CreateIndex::Accept(HierarchicalLogicalOperatorVisitor &visitor) { return visitor.Visit(*this); } class CreateIndexCursor : public Cursor { public: CreateIndexCursor(const CreateIndex &self, database::GraphDbAccessor &db) : self_(self), db_(db) {} bool Pull(Frame &, Context &ctx) override { if (did_create_) return false; if (ctx.in_explicit_transaction_) { throw IndexInMulticommandTxException(); } try { db_.BuildIndex(self_.label(), self_.property()); } catch (const database::IndexExistsException &) { // Ignore creating an existing index. } ctx.is_index_created_ = did_create_ = true; return true; } void Reset() override { did_create_ = false; } private: const CreateIndex &self_; database::GraphDbAccessor &db_; bool did_create_ = false; }; std::unique_ptr CreateIndex::MakeCursor( database::GraphDbAccessor &db) const { return std::make_unique(*this, db); } Union::Union(const std::shared_ptr &left_op, const std::shared_ptr &right_op, const std::vector &union_symbols, const std::vector &left_symbols, const std::vector &right_symbols) : left_op_(left_op), right_op_(right_op), union_symbols_(union_symbols), left_symbols_(left_symbols), right_symbols_(right_symbols) {} std::unique_ptr Union::MakeCursor(database::GraphDbAccessor &db) const { return std::make_unique(*this, db); } bool Union::Accept(HierarchicalLogicalOperatorVisitor &visitor) { if (visitor.PreVisit(*this)) { if (left_op_->Accept(visitor)) { right_op_->Accept(visitor); } } return visitor.PostVisit(*this); } std::vector Union::OutputSymbols(const SymbolTable &) const { return union_symbols_; } std::vector Union::ModifiedSymbols(const SymbolTable &) const { return union_symbols_; } Union::UnionCursor::UnionCursor(const Union &self, database::GraphDbAccessor &db) : self_(self), left_cursor_(self.left_op_->MakeCursor(db)), right_cursor_(self.right_op_->MakeCursor(db)) {} bool Union::UnionCursor::Pull(Frame &frame, Context &context) { std::unordered_map results; if (left_cursor_->Pull(frame, context)) { // collect values from the left child for (const auto &output_symbol : self_.left_symbols_) { results[output_symbol.name()] = frame[output_symbol]; } } else if (right_cursor_->Pull(frame, context)) { // collect values from the right child for (const auto &output_symbol : self_.right_symbols_) { results[output_symbol.name()] = frame[output_symbol]; } } else { return false; } // put collected values on frame under union symbols for (const auto &symbol : self_.union_symbols_) { frame[symbol] = results[symbol.name()]; } return true; } void Union::UnionCursor::Reset() { left_cursor_->Reset(); right_cursor_->Reset(); } PullRemote::PullRemote(const std::shared_ptr &input, int64_t plan_id, const std::vector &symbols) : input_(input), plan_id_(plan_id), symbols_(symbols) {} ACCEPT_WITH_INPUT(PullRemote); std::vector PullRemote::OutputSymbols(const SymbolTable &table) const { return input_ ? input_->OutputSymbols(table) : std::vector{}; } std::vector PullRemote::ModifiedSymbols( const SymbolTable &table) const { auto symbols = symbols_; if (input_) { auto input_symbols = input_->ModifiedSymbols(table); symbols.insert(symbols.end(), input_symbols.begin(), input_symbols.end()); } return symbols; } PullRemote::PullRemoteCursor::PullRemoteCursor(const PullRemote &self, database::GraphDbAccessor &db) : self_(self), db_(db), input_cursor_(self.input_ ? self.input_->MakeCursor(db) : nullptr) { worker_ids_ = db_.db().remote_pull_clients().GetWorkerIds(); // Remove master from the worker ids list. worker_ids_.erase(std::find(worker_ids_.begin(), worker_ids_.end(), 0)); } bool PullRemote::PullRemoteCursor::Pull(Frame &frame, Context &context) { auto insert_future_for_worker = [&](int worker_id) { remote_pulls_[worker_id] = db_.db().remote_pull_clients().RemotePull( db_, worker_id, self_.plan_id(), context.parameters_, self_.symbols(), false); }; if (!remote_pulls_initialized_) { for (auto &worker_id : worker_ids_) { insert_future_for_worker(worker_id); } remote_pulls_initialized_ = true; } bool have_remote_results = false; while (!have_remote_results && !worker_ids_.empty()) { // If we don't have results for a worker, check if his remote pull // finished and save results locally. for (auto &worker_id : worker_ids_) { if (!remote_results_[worker_id].empty()) continue; auto found_it = remote_pulls_.find(worker_id); if (found_it == remote_pulls_.end()) continue; auto &remote_pull = found_it->second; if (!remote_pull.valid()) continue; auto remote_results = remote_pull.get(); switch (remote_results.pull_state) { case distributed::RemotePullState::CURSOR_EXHAUSTED: remote_results_[worker_id] = std::move(remote_results.frames); remote_pulls_.erase(found_it); break; case distributed::RemotePullState::CURSOR_IN_PROGRESS: remote_results_[worker_id] = std::move(remote_results.frames); insert_future_for_worker(worker_id); break; case distributed::RemotePullState::SERIALIZATION_ERROR: throw mvcc::SerializationError( "Serialization error occured during PullRemote !"); case distributed::RemotePullState::LOCK_TIMEOUT_ERROR: throw LockTimeoutException( "LockTimeout error occured during PullRemote !"); case distributed::RemotePullState::UPDATE_DELETED_ERROR: throw QueryRuntimeException( "RecordDeleted error ocured during PullRemote !"); case distributed::RemotePullState::RECONSTRUCTION_ERROR: throw query::ReconstructionException(); case distributed::RemotePullState::QUERY_ERROR: throw QueryRuntimeException( "Query runtime error occurred duing PullRemote !"); } } // Get locally stored results from workers in a round-robin fasion. int num_workers = worker_ids_.size(); for (int i = 0; i < num_workers; ++i) { int worker_id_index = (last_pulled_worker_id_index_ + i + 1) % num_workers; int worker_id = worker_ids_[worker_id_index]; if (!remote_results_[worker_id].empty()) { last_pulled_worker_id_index_ = worker_id_index; have_remote_results = true; break; } } if (!have_remote_results) { if (remote_pulls_.empty()) { worker_ids_.clear(); break; } // If there are no remote results available, try to pull and return local // results. if (input_cursor_ && input_cursor_->Pull(frame, context)) { return true; } // If there aren't any local/remote results available, sleep. std::this_thread::sleep_for( std::chrono::milliseconds(FLAGS_remote_pull_sleep)); } } // No more remote results, make sure local results get exhausted. if (!have_remote_results) { if (input_cursor_ && input_cursor_->Pull(frame, context)) { return true; } return false; } int pull_from_worker_id = worker_ids_[last_pulled_worker_id_index_]; { auto &result = remote_results_[pull_from_worker_id].back(); for (size_t i = 0; i < self_.symbols().size(); ++i) { frame[self_.symbols()[i]] = std::move(result[i]); } } remote_results_[pull_from_worker_id].resize( remote_results_[pull_from_worker_id].size() - 1); // Remove the worker if we exhausted all locally stored results and there // are no more pending remote pulls for that worker. if (remote_results_[pull_from_worker_id].empty() && remote_pulls_.find(pull_from_worker_id) == remote_pulls_.end()) { worker_ids_.erase(worker_ids_.begin() + last_pulled_worker_id_index_); } return true; } void PullRemote::PullRemoteCursor::Reset() { throw QueryRuntimeException("Unsupported: Reset during PullRemote!"); } std::unique_ptr PullRemote::MakeCursor( database::GraphDbAccessor &db) const { return std::make_unique(*this, db); } bool Synchronize::Accept(HierarchicalLogicalOperatorVisitor &visitor) { if (visitor.PreVisit(*this)) { input_->Accept(visitor) && pull_remote_->Accept(visitor); } return visitor.PostVisit(*this); } std::vector Synchronize::ModifiedSymbols( const SymbolTable &table) const { auto symbols = input_->ModifiedSymbols(table); if (pull_remote_) { auto pull_symbols = pull_remote_->ModifiedSymbols(table); symbols.insert(symbols.end(), pull_symbols.begin(), pull_symbols.end()); } return symbols; } namespace { class SynchronizeCursor : public Cursor { public: SynchronizeCursor(const Synchronize &self, database::GraphDbAccessor &db) : self_(self), input_cursor_(self.input()->MakeCursor(db)), pull_remote_cursor_( self.pull_remote() ? self.pull_remote()->MakeCursor(db) : nullptr) { } bool Pull(Frame &frame, Context &context) override { if (!initial_pull_done_) { InitialPull(frame, context); initial_pull_done_ = true; } // Yield local stuff while available. if (!local_frames_.empty()) { auto &result = local_frames_.back(); for (size_t i = 0; i < frame.elems().size(); ++i) { if (self_.advance_command()) { query::ReconstructTypedValue(result[i]); } frame.elems()[i] = std::move(result[i]); } local_frames_.resize(local_frames_.size() - 1); return true; } // We're out of local stuff, yield from pull_remote if available. if (pull_remote_cursor_ && pull_remote_cursor_->Pull(frame, context)) return true; return false; } void Reset() override { throw QueryRuntimeException("Unsupported: Reset during Synchronize!"); } private: const Synchronize &self_; const std::unique_ptr input_cursor_; const std::unique_ptr pull_remote_cursor_; bool initial_pull_done_{false}; std::vector> local_frames_; void InitialPull(Frame &frame, Context &context) { auto &db = context.db_accessor_.db(); // Tell all workers to accumulate, only if there is a remote pull. std::vector> worker_accumulations; if (pull_remote_cursor_) { for (auto worker_id : db.remote_pull_clients().GetWorkerIds()) { if (worker_id == db.WorkerId()) continue; worker_accumulations.emplace_back(db.remote_pull_clients().RemotePull( context.db_accessor_, worker_id, self_.pull_remote()->plan_id(), context.parameters_, self_.pull_remote()->symbols(), true, 0)); } } // Accumulate local results while (input_cursor_->Pull(frame, context)) { local_frames_.emplace_back(); auto &local_frame = local_frames_.back(); local_frame.reserve(frame.elems().size()); for (auto &elem : frame.elems()) { local_frame.emplace_back(std::move(elem)); } } // Wait for all workers to finish accumulation (first sync point). for (auto &accu : worker_accumulations) { switch (accu.get().pull_state) { case distributed::RemotePullState::CURSOR_EXHAUSTED: continue; case distributed::RemotePullState::CURSOR_IN_PROGRESS: throw QueryRuntimeException( "Expected exhausted cursor after remote pull accumulate"); case distributed::RemotePullState::SERIALIZATION_ERROR: throw mvcc::SerializationError( "Failed to perform remote accumulate due to SerializationError"); case distributed::RemotePullState::UPDATE_DELETED_ERROR: throw QueryRuntimeException( "Failed to perform remote accumulate due to RecordDeletedError"); case distributed::RemotePullState::LOCK_TIMEOUT_ERROR: throw LockTimeoutException( "Failed to perform remote accumulate due to " "LockTimeoutException"); case distributed::RemotePullState::RECONSTRUCTION_ERROR: throw QueryRuntimeException( "Failed to perform remote accumulate due to ReconstructionError"); case distributed::RemotePullState::QUERY_ERROR: throw QueryRuntimeException( "Failed to perform remote accumulate due to Query runtime error"); } } if (self_.advance_command()) { context.db_accessor_.AdvanceCommand(); } // Make all the workers apply their deltas. auto tx_id = context.db_accessor_.transaction_id(); auto apply_futures = db.remote_updates_clients().RemoteUpdateApplyAll(db.WorkerId(), tx_id); db.remote_updates_server().Apply(tx_id); for (auto &future : apply_futures) { switch (future.get()) { case distributed::RemoteUpdateResult::SERIALIZATION_ERROR: throw mvcc::SerializationError( "Failed to apply deferred updates due to SerializationError"); case distributed::RemoteUpdateResult::UPDATE_DELETED_ERROR: throw QueryRuntimeException( "Failed to apply deferred updates due to RecordDeletedError"); case distributed::RemoteUpdateResult::LOCK_TIMEOUT_ERROR: throw LockTimeoutException( "Failed to apply deferred update due to LockTimeoutException"); case distributed::RemoteUpdateResult::DONE: break; } } // If the command advanced, let the workers know. if (self_.advance_command()) { auto futures = db.remote_pull_clients().NotifyAllTransactionCommandAdvanced(tx_id); for (auto &future : futures) future.wait(); } } }; class CartesianCursor : public Cursor { public: CartesianCursor(const Cartesian &self, database::GraphDbAccessor &db) : self_(self), left_op_cursor_(self.left_op()->MakeCursor(db)), right_op_cursor_(self_.right_op()->MakeCursor(db)) { CHECK(left_op_cursor_ != nullptr) << "CartesianCursor: Missing left operator cursor."; CHECK(right_op_cursor_ != nullptr) << "CartesianCursor: Missing right operator cursor."; } bool Pull(Frame &frame, Context &context) override { auto copy_frame = [&frame]() { std::vector result; for (auto &elem : frame.elems()) { result.emplace_back(std::move(elem)); } return result; }; if (!cartesian_pull_initialized_) { // Pull all left_op frames. while (left_op_cursor_->Pull(frame, context)) { left_op_frames_.emplace_back(copy_frame()); } // We're setting the iterator to 'end' here so it pulls the right cursor. left_op_frames_it_ = left_op_frames_.end(); cartesian_pull_initialized_ = true; } // If left operator yielded zero results there is no cartesian product. if (left_op_frames_.empty()) { return false; } auto restore_frame = [&frame](const std::vector &symbols, const std::vector &restore_from) { for (const auto &symbol : symbols) { frame[symbol] = restore_from[symbol.position()]; } }; if (left_op_frames_it_ == left_op_frames_.end()) { // Advance right_op_cursor_. if (!right_op_cursor_->Pull(frame, context)) return false; right_op_frame_ = copy_frame(); left_op_frames_it_ = left_op_frames_.begin(); } else { // Make sure right_op_cursor last pulled results are on frame. restore_frame(self_.right_symbols(), right_op_frame_); } restore_frame(self_.left_symbols(), *left_op_frames_it_); left_op_frames_it_++; return true; } void Reset() override { left_op_cursor_->Reset(); right_op_cursor_->Reset(); right_op_frame_.clear(); left_op_frames_.clear(); left_op_frames_it_ = left_op_frames_.end(); cartesian_pull_initialized_ = false; } private: const Cartesian &self_; std::vector> left_op_frames_; std::vector right_op_frame_; const std::unique_ptr left_op_cursor_; const std::unique_ptr right_op_cursor_; std::vector>::iterator left_op_frames_it_; bool cartesian_pull_initialized_{false}; }; } // namespace std::unique_ptr Synchronize::MakeCursor( database::GraphDbAccessor &db) const { return std::make_unique(*this, db); } bool Cartesian::Accept(HierarchicalLogicalOperatorVisitor &visitor) { if (visitor.PreVisit(*this)) { left_op_->Accept(visitor) && right_op_->Accept(visitor); } return visitor.PostVisit(*this); } std::unique_ptr Cartesian::MakeCursor( database::GraphDbAccessor &db) const { return std::make_unique(*this, db); } std::vector Cartesian::ModifiedSymbols(const SymbolTable &table) const { auto symbols = left_op_->ModifiedSymbols(table); auto right = right_op_->ModifiedSymbols(table); symbols.insert(symbols.end(), right.begin(), right.end()); return symbols; } } // namespace query::plan BOOST_CLASS_EXPORT_IMPLEMENT(query::plan::Once); BOOST_CLASS_EXPORT_IMPLEMENT(query::plan::CreateNode); BOOST_CLASS_EXPORT_IMPLEMENT(query::plan::CreateExpand); BOOST_CLASS_EXPORT_IMPLEMENT(query::plan::ScanAll); BOOST_CLASS_EXPORT_IMPLEMENT(query::plan::ScanAllByLabel); BOOST_CLASS_EXPORT_IMPLEMENT(query::plan::ScanAllByLabelPropertyRange); BOOST_CLASS_EXPORT_IMPLEMENT(query::plan::ScanAllByLabelPropertyValue); BOOST_CLASS_EXPORT_IMPLEMENT(query::plan::Expand); BOOST_CLASS_EXPORT_IMPLEMENT(query::plan::ExpandVariable); BOOST_CLASS_EXPORT_IMPLEMENT(query::plan::Filter); BOOST_CLASS_EXPORT_IMPLEMENT(query::plan::Produce); BOOST_CLASS_EXPORT_IMPLEMENT(query::plan::ConstructNamedPath); BOOST_CLASS_EXPORT_IMPLEMENT(query::plan::Delete); BOOST_CLASS_EXPORT_IMPLEMENT(query::plan::SetProperty); BOOST_CLASS_EXPORT_IMPLEMENT(query::plan::SetProperties); BOOST_CLASS_EXPORT_IMPLEMENT(query::plan::SetLabels); BOOST_CLASS_EXPORT_IMPLEMENT(query::plan::RemoveProperty); BOOST_CLASS_EXPORT_IMPLEMENT(query::plan::RemoveLabels); BOOST_CLASS_EXPORT_IMPLEMENT(query::plan::ExpandUniquenessFilter); BOOST_CLASS_EXPORT_IMPLEMENT( query::plan::ExpandUniquenessFilter); BOOST_CLASS_EXPORT_IMPLEMENT(query::plan::Accumulate); BOOST_CLASS_EXPORT_IMPLEMENT(query::plan::Aggregate); BOOST_CLASS_EXPORT_IMPLEMENT(query::plan::Skip); BOOST_CLASS_EXPORT_IMPLEMENT(query::plan::Limit); BOOST_CLASS_EXPORT_IMPLEMENT(query::plan::OrderBy); BOOST_CLASS_EXPORT_IMPLEMENT(query::plan::Merge); BOOST_CLASS_EXPORT_IMPLEMENT(query::plan::Optional); BOOST_CLASS_EXPORT_IMPLEMENT(query::plan::Unwind); BOOST_CLASS_EXPORT_IMPLEMENT(query::plan::Distinct); BOOST_CLASS_EXPORT_IMPLEMENT(query::plan::CreateIndex); BOOST_CLASS_EXPORT_IMPLEMENT(query::plan::Union); BOOST_CLASS_EXPORT_IMPLEMENT(query::plan::PullRemote); BOOST_CLASS_EXPORT_IMPLEMENT(query::plan::Synchronize); BOOST_CLASS_EXPORT_IMPLEMENT(query::plan::Cartesian);