2017-04-11 21:11:48 +08:00
|
|
|
#include <algorithm>
|
|
|
|
#include <iterator>
|
|
|
|
#include <memory>
|
|
|
|
#include <vector>
|
|
|
|
|
|
|
|
#include "gmock/gmock.h"
|
|
|
|
#include "gtest/gtest.h"
|
|
|
|
|
2018-10-05 18:37:23 +08:00
|
|
|
#include "database/single_node/graph_db.hpp"
|
2017-04-11 21:11:48 +08:00
|
|
|
#include "query/context.hpp"
|
|
|
|
#include "query/exceptions.hpp"
|
2017-04-13 16:01:16 +08:00
|
|
|
#include "query/plan/operator.hpp"
|
2017-04-11 21:11:48 +08:00
|
|
|
#include "query_plan_common.hpp"
|
|
|
|
|
|
|
|
using namespace query;
|
|
|
|
using namespace query::plan;
|
2019-08-22 20:50:57 +08:00
|
|
|
using query::test_common::ToIntList;
|
|
|
|
using query::test_common::ToIntMap;
|
2017-10-30 17:43:25 +08:00
|
|
|
using testing::UnorderedElementsAre;
|
2017-04-11 21:11:48 +08:00
|
|
|
|
|
|
|
TEST(QueryPlan, Accumulate) {
  // Emulates running these two queries against an empty database:
  //   CREATE ({x:0})-[:T]->({x:0})
  //   MATCH (n)--(m) SET n.x = n.x + 1, m.x = m.x + 1 RETURN n.x, m.x
  // Without an Accumulate operator the returned rows are [[1, 1], [2, 2]];
  // with accumulation they are [[2, 2], [2, 2]].
  //
  // The scenario is executed twice, first without and then with accumulation,
  // each time against a freshly constructed database.
  for (const bool accumulate : {false, true}) {
    database::GraphDb db;
    auto dba = db.Access();
    auto prop = dba.Property("x");

    // CREATE ({x:0})-[:T]->({x:0})
    auto first_vertex = dba.InsertVertex();
    first_vertex.PropsSet(prop, PropertyValue(0));
    auto second_vertex = dba.InsertVertex();
    second_vertex.PropsSet(prop, PropertyValue(0));
    dba.InsertEdge(first_vertex, second_vertex, dba.EdgeType("T"));
    dba.AdvanceCommand();

    AstStorage storage;
    SymbolTable symbol_table;

    // MATCH (n)--(m)
    auto scan_n = MakeScanAll(storage, symbol_table, "n");
    auto expand_m = MakeExpand(storage, symbol_table, scan_n.op_, scan_n.sym_,
                               "r", EdgeAtom::Direction::BOTH, {}, "m", false,
                               storage::View::OLD);

    // SET n.x = n.x + 1, m.x = m.x + 1
    auto one = LITERAL(1);
    auto n_p = PROPERTY_LOOKUP(IDENT("n")->MapTo(scan_n.sym_), prop);
    auto set_n_p = std::make_shared<plan::SetProperty>(expand_m.op_, prop, n_p,
                                                       ADD(n_p, one));
    auto m_p = PROPERTY_LOOKUP(IDENT("m")->MapTo(expand_m.node_sym_), prop);
    auto set_m_p =
        std::make_shared<plan::SetProperty>(set_n_p, prop, m_p, ADD(m_p, one));

    // Optionally place an Accumulate operator between the SETs and the RETURN.
    std::shared_ptr<LogicalOperator> last_op = set_m_p;
    if (accumulate) {
      const std::vector<Symbol> accumulated_symbols{scan_n.sym_,
                                                    expand_m.node_sym_};
      last_op = std::make_shared<Accumulate>(last_op, accumulated_symbols);
    }

    // RETURN n.x, m.x
    auto n_p_ne =
        NEXPR("n.p", n_p)->MapTo(symbol_table.CreateSymbol("n_p_ne", true));
    auto m_p_ne =
        NEXPR("m.p", m_p)->MapTo(symbol_table.CreateSymbol("m_p_ne", true));
    auto produce = MakeProduce(last_op, n_p_ne, m_p_ne);

    query::DbAccessor execution_dba(&dba);
    auto context = MakeContext(storage, symbol_table, &execution_dba);
    auto results = CollectProduce(*produce, &context);

    // Flatten the result rows into a single sequence of ints, row by row.
    std::vector<int> results_data;
    for (const auto &row : results) {
      for (const auto &column : row) {
        results_data.emplace_back(column.ValueInt());
      }
    }

    if (accumulate) {
      EXPECT_THAT(results_data, testing::ElementsAre(2, 2, 2, 2));
    } else {
      EXPECT_THAT(results_data, testing::ElementsAre(1, 1, 2, 2));
    }
  }
}
|
|
|
|
|
|
|
|
TEST(QueryPlan, AccumulateAdvance) {
  // Emulates 'CREATE (n) WITH n AS n MATCH (m) RETURN m'.
  // The scan over `m` is expected to yield a row only when Accumulate is asked
  // to advance the command: one pull with advancing, zero pulls without.
  for (const bool advance : {false, true}) {
    database::GraphDb db;
    auto dba = db.Access();
    AstStorage storage;
    SymbolTable symbol_table;

    // CREATE (n)
    NodeCreationInfo node;
    node.symbol = symbol_table.CreateSymbol("n", true);
    auto create = std::make_shared<CreateNode>(nullptr, node);

    // WITH n AS n -- the accumulation point, advancing the command on demand.
    const std::vector<Symbol> accumulated_symbols{node.symbol};
    auto accumulate =
        std::make_shared<Accumulate>(create, accumulated_symbols, advance);

    // MATCH (m)
    auto match = MakeScanAll(storage, symbol_table, "m", accumulate);

    query::DbAccessor execution_dba(&dba);
    auto context = MakeContext(storage, symbol_table, &execution_dba);

    const int expected_pulls = advance ? 1 : 0;
    EXPECT_EQ(expected_pulls, PullAll(*match.op_, &context));
  }
}
|
|
|
|
|
|
|
|
std::shared_ptr<Produce> MakeAggregationProduce(
|
|
|
|
std::shared_ptr<LogicalOperator> input, SymbolTable &symbol_table,
|
2018-05-22 22:45:52 +08:00
|
|
|
AstStorage &storage, const std::vector<Expression *> aggr_inputs,
|
2017-04-11 21:11:48 +08:00
|
|
|
const std::vector<Aggregation::Op> aggr_ops,
|
|
|
|
const std::vector<Expression *> group_by_exprs,
|
|
|
|
const std::vector<Symbol> remember) {
|
|
|
|
// prepare all the aggregations
|
|
|
|
std::vector<Aggregate::Element> aggregates;
|
|
|
|
std::vector<NamedExpression *> named_expressions;
|
|
|
|
|
|
|
|
auto aggr_inputs_it = aggr_inputs.begin();
|
|
|
|
for (auto aggr_op : aggr_ops) {
|
|
|
|
// TODO change this from using IDENT to using AGGREGATION
|
|
|
|
// once AGGREGATION is handled properly in ExpressionEvaluation
|
2019-02-05 20:16:07 +08:00
|
|
|
auto aggr_sym = symbol_table.CreateSymbol("aggregation", true);
|
|
|
|
auto named_expr =
|
|
|
|
NEXPR("", IDENT("aggregation")->MapTo(aggr_sym))
|
|
|
|
->MapTo(symbol_table.CreateSymbol("named_expression", true));
|
2017-04-11 21:11:48 +08:00
|
|
|
named_expressions.push_back(named_expr);
|
Collect Map added
Summary:
Tests are on the way. Please first comment if you're OK with this implementation, some points are discussable.
What works now:
```
bash:MEMGRAPH_ROOT/build/>./tests/manual/console 10
MG>MATCH (n) RETURN COLLECT("age_" + n.age, n.height)
+-----------------------------------------------------------------------------------------------------------------------------------+
| COLLECT("age_" + n.age, n.height) |
+-----------------------------------------------------------------------------------------------------------------------------------+
| {age_10: 176, age_13: 180, age_24: 172, age_25: 179, age_32: 123, age_33: 186, age_37: 147, age_43: 162, age_49: 126, age_6: 170} |
+-----------------------------------------------------------------------------------------------------------------------------------+
```
Reviewers: mislav.bradac, teon.banek, buda
Reviewed By: mislav.bradac, buda
Subscribers: pullbot
Differential Revision: https://phabricator.memgraph.io/D695
2017-08-23 16:43:45 +08:00
|
|
|
// the key expression is only used in COLLECT_MAP
|
|
|
|
Expression *key_expr_ptr =
|
|
|
|
aggr_op == Aggregation::Op::COLLECT_MAP ? LITERAL("key") : nullptr;
|
|
|
|
aggregates.emplace_back(
|
2019-02-05 20:16:07 +08:00
|
|
|
Aggregate::Element{*aggr_inputs_it++, key_expr_ptr, aggr_op, aggr_sym});
|
2017-04-11 21:11:48 +08:00
|
|
|
}
|
|
|
|
|
Collect Map added
Summary:
Tests are on the way. Please first comment if you're OK with this implementation, some points are discussable.
What works now:
```
bash:MEMGRAPH_ROOT/build/>./tests/manual/console 10
MG>MATCH (n) RETURN COLLECT("age_" + n.age, n.height)
+-----------------------------------------------------------------------------------------------------------------------------------+
| COLLECT("age_" + n.age, n.height) |
+-----------------------------------------------------------------------------------------------------------------------------------+
| {age_10: 176, age_13: 180, age_24: 172, age_25: 179, age_32: 123, age_33: 186, age_37: 147, age_43: 162, age_49: 126, age_6: 170} |
+-----------------------------------------------------------------------------------------------------------------------------------+
```
Reviewers: mislav.bradac, teon.banek, buda
Reviewed By: mislav.bradac, buda
Subscribers: pullbot
Differential Revision: https://phabricator.memgraph.io/D695
2017-08-23 16:43:45 +08:00
|
|
|
// Produce will also evaluate group_by expressions and return them after the
|
|
|
|
// aggregations.
|
2017-04-11 21:11:48 +08:00
|
|
|
for (auto group_by_expr : group_by_exprs) {
|
2019-02-05 20:16:07 +08:00
|
|
|
auto named_expr =
|
|
|
|
NEXPR("", group_by_expr)
|
|
|
|
->MapTo(symbol_table.CreateSymbol("named_expression", true));
|
2017-04-11 21:11:48 +08:00
|
|
|
named_expressions.push_back(named_expr);
|
|
|
|
}
|
|
|
|
auto aggregation =
|
|
|
|
std::make_shared<Aggregate>(input, aggregates, group_by_exprs, remember);
|
|
|
|
return std::make_shared<Produce>(aggregation, named_expressions);
|
|
|
|
}
|
|
|
|
|
Collect Map added
Summary:
Tests are on the way. Please first comment if you're OK with this implementation, some points are discussable.
What works now:
```
bash:MEMGRAPH_ROOT/build/>./tests/manual/console 10
MG>MATCH (n) RETURN COLLECT("age_" + n.age, n.height)
+-----------------------------------------------------------------------------------------------------------------------------------+
| COLLECT("age_" + n.age, n.height) |
+-----------------------------------------------------------------------------------------------------------------------------------+
| {age_10: 176, age_13: 180, age_24: 172, age_25: 179, age_32: 123, age_33: 186, age_37: 147, age_43: 162, age_49: 126, age_6: 170} |
+-----------------------------------------------------------------------------------------------------------------------------------+
```
Reviewers: mislav.bradac, teon.banek, buda
Reviewed By: mislav.bradac, buda
Subscribers: pullbot
Differential Revision: https://phabricator.memgraph.io/D695
2017-08-23 16:43:45 +08:00
|
|
|
/** Test fixture for all the aggregation ops in one return. */
|
2017-05-30 15:37:24 +08:00
|
|
|
class QueryPlanAggregateOps : public ::testing::Test {
|
|
|
|
protected:
|
2018-10-09 17:09:10 +08:00
|
|
|
database::GraphDb db;
|
2019-04-15 17:36:43 +08:00
|
|
|
database::GraphDbAccessor dba{db.Access()};
|
2018-01-16 17:09:15 +08:00
|
|
|
storage::Property prop = dba.Property("prop");
|
2017-04-11 21:11:48 +08:00
|
|
|
|
2018-05-22 22:45:52 +08:00
|
|
|
AstStorage storage;
|
2017-04-11 21:11:48 +08:00
|
|
|
SymbolTable symbol_table;
|
|
|
|
|
2017-05-30 15:37:24 +08:00
|
|
|
void AddData() {
|
|
|
|
// setup is several nodes most of which have an int property set
|
|
|
|
// we will take the sum, avg, min, max and count
|
|
|
|
// we won't group by anything
|
2019-08-28 19:10:27 +08:00
|
|
|
dba.InsertVertex().PropsSet(prop, PropertyValue(5));
|
|
|
|
dba.InsertVertex().PropsSet(prop, PropertyValue(7));
|
|
|
|
dba.InsertVertex().PropsSet(prop, PropertyValue(12));
|
2017-05-30 15:37:24 +08:00
|
|
|
// a missing property (null) gets ignored by all aggregations except
|
|
|
|
// COUNT(*)
|
2017-10-30 17:43:25 +08:00
|
|
|
dba.InsertVertex();
|
|
|
|
dba.AdvanceCommand();
|
2017-05-30 15:37:24 +08:00
|
|
|
}
|
2017-04-11 21:11:48 +08:00
|
|
|
|
2017-05-30 15:37:24 +08:00
|
|
|
auto AggregationResults(bool with_group_by,
|
|
|
|
std::vector<Aggregation::Op> ops = {
|
|
|
|
Aggregation::Op::COUNT, Aggregation::Op::COUNT,
|
|
|
|
Aggregation::Op::MIN, Aggregation::Op::MAX,
|
|
|
|
Aggregation::Op::SUM, Aggregation::Op::AVG,
|
Collect Map added
Summary:
Tests are on the way. Please first comment if you're OK with this implementation, some points are discussable.
What works now:
```
bash:MEMGRAPH_ROOT/build/>./tests/manual/console 10
MG>MATCH (n) RETURN COLLECT("age_" + n.age, n.height)
+-----------------------------------------------------------------------------------------------------------------------------------+
| COLLECT("age_" + n.age, n.height) |
+-----------------------------------------------------------------------------------------------------------------------------------+
| {age_10: 176, age_13: 180, age_24: 172, age_25: 179, age_32: 123, age_33: 186, age_37: 147, age_43: 162, age_49: 126, age_6: 170} |
+-----------------------------------------------------------------------------------------------------------------------------------+
```
Reviewers: mislav.bradac, teon.banek, buda
Reviewed By: mislav.bradac, buda
Subscribers: pullbot
Differential Revision: https://phabricator.memgraph.io/D695
2017-08-23 16:43:45 +08:00
|
|
|
Aggregation::Op::COLLECT_LIST,
|
|
|
|
Aggregation::Op::COLLECT_MAP}) {
|
2017-05-30 15:37:24 +08:00
|
|
|
// match all nodes and perform aggregations
|
|
|
|
auto n = MakeScanAll(storage, symbol_table, "n");
|
2019-02-05 20:16:07 +08:00
|
|
|
auto n_p = PROPERTY_LOOKUP(IDENT("n")->MapTo(n.sym_), prop);
|
2017-05-30 15:37:24 +08:00
|
|
|
|
Collect Map added
Summary:
Tests are on the way. Please first comment if you're OK with this implementation, some points are discussable.
What works now:
```
bash:MEMGRAPH_ROOT/build/>./tests/manual/console 10
MG>MATCH (n) RETURN COLLECT("age_" + n.age, n.height)
+-----------------------------------------------------------------------------------------------------------------------------------+
| COLLECT("age_" + n.age, n.height) |
+-----------------------------------------------------------------------------------------------------------------------------------+
| {age_10: 176, age_13: 180, age_24: 172, age_25: 179, age_32: 123, age_33: 186, age_37: 147, age_43: 162, age_49: 126, age_6: 170} |
+-----------------------------------------------------------------------------------------------------------------------------------+
```
Reviewers: mislav.bradac, teon.banek, buda
Reviewed By: mislav.bradac, buda
Subscribers: pullbot
Differential Revision: https://phabricator.memgraph.io/D695
2017-08-23 16:43:45 +08:00
|
|
|
std::vector<Expression *> aggregation_expressions(ops.size(), n_p);
|
2017-05-30 15:37:24 +08:00
|
|
|
std::vector<Expression *> group_bys;
|
|
|
|
if (with_group_by) group_bys.push_back(n_p);
|
|
|
|
aggregation_expressions[0] = nullptr;
|
|
|
|
auto produce =
|
|
|
|
MakeAggregationProduce(n.op_, symbol_table, storage,
|
|
|
|
aggregation_expressions, ops, group_bys, {});
|
2019-09-11 22:10:53 +08:00
|
|
|
query::DbAccessor execution_dba(&dba);
|
|
|
|
auto context = MakeContext(storage, symbol_table, &execution_dba);
|
Remove GraphDbAccessor and storage types from Ast
Summary:
This diff removes the need for a database when parsing a query and
creating an Ast. Instead of storing storage::{Label,Property,EdgeType}
in Ast nodes, we store the name and an index into all of the names. This
allows for easy creation of a map from {Label,Property,EdgeType} index
into the concrete storage type. Obviously, this comes with a performance
penalty during execution, but it should be minor. The upside is that the
query/frontend minimally depends on storage (PropertyValue), which makes
writing tests easier as well as running them a lot faster (there is no
database setup). This is most noticeable in the ast_serialization test
which took a long time due to start up of a distributed database.
Reviewers: mtomic, llugovic
Reviewed By: mtomic
Subscribers: mferencevic, pullbot
Differential Revision: https://phabricator.memgraph.io/D1774
2019-01-14 21:41:37 +08:00
|
|
|
return CollectProduce(*produce, &context);
|
2017-05-30 15:37:24 +08:00
|
|
|
}
|
|
|
|
};
|
|
|
|
|
|
|
|
TEST_F(QueryPlanAggregateOps, WithData) {
|
|
|
|
AddData();
|
|
|
|
auto results = AggregationResults(false);
|
2017-04-11 21:11:48 +08:00
|
|
|
|
|
|
|
ASSERT_EQ(results.size(), 1);
|
Collect Map added
Summary:
Tests are on the way. Please first comment if you're OK with this implementation, some points are discussable.
What works now:
```
bash:MEMGRAPH_ROOT/build/>./tests/manual/console 10
MG>MATCH (n) RETURN COLLECT("age_" + n.age, n.height)
+-----------------------------------------------------------------------------------------------------------------------------------+
| COLLECT("age_" + n.age, n.height) |
+-----------------------------------------------------------------------------------------------------------------------------------+
| {age_10: 176, age_13: 180, age_24: 172, age_25: 179, age_32: 123, age_33: 186, age_37: 147, age_43: 162, age_49: 126, age_6: 170} |
+-----------------------------------------------------------------------------------------------------------------------------------+
```
Reviewers: mislav.bradac, teon.banek, buda
Reviewed By: mislav.bradac, buda
Subscribers: pullbot
Differential Revision: https://phabricator.memgraph.io/D695
2017-08-23 16:43:45 +08:00
|
|
|
ASSERT_EQ(results[0].size(), 8);
|
2017-05-06 23:57:39 +08:00
|
|
|
// count(*)
|
2017-04-11 21:11:48 +08:00
|
|
|
ASSERT_EQ(results[0][0].type(), TypedValue::Type::Int);
|
2019-08-22 20:50:57 +08:00
|
|
|
EXPECT_EQ(results[0][0].ValueInt(), 4);
|
2017-05-06 23:57:39 +08:00
|
|
|
// count
|
2017-04-11 21:11:48 +08:00
|
|
|
ASSERT_EQ(results[0][1].type(), TypedValue::Type::Int);
|
2019-08-22 20:50:57 +08:00
|
|
|
EXPECT_EQ(results[0][1].ValueInt(), 3);
|
2017-05-06 23:57:39 +08:00
|
|
|
// min
|
2017-04-11 21:11:48 +08:00
|
|
|
ASSERT_EQ(results[0][2].type(), TypedValue::Type::Int);
|
2019-08-22 20:50:57 +08:00
|
|
|
EXPECT_EQ(results[0][2].ValueInt(), 5);
|
2017-05-06 23:57:39 +08:00
|
|
|
// max
|
2017-04-11 21:11:48 +08:00
|
|
|
ASSERT_EQ(results[0][3].type(), TypedValue::Type::Int);
|
2019-08-22 20:50:57 +08:00
|
|
|
EXPECT_EQ(results[0][3].ValueInt(), 12);
|
2017-05-06 23:57:39 +08:00
|
|
|
// sum
|
|
|
|
ASSERT_EQ(results[0][4].type(), TypedValue::Type::Int);
|
2019-08-22 20:50:57 +08:00
|
|
|
EXPECT_EQ(results[0][4].ValueInt(), 24);
|
2017-04-11 21:11:48 +08:00
|
|
|
// avg
|
2017-05-06 23:57:39 +08:00
|
|
|
ASSERT_EQ(results[0][5].type(), TypedValue::Type::Double);
|
2019-08-22 20:50:57 +08:00
|
|
|
EXPECT_FLOAT_EQ(results[0][5].ValueDouble(), 24 / 3.0);
|
Collect Map added
Summary:
Tests are on the way. Please first comment if you're OK with this implementation, some points are discussable.
What works now:
```
bash:MEMGRAPH_ROOT/build/>./tests/manual/console 10
MG>MATCH (n) RETURN COLLECT("age_" + n.age, n.height)
+-----------------------------------------------------------------------------------------------------------------------------------+
| COLLECT("age_" + n.age, n.height) |
+-----------------------------------------------------------------------------------------------------------------------------------+
| {age_10: 176, age_13: 180, age_24: 172, age_25: 179, age_32: 123, age_33: 186, age_37: 147, age_43: 162, age_49: 126, age_6: 170} |
+-----------------------------------------------------------------------------------------------------------------------------------+
```
Reviewers: mislav.bradac, teon.banek, buda
Reviewed By: mislav.bradac, buda
Subscribers: pullbot
Differential Revision: https://phabricator.memgraph.io/D695
2017-08-23 16:43:45 +08:00
|
|
|
// collect list
|
2017-05-19 21:49:25 +08:00
|
|
|
ASSERT_EQ(results[0][6].type(), TypedValue::Type::List);
|
2019-08-22 20:50:57 +08:00
|
|
|
EXPECT_THAT(ToIntList(results[0][6]), UnorderedElementsAre(5, 7, 12));
|
Collect Map added
Summary:
Tests are on the way. Please first comment if you're OK with this implementation, some points are discussable.
What works now:
```
bash:MEMGRAPH_ROOT/build/>./tests/manual/console 10
MG>MATCH (n) RETURN COLLECT("age_" + n.age, n.height)
+-----------------------------------------------------------------------------------------------------------------------------------+
| COLLECT("age_" + n.age, n.height) |
+-----------------------------------------------------------------------------------------------------------------------------------+
| {age_10: 176, age_13: 180, age_24: 172, age_25: 179, age_32: 123, age_33: 186, age_37: 147, age_43: 162, age_49: 126, age_6: 170} |
+-----------------------------------------------------------------------------------------------------------------------------------+
```
Reviewers: mislav.bradac, teon.banek, buda
Reviewed By: mislav.bradac, buda
Subscribers: pullbot
Differential Revision: https://phabricator.memgraph.io/D695
2017-08-23 16:43:45 +08:00
|
|
|
// collect map
|
|
|
|
ASSERT_EQ(results[0][7].type(), TypedValue::Type::Map);
|
2019-08-22 20:50:57 +08:00
|
|
|
auto map = ToIntMap(results[0][7]);
|
Collect Map added
Summary:
Tests are on the way. Please first comment if you're OK with this implementation, some points are discussable.
What works now:
```
bash:MEMGRAPH_ROOT/build/>./tests/manual/console 10
MG>MATCH (n) RETURN COLLECT("age_" + n.age, n.height)
+-----------------------------------------------------------------------------------------------------------------------------------+
| COLLECT("age_" + n.age, n.height) |
+-----------------------------------------------------------------------------------------------------------------------------------+
| {age_10: 176, age_13: 180, age_24: 172, age_25: 179, age_32: 123, age_33: 186, age_37: 147, age_43: 162, age_49: 126, age_6: 170} |
+-----------------------------------------------------------------------------------------------------------------------------------+
```
Reviewers: mislav.bradac, teon.banek, buda
Reviewed By: mislav.bradac, buda
Subscribers: pullbot
Differential Revision: https://phabricator.memgraph.io/D695
2017-08-23 16:43:45 +08:00
|
|
|
ASSERT_EQ(map.size(), 1);
|
|
|
|
EXPECT_EQ(map.begin()->first, "key");
|
|
|
|
EXPECT_FALSE(std::set<int>({5, 7, 12}).insert(map.begin()->second).second);
|
2017-04-11 21:11:48 +08:00
|
|
|
}
|
|
|
|
|
2017-05-30 15:37:24 +08:00
|
|
|
// With grouping and an empty database, each aggregation op on its own must
// produce no rows at all.
TEST_F(QueryPlanAggregateOps, WithoutDataWithGroupBy) {
  for (const auto op :
       {Aggregation::Op::COUNT, Aggregation::Op::SUM, Aggregation::Op::AVG,
        Aggregation::Op::MIN, Aggregation::Op::MAX,
        Aggregation::Op::COLLECT_LIST, Aggregation::Op::COLLECT_MAP}) {
    auto results = AggregationResults(true, {op});
    EXPECT_EQ(results.size(), 0);
  }
}
|
|
|
|
|
|
|
|
// Without grouping and with an empty database, the default aggregation ops
// still produce a single row: zero counts, null min/max/sum/avg and empty
// collections.
TEST_F(QueryPlanAggregateOps, WithoutDataWithoutGroupBy) {
  auto results = AggregationResults(false);

  ASSERT_EQ(results.size(), 1);
  const auto &row = results[0];
  ASSERT_EQ(row.size(), 8);

  // count(*)
  ASSERT_EQ(row[0].type(), TypedValue::Type::Int);
  EXPECT_EQ(row[0].ValueInt(), 0);

  // count
  ASSERT_EQ(row[1].type(), TypedValue::Type::Int);
  EXPECT_EQ(row[1].ValueInt(), 0);

  // min, max, sum and avg are all null when there is nothing to aggregate.
  EXPECT_TRUE(row[2].IsNull());  // min
  EXPECT_TRUE(row[3].IsNull());  // max
  EXPECT_TRUE(row[4].IsNull());  // sum
  EXPECT_TRUE(row[5].IsNull());  // avg

  // collect list
  ASSERT_EQ(row[6].type(), TypedValue::Type::List);
  EXPECT_EQ(ToIntList(row[6]).size(), 0);

  // collect map
  ASSERT_EQ(row[7].type(), TypedValue::Type::Map);
  EXPECT_EQ(ToIntMap(row[7]).size(), 0);
}
|
|
|
|
|
2017-04-11 21:11:48 +08:00
|
|
|
TEST(QueryPlan, AggregateGroupByValues) {
|
Collect Map added
Summary:
Tests are on the way. Please first comment if you're OK with this implementation, some points are discussable.
What works now:
```
bash:MEMGRAPH_ROOT/build/>./tests/manual/console 10
MG>MATCH (n) RETURN COLLECT("age_" + n.age, n.height)
+-----------------------------------------------------------------------------------------------------------------------------------+
| COLLECT("age_" + n.age, n.height) |
+-----------------------------------------------------------------------------------------------------------------------------------+
| {age_10: 176, age_13: 180, age_24: 172, age_25: 179, age_32: 123, age_33: 186, age_37: 147, age_43: 162, age_49: 126, age_6: 170} |
+-----------------------------------------------------------------------------------------------------------------------------------+
```
Reviewers: mislav.bradac, teon.banek, buda
Reviewed By: mislav.bradac, buda
Subscribers: pullbot
Differential Revision: https://phabricator.memgraph.io/D695
2017-08-23 16:43:45 +08:00
|
|
|
// Tests that distinct groups are aggregated properly for values of all types.
|
|
|
|
// Also test the "remember" part of the Aggregation API as final results are
|
|
|
|
// obtained via a property lookup of a remembered node.
|
2018-10-09 17:09:10 +08:00
|
|
|
database::GraphDb db;
|
2019-04-15 17:36:43 +08:00
|
|
|
auto dba = db.Access();
|
2017-04-11 21:11:48 +08:00
|
|
|
|
Clean-up TypedValue misuse
Summary:
In a bunch of places `TypedValue` was used where `PropertyValue` should be. A lot of times it was only because `TypedValue` serialization code could be reused for `PropertyValue`, only without providing callbacks for `VERTEX`, `EDGE` and `PATH`. So first I wrote separate serialization code for `PropertyValue` and put it into storage folder. Then I fixed all the places where `TypedValue` was incorrectly used instead of `PropertyValue`. I also disabled implicit `TypedValue` to `PropertyValue` conversion in hopes of preventing misuse in the future.
After that, I wrote code for `VertexAccessor` and `EdgeAccessor` serialization and put it into `storage` folder because it was almost duplicated in distributed BFS and pull produce RPC messages. On the sender side, some subset of records (old or new or both) is serialized, and on the reciever side, records are deserialized and immediately put into transaction cache.
Then I rewrote the `TypedValue` serialization functions (`SaveCapnpTypedValue` and `LoadCapnpTypedValue`) to not take callbacks for `VERTEX`, `EDGE` and `PATH`, but use accessor serialization functions instead. That means that any code that wants to use `TypedValue` serialization must hold a reference to `GraphDbAccessor` and `DataManager`, so that should make clients reconsider if they really want to use `TypedValue` instead of `PropertyValue`.
Reviewers: teon.banek, msantl
Reviewed By: teon.banek
Subscribers: pullbot
Differential Revision: https://phabricator.memgraph.io/D1598
2018-09-13 18:12:07 +08:00
|
|
|
// a vector of PropertyValue to be set as property values on vertices
|
2017-04-11 21:11:48 +08:00
|
|
|
// most of them should result in a distinct group (commented where not)
|
Clean-up TypedValue misuse
Summary:
In a bunch of places `TypedValue` was used where `PropertyValue` should be. A lot of times it was only because `TypedValue` serialization code could be reused for `PropertyValue`, only without providing callbacks for `VERTEX`, `EDGE` and `PATH`. So first I wrote separate serialization code for `PropertyValue` and put it into storage folder. Then I fixed all the places where `TypedValue` was incorrectly used instead of `PropertyValue`. I also disabled implicit `TypedValue` to `PropertyValue` conversion in hopes of preventing misuse in the future.
After that, I wrote code for `VertexAccessor` and `EdgeAccessor` serialization and put it into `storage` folder because it was almost duplicated in distributed BFS and pull produce RPC messages. On the sender side, some subset of records (old or new or both) is serialized, and on the reciever side, records are deserialized and immediately put into transaction cache.
Then I rewrote the `TypedValue` serialization functions (`SaveCapnpTypedValue` and `LoadCapnpTypedValue`) to not take callbacks for `VERTEX`, `EDGE` and `PATH`, but use accessor serialization functions instead. That means that any code that wants to use `TypedValue` serialization must hold a reference to `GraphDbAccessor` and `DataManager`, so that should make clients reconsider if they really want to use `TypedValue` instead of `PropertyValue`.
Reviewers: teon.banek, msantl
Reviewed By: teon.banek
Subscribers: pullbot
Differential Revision: https://phabricator.memgraph.io/D1598
2018-09-13 18:12:07 +08:00
|
|
|
std::vector<PropertyValue> group_by_vals;
|
2017-04-11 21:11:48 +08:00
|
|
|
group_by_vals.emplace_back(4);
|
|
|
|
group_by_vals.emplace_back(7);
|
|
|
|
group_by_vals.emplace_back(7.3);
|
|
|
|
group_by_vals.emplace_back(7.2);
|
|
|
|
group_by_vals.emplace_back("Johhny");
|
|
|
|
group_by_vals.emplace_back("Jane");
|
|
|
|
group_by_vals.emplace_back("1");
|
|
|
|
group_by_vals.emplace_back(true);
|
|
|
|
group_by_vals.emplace_back(false);
|
2019-08-28 19:10:27 +08:00
|
|
|
group_by_vals.emplace_back(std::vector<PropertyValue>{PropertyValue(1)});
|
|
|
|
group_by_vals.emplace_back(
|
|
|
|
std::vector<PropertyValue>{PropertyValue(1), PropertyValue(2)});
|
|
|
|
group_by_vals.emplace_back(
|
|
|
|
std::vector<PropertyValue>{PropertyValue(2), PropertyValue(1)});
|
2019-08-27 20:24:33 +08:00
|
|
|
group_by_vals.emplace_back(PropertyValue());
|
2017-04-11 21:11:48 +08:00
|
|
|
// should NOT result in another group because 7.0 == 7
|
|
|
|
group_by_vals.emplace_back(7.0);
|
|
|
|
// should NOT result in another group
|
2019-08-28 19:10:27 +08:00
|
|
|
group_by_vals.emplace_back(
|
|
|
|
std::vector<PropertyValue>{PropertyValue(1), PropertyValue(2.0)});
|
2017-04-11 21:11:48 +08:00
|
|
|
|
|
|
|
// generate a lot of vertices and set props on them
|
2017-10-30 17:43:25 +08:00
|
|
|
auto prop = dba.Property("prop");
|
2017-04-11 21:11:48 +08:00
|
|
|
for (int i = 0; i < 1000; ++i)
|
2017-10-30 17:43:25 +08:00
|
|
|
dba.InsertVertex().PropsSet(prop, group_by_vals[i % group_by_vals.size()]);
|
|
|
|
dba.AdvanceCommand();
|
2017-04-11 21:11:48 +08:00
|
|
|
|
2018-05-22 22:45:52 +08:00
|
|
|
AstStorage storage;
|
2017-04-11 21:11:48 +08:00
|
|
|
SymbolTable symbol_table;
|
|
|
|
|
|
|
|
// match all nodes and perform aggregations
|
|
|
|
auto n = MakeScanAll(storage, symbol_table, "n");
|
2019-02-05 20:16:07 +08:00
|
|
|
auto n_p = PROPERTY_LOOKUP(IDENT("n")->MapTo(n.sym_), prop);
|
2017-04-11 21:11:48 +08:00
|
|
|
|
|
|
|
auto produce =
|
|
|
|
MakeAggregationProduce(n.op_, symbol_table, storage, {n_p},
|
|
|
|
{Aggregation::Op::COUNT}, {n_p}, {n.sym_});
|
|
|
|
|
2019-09-11 22:10:53 +08:00
|
|
|
query::DbAccessor execution_dba(&dba);
|
|
|
|
auto context = MakeContext(storage, symbol_table, &execution_dba);
|
Remove GraphDbAccessor and storage types from Ast
Summary:
This diff removes the need for a database when parsing a query and
creating an Ast. Instead of storing storage::{Label,Property,EdgeType}
in Ast nodes, we store the name and an index into all of the names. This
allows for easy creation of a map from {Label,Property,EdgeType} index
into the concrete storage type. Obviously, this comes with a performance
penalty during execution, but it should be minor. The upside is that the
query/frontend minimally depends on storage (PropertyValue), which makes
writing tests easier as well as running them a lot faster (there is no
database setup). This is most noticeable in the ast_serialization test
which took a long time due to start up of a distributed database.
Reviewers: mtomic, llugovic
Reviewed By: mtomic
Subscribers: mferencevic, pullbot
Differential Revision: https://phabricator.memgraph.io/D1774
2019-01-14 21:41:37 +08:00
|
|
|
auto results = CollectProduce(*produce, &context);
|
2017-04-11 21:11:48 +08:00
|
|
|
ASSERT_EQ(results.size(), group_by_vals.size() - 2);
|
2019-06-03 22:54:20 +08:00
|
|
|
std::unordered_set<TypedValue, TypedValue::Hash, TypedValue::BoolEqual>
|
|
|
|
result_group_bys;
|
2017-04-11 21:11:48 +08:00
|
|
|
for (const auto &row : results) {
|
|
|
|
ASSERT_EQ(2, row.size());
|
|
|
|
result_group_bys.insert(row[1]);
|
|
|
|
}
|
|
|
|
ASSERT_EQ(result_group_bys.size(), group_by_vals.size() - 2);
|
2019-06-06 19:16:37 +08:00
|
|
|
std::vector<TypedValue> group_by_tvals;
|
|
|
|
group_by_tvals.reserve(group_by_vals.size());
|
|
|
|
for (const auto &v : group_by_vals) group_by_tvals.emplace_back(v);
|
2017-04-12 21:47:55 +08:00
|
|
|
EXPECT_TRUE(
|
2019-06-06 19:16:37 +08:00
|
|
|
std::is_permutation(group_by_tvals.begin(), group_by_tvals.end() - 2,
|
2017-04-12 21:47:55 +08:00
|
|
|
result_group_bys.begin(), TypedValue::BoolEqual{}));
|
2017-04-11 21:11:48 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
TEST(QueryPlan, AggregateMultipleGroupBy) {
  // Three properties cycle through 2, 3 and 5 distinct values respectively.
  // Grouping by all three at once is expected to yield one group for every
  // combination of values.
  database::GraphDb db;
  auto dba = db.Access();

  constexpr int kProp1Values = 2;
  constexpr int kProp2Values = 3;
  constexpr int kProp3Values = 5;
  constexpr int kCombinations = kProp1Values * kProp2Values * kProp3Values;

  auto prop1 = dba.Property("prop1");
  auto prop2 = dba.Property("prop2");
  auto prop3 = dba.Property("prop3");
  for (int i = 0; i < kCombinations; ++i) {
    auto vertex = dba.InsertVertex();
    vertex.PropsSet(prop1,
                    PropertyValue(static_cast<bool>(i % kProp1Values)));
    vertex.PropsSet(prop2, PropertyValue(i % kProp2Values));
    vertex.PropsSet(
        prop3, PropertyValue("value" + std::to_string(i % kProp3Values)));
  }
  dba.AdvanceCommand();

  AstStorage storage;
  SymbolTable symbol_table;

  // Scan all nodes, COUNT over n.prop1, group by (prop1, prop2, prop3).
  auto scan_all = MakeScanAll(storage, symbol_table, "n");
  auto lookup1 = PROPERTY_LOOKUP(IDENT("n")->MapTo(scan_all.sym_), prop1);
  auto lookup2 = PROPERTY_LOOKUP(IDENT("n")->MapTo(scan_all.sym_), prop2);
  auto lookup3 = PROPERTY_LOOKUP(IDENT("n")->MapTo(scan_all.sym_), prop3);

  auto produce = MakeAggregationProduce(
      scan_all.op_, symbol_table, storage, {lookup1},
      {Aggregation::Op::COUNT}, {lookup1, lookup2, lookup3},
      {scan_all.sym_});

  query::DbAccessor execution_dba(&dba);
  auto context = MakeContext(storage, symbol_table, &execution_dba);
  auto results = CollectProduce(*produce, &context);
  EXPECT_EQ(results.size(), kCombinations);
}
|
|
|
|
|
2017-04-13 22:47:11 +08:00
|
|
|
TEST(QueryPlan, AggregateNoInput) {
  // COUNT over a literal with no input operator (nullptr): the test expects
  // exactly one row holding a single Int equal to 1.
  database::GraphDb db;
  auto dba = db.Access();
  AstStorage storage;
  SymbolTable symbol_table;

  auto literal_two = LITERAL(2);
  auto produce =
      MakeAggregationProduce(nullptr, symbol_table, storage, {literal_two},
                             {Aggregation::Op::COUNT}, {}, {});

  query::DbAccessor execution_dba(&dba);
  auto context = MakeContext(storage, symbol_table, &execution_dba);
  auto results = CollectProduce(*produce, &context);

  EXPECT_EQ(1, results.size());
  EXPECT_EQ(1, results[0].size());
  const auto &count_value = results[0][0];
  EXPECT_EQ(TypedValue::Type::Int, count_value.type());
  EXPECT_EQ(1, count_value.ValueInt());
}
|
|
|
|
|
2017-04-12 21:47:55 +08:00
|
|
|
TEST(QueryPlan, AggregateCountEdgeCases) {
  // Regression checks for bugs found in COUNT aggregation. COUNT(n.prop) must
  // be correct for:
  //  - an empty database
  //  - 1 vertex without the property
  //  - 1 vertex with the property
  //  - 2 vertices, property set on one of them
  //  - 2 vertices, property set on both

  database::GraphDb db;
  auto dba = db.Access();
  auto prop = dba.Property("prop");

  AstStorage storage;
  SymbolTable symbol_table;

  auto scan_all = MakeScanAll(storage, symbol_table, "n");
  auto prop_lookup = PROPERTY_LOOKUP(IDENT("n")->MapTo(scan_all.sym_), prop);

  // Evaluates MATCH (n) RETURN count(n.prop).
  // Yields -1 if the plan produced no rows at all.
  auto count = [&]() {
    auto produce =
        MakeAggregationProduce(scan_all.op_, symbol_table, storage,
                               {prop_lookup}, {Aggregation::Op::COUNT}, {}, {});
    query::DbAccessor execution_dba(&dba);
    auto context = MakeContext(storage, symbol_table, &execution_dba);
    auto results = CollectProduce(*produce, &context);
    if (results.empty()) return -1L;
    EXPECT_EQ(1, results.size());
    EXPECT_EQ(1, results[0].size());
    EXPECT_EQ(TypedValue::Type::Int, results[0][0].type());
    return results[0][0].ValueInt();
  };

  // Writes the property on every vertex returned by dba.Vertices(false).
  auto set_prop_on_all_vertices = [&]() {
    for (auto vertex : dba.Vertices(false)) {
      vertex.PropsSet(prop, PropertyValue(42));
    }
  };

  // empty database
  EXPECT_EQ(0, count());

  // single vertex, property missing
  dba.InsertVertex();
  dba.AdvanceCommand();
  EXPECT_EQ(0, count());

  // single vertex, property present
  set_prop_on_all_vertices();
  dba.AdvanceCommand();
  EXPECT_EQ(1, count());

  // two vertices, only one has the property
  dba.InsertVertex();
  dba.AdvanceCommand();
  EXPECT_EQ(1, count());

  // two vertices, both have the property
  set_prop_on_all_vertices();
  dba.AdvanceCommand();
  EXPECT_EQ(2, count());
}
|
|
|
|
|
2017-04-14 23:14:14 +08:00
|
|
|
TEST(QueryPlan, AggregateFirstValueTypes) {
  // Exercises the exceptions raised by the type check performed on the first
  // aggregated value.

  database::GraphDb db;
  auto dba = db.Access();

  // A single vertex carrying one string and one int property.
  auto vertex = dba.InsertVertex();
  auto prop_string = dba.Property("string");
  vertex.PropsSet(prop_string, PropertyValue("johhny"));
  auto prop_int = dba.Property("int");
  vertex.PropsSet(prop_int, PropertyValue(12));
  dba.AdvanceCommand();

  AstStorage storage;
  SymbolTable symbol_table;

  auto scan_all = MakeScanAll(storage, symbol_table, "n");
  auto n_prop_string =
      PROPERTY_LOOKUP(IDENT("n")->MapTo(scan_all.sym_), prop_string);
  auto n_prop_int =
      PROPERTY_LOOKUP(IDENT("n")->MapTo(scan_all.sym_), prop_int);
  // The expression the string lookup is applied to, i.e. `n` itself.
  auto n_id = n_prop_string->expression_;

  // Builds and fully executes a single aggregation over `expression`.
  auto aggregate = [&](Expression *expression, Aggregation::Op aggr_op) {
    auto produce = MakeAggregationProduce(scan_all.op_, symbol_table, storage,
                                          {expression}, {aggr_op}, {}, {});
    query::DbAccessor execution_dba(&dba);
    auto context = MakeContext(storage, symbol_table, &execution_dba);
    CollectProduce(*produce, &context);
  };

  using AggrOps = std::initializer_list<Aggregation::Op>;
  // Runs each op in order; none of them is expected to throw.
  auto expect_success = [&](Expression *expression, AggrOps ops) {
    for (auto op : ops) aggregate(expression, op);
  };
  // Runs each op in order; each one must throw QueryRuntimeException.
  auto expect_failure = [&](Expression *expression, AggrOps ops) {
    for (auto op : ops) {
      EXPECT_THROW(aggregate(expression, op), QueryRuntimeException);
    }
  };

  // on a Vertex everything but COUNT and COLLECT fails
  expect_success(n_id, {Aggregation::Op::COUNT});
  expect_failure(n_id, {Aggregation::Op::MIN, Aggregation::Op::MAX,
                        Aggregation::Op::AVG, Aggregation::Op::SUM});

  // on strings only AVG and SUM fail
  expect_success(n_prop_string, {Aggregation::Op::COUNT, Aggregation::Op::MIN,
                                 Aggregation::Op::MAX});
  expect_failure(n_prop_string,
                 {Aggregation::Op::AVG, Aggregation::Op::SUM});

  // on ints every aggregation succeeds
  expect_success(n_prop_int,
                 {Aggregation::Op::COUNT, Aggregation::Op::MIN,
                  Aggregation::Op::MAX, Aggregation::Op::AVG,
                  Aggregation::Op::SUM, Aggregation::Op::COLLECT_LIST,
                  Aggregation::Op::COLLECT_MAP});
}
|
|
|
|
|
2017-04-11 21:11:48 +08:00
|
|
|
TEST(QueryPlan, AggregateTypes) {
|
|
|
|
// testing exceptions that can get emitted by an aggregation
|
|
|
|
// does not check all combinations that can result in an exception
|
|
|
|
// (that logic is defined and tested by TypedValue)
|
|
|
|
|
2018-10-09 17:09:10 +08:00
|
|
|
database::GraphDb db;
|
2019-04-15 17:36:43 +08:00
|
|
|
auto dba = db.Access();
|
2017-04-11 21:11:48 +08:00
|
|
|
|
2017-10-30 17:43:25 +08:00
|
|
|
auto p1 = dba.Property("p1"); // has only string props
|
2019-08-28 19:10:27 +08:00
|
|
|
dba.InsertVertex().PropsSet(p1, PropertyValue("string"));
|
|
|
|
dba.InsertVertex().PropsSet(p1, PropertyValue("str2"));
|
2017-10-30 17:43:25 +08:00
|
|
|
auto p2 = dba.Property("p2"); // combines int and bool
|
2019-08-28 19:10:27 +08:00
|
|
|
dba.InsertVertex().PropsSet(p2, PropertyValue(42));
|
|
|
|
dba.InsertVertex().PropsSet(p2, PropertyValue(true));
|
2017-10-30 17:43:25 +08:00
|
|
|
dba.AdvanceCommand();
|
2017-04-11 21:11:48 +08:00
|
|
|
|
2018-05-22 22:45:52 +08:00
|
|
|
AstStorage storage;
|
2017-04-11 21:11:48 +08:00
|
|
|
SymbolTable symbol_table;
|
|
|
|
|
|
|
|
auto n = MakeScanAll(storage, symbol_table, "n");
|
2019-02-05 20:16:07 +08:00
|
|
|
auto n_p1 = PROPERTY_LOOKUP(IDENT("n")->MapTo(n.sym_), p1);
|
|
|
|
auto n_p2 = PROPERTY_LOOKUP(IDENT("n")->MapTo(n.sym_), p2);
|
2017-04-11 21:11:48 +08:00
|
|
|
|
|
|
|
auto aggregate = [&](Expression *expression, Aggregation::Op aggr_op) {
|
|
|
|
auto produce = MakeAggregationProduce(n.op_, symbol_table, storage,
|
|
|
|
{expression}, {aggr_op}, {}, {});
|
2019-09-11 22:10:53 +08:00
|
|
|
query::DbAccessor execution_dba(&dba);
|
|
|
|
auto context = MakeContext(storage, symbol_table, &execution_dba);
|
Remove GraphDbAccessor and storage types from Ast
Summary:
This diff removes the need for a database when parsing a query and
creating an Ast. Instead of storing storage::{Label,Property,EdgeType}
in Ast nodes, we store the name and an index into all of the names. This
allows for easy creation of a map from {Label,Property,EdgeType} index
into the concrete storage type. Obviously, this comes with a performance
penalty during execution, but it should be minor. The upside is that the
query/frontend minimally depends on storage (PropertyValue), which makes
writing tests easier as well as running them a lot faster (there is no
database setup). This is most noticeable in the ast_serialization test
which took a long time due to start up of a distributed database.
Reviewers: mtomic, llugovic
Reviewed By: mtomic
Subscribers: mferencevic, pullbot
Differential Revision: https://phabricator.memgraph.io/D1774
2019-01-14 21:41:37 +08:00
|
|
|
CollectProduce(*produce, &context);
|
2017-04-11 21:11:48 +08:00
|
|
|
};
|
|
|
|
|
Collect Map added
Summary:
Tests are on the way. Please first comment if you're OK with this implementation, some points are discussable.
What works now:
```
bash:MEMGRAPH_ROOT/build/>./tests/manual/console 10
MG>MATCH (n) RETURN COLLECT("age_" + n.age, n.height)
+-----------------------------------------------------------------------------------------------------------------------------------+
| COLLECT("age_" + n.age, n.height) |
+-----------------------------------------------------------------------------------------------------------------------------------+
| {age_10: 176, age_13: 180, age_24: 172, age_25: 179, age_32: 123, age_33: 186, age_37: 147, age_43: 162, age_49: 126, age_6: 170} |
+-----------------------------------------------------------------------------------------------------------------------------------+
```
Reviewers: mislav.bradac, teon.banek, buda
Reviewed By: mislav.bradac, buda
Subscribers: pullbot
Differential Revision: https://phabricator.memgraph.io/D695
2017-08-23 16:43:45 +08:00
|
|
|
// everything except for COUNT and COLLECT fails on a Vertex
|
2017-04-11 21:11:48 +08:00
|
|
|
auto n_id = n_p1->expression_;
|
|
|
|
aggregate(n_id, Aggregation::Op::COUNT);
|
Collect Map added
Summary:
Tests are on the way. Please first comment if you're OK with this implementation, some points are discussable.
What works now:
```
bash:MEMGRAPH_ROOT/build/>./tests/manual/console 10
MG>MATCH (n) RETURN COLLECT("age_" + n.age, n.height)
+-----------------------------------------------------------------------------------------------------------------------------------+
| COLLECT("age_" + n.age, n.height) |
+-----------------------------------------------------------------------------------------------------------------------------------+
| {age_10: 176, age_13: 180, age_24: 172, age_25: 179, age_32: 123, age_33: 186, age_37: 147, age_43: 162, age_49: 126, age_6: 170} |
+-----------------------------------------------------------------------------------------------------------------------------------+
```
Reviewers: mislav.bradac, teon.banek, buda
Reviewed By: mislav.bradac, buda
Subscribers: pullbot
Differential Revision: https://phabricator.memgraph.io/D695
2017-08-23 16:43:45 +08:00
|
|
|
aggregate(n_id, Aggregation::Op::COLLECT_LIST);
|
|
|
|
aggregate(n_id, Aggregation::Op::COLLECT_MAP);
|
2017-06-12 21:12:31 +08:00
|
|
|
EXPECT_THROW(aggregate(n_id, Aggregation::Op::MIN), QueryRuntimeException);
|
|
|
|
EXPECT_THROW(aggregate(n_id, Aggregation::Op::MAX), QueryRuntimeException);
|
|
|
|
EXPECT_THROW(aggregate(n_id, Aggregation::Op::AVG), QueryRuntimeException);
|
|
|
|
EXPECT_THROW(aggregate(n_id, Aggregation::Op::SUM), QueryRuntimeException);
|
2017-04-11 21:11:48 +08:00
|
|
|
|
|
|
|
// on strings AVG and SUM fail
|
|
|
|
aggregate(n_p1, Aggregation::Op::COUNT);
|
Collect Map added
Summary:
Tests are on the way. Please first comment if you're OK with this implementation, some points are discussable.
What works now:
```
bash:MEMGRAPH_ROOT/build/>./tests/manual/console 10
MG>MATCH (n) RETURN COLLECT("age_" + n.age, n.height)
+-----------------------------------------------------------------------------------------------------------------------------------+
| COLLECT("age_" + n.age, n.height) |
+-----------------------------------------------------------------------------------------------------------------------------------+
| {age_10: 176, age_13: 180, age_24: 172, age_25: 179, age_32: 123, age_33: 186, age_37: 147, age_43: 162, age_49: 126, age_6: 170} |
+-----------------------------------------------------------------------------------------------------------------------------------+
```
Reviewers: mislav.bradac, teon.banek, buda
Reviewed By: mislav.bradac, buda
Subscribers: pullbot
Differential Revision: https://phabricator.memgraph.io/D695
2017-08-23 16:43:45 +08:00
|
|
|
aggregate(n_p1, Aggregation::Op::COLLECT_LIST);
|
|
|
|
aggregate(n_p1, Aggregation::Op::COLLECT_MAP);
|
2017-04-11 21:11:48 +08:00
|
|
|
aggregate(n_p1, Aggregation::Op::MIN);
|
|
|
|
aggregate(n_p1, Aggregation::Op::MAX);
|
2017-06-12 21:12:31 +08:00
|
|
|
EXPECT_THROW(aggregate(n_p1, Aggregation::Op::AVG), QueryRuntimeException);
|
|
|
|
EXPECT_THROW(aggregate(n_p1, Aggregation::Op::SUM), QueryRuntimeException);
|
2017-04-11 21:11:48 +08:00
|
|
|
|
Collect Map added
Summary:
Tests are on the way. Please first comment if you're OK with this implementation, some points are discussable.
What works now:
```
bash:MEMGRAPH_ROOT/build/>./tests/manual/console 10
MG>MATCH (n) RETURN COLLECT("age_" + n.age, n.height)
+-----------------------------------------------------------------------------------------------------------------------------------+
| COLLECT("age_" + n.age, n.height) |
+-----------------------------------------------------------------------------------------------------------------------------------+
| {age_10: 176, age_13: 180, age_24: 172, age_25: 179, age_32: 123, age_33: 186, age_37: 147, age_43: 162, age_49: 126, age_6: 170} |
+-----------------------------------------------------------------------------------------------------------------------------------+
```
Reviewers: mislav.bradac, teon.banek, buda
Reviewed By: mislav.bradac, buda
Subscribers: pullbot
Differential Revision: https://phabricator.memgraph.io/D695
2017-08-23 16:43:45 +08:00
|
|
|
// combination of int and bool, everything except COUNT and COLLECT fails
|
2017-04-11 21:11:48 +08:00
|
|
|
aggregate(n_p2, Aggregation::Op::COUNT);
|
Collect Map added
Summary:
Tests are on the way. Please comment first on whether you're OK with this implementation; some points are open to discussion.
What works now:
```
bash:MEMGRAPH_ROOT/build/>./tests/manual/console 10
MG>MATCH (n) RETURN COLLECT("age_" + n.age, n.height)
+-----------------------------------------------------------------------------------------------------------------------------------+
| COLLECT("age_" + n.age, n.height) |
+-----------------------------------------------------------------------------------------------------------------------------------+
| {age_10: 176, age_13: 180, age_24: 172, age_25: 179, age_32: 123, age_33: 186, age_37: 147, age_43: 162, age_49: 126, age_6: 170} |
+-----------------------------------------------------------------------------------------------------------------------------------+
```
Reviewers: mislav.bradac, teon.banek, buda
Reviewed By: mislav.bradac, buda
Subscribers: pullbot
Differential Revision: https://phabricator.memgraph.io/D695
2017-08-23 16:43:45 +08:00
|
|
|
aggregate(n_p2, Aggregation::Op::COLLECT_LIST);
|
|
|
|
aggregate(n_p2, Aggregation::Op::COLLECT_MAP);
|
2017-06-12 21:12:31 +08:00
|
|
|
EXPECT_THROW(aggregate(n_p2, Aggregation::Op::MIN), QueryRuntimeException);
|
|
|
|
EXPECT_THROW(aggregate(n_p2, Aggregation::Op::MAX), QueryRuntimeException);
|
|
|
|
EXPECT_THROW(aggregate(n_p2, Aggregation::Op::AVG), QueryRuntimeException);
|
|
|
|
EXPECT_THROW(aggregate(n_p2, Aggregation::Op::SUM), QueryRuntimeException);
|
2017-04-11 21:11:48 +08:00
|
|
|
}
|
2017-04-28 21:14:28 +08:00
|
|
|
|
|
|
|
TEST(QueryPlan, Unwind) {
|
2018-10-09 17:09:10 +08:00
|
|
|
database::GraphDb db;
|
2018-07-26 15:08:21 +08:00
|
|
|
auto dba = db.Access();
|
2018-05-22 22:45:52 +08:00
|
|
|
AstStorage storage;
|
2017-04-28 21:14:28 +08:00
|
|
|
SymbolTable symbol_table;
|
|
|
|
|
|
|
|
// UNWIND [ [1, true, "x"], [], ["bla"] ] AS x UNWIND x as y RETURN x, y
|
Clean-up TypedValue misuse
Summary:
In a bunch of places `TypedValue` was used where `PropertyValue` should be. A lot of times it was only because `TypedValue` serialization code could be reused for `PropertyValue`, only without providing callbacks for `VERTEX`, `EDGE` and `PATH`. So first I wrote separate serialization code for `PropertyValue` and put it into storage folder. Then I fixed all the places where `TypedValue` was incorrectly used instead of `PropertyValue`. I also disabled implicit `TypedValue` to `PropertyValue` conversion in hopes of preventing misuse in the future.
After that, I wrote code for `VertexAccessor` and `EdgeAccessor` serialization and put it into `storage` folder because it was almost duplicated in distributed BFS and pull produce RPC messages. On the sender side, some subset of records (old or new or both) is serialized, and on the reciever side, records are deserialized and immediately put into transaction cache.
Then I rewrote the `TypedValue` serialization functions (`SaveCapnpTypedValue` and `LoadCapnpTypedValue`) to not take callbacks for `VERTEX`, `EDGE` and `PATH`, but use accessor serialization functions instead. That means that any code that wants to use `TypedValue` serialization must hold a reference to `GraphDbAccessor` and `DataManager`, so that should make clients reconsider if they really want to use `TypedValue` instead of `PropertyValue`.
Reviewers: teon.banek, msantl
Reviewed By: teon.banek
Subscribers: pullbot
Differential Revision: https://phabricator.memgraph.io/D1598
2018-09-13 18:12:07 +08:00
|
|
|
auto input_expr = storage.Create<PrimitiveLiteral>(std::vector<PropertyValue>{
|
2019-08-28 19:10:27 +08:00
|
|
|
PropertyValue(std::vector<PropertyValue>{
|
|
|
|
PropertyValue(1), PropertyValue(true), PropertyValue("x")}),
|
|
|
|
PropertyValue(std::vector<PropertyValue>{}),
|
|
|
|
PropertyValue(std::vector<PropertyValue>{PropertyValue("bla")})});
|
2017-04-28 21:14:28 +08:00
|
|
|
|
2017-05-12 17:37:22 +08:00
|
|
|
auto x = symbol_table.CreateSymbol("x", true);
|
2017-05-03 17:07:07 +08:00
|
|
|
auto unwind_0 = std::make_shared<plan::Unwind>(nullptr, input_expr, x);
|
2019-02-05 20:16:07 +08:00
|
|
|
auto x_expr = IDENT("x")->MapTo(x);
|
2017-05-12 17:37:22 +08:00
|
|
|
auto y = symbol_table.CreateSymbol("y", true);
|
2017-05-03 17:07:07 +08:00
|
|
|
auto unwind_1 = std::make_shared<plan::Unwind>(unwind_0, x_expr, y);
|
2017-04-28 21:14:28 +08:00
|
|
|
|
2019-02-05 20:16:07 +08:00
|
|
|
auto x_ne =
|
|
|
|
NEXPR("x", x_expr)->MapTo(symbol_table.CreateSymbol("x_ne", true));
|
|
|
|
auto y_ne = NEXPR("y", IDENT("y")->MapTo(y))
|
|
|
|
->MapTo(symbol_table.CreateSymbol("y_ne", true));
|
2017-04-28 21:14:28 +08:00
|
|
|
auto produce = MakeProduce(unwind_1, x_ne, y_ne);
|
|
|
|
|
2019-09-11 22:10:53 +08:00
|
|
|
query::DbAccessor execution_dba(&dba);
|
|
|
|
auto context = MakeContext(storage, symbol_table, &execution_dba);
|
Remove GraphDbAccessor and storage types from Ast
Summary:
This diff removes the need for a database when parsing a query and
creating an Ast. Instead of storing storage::{Label,Property,EdgeType}
in Ast nodes, we store the name and an index into all of the names. This
allows for easy creation of a map from {Label,Property,EdgeType} index
into the concrete storage type. Obviously, this comes with a performance
penalty during execution, but it should be minor. The upside is that the
query/frontend minimally depends on storage (PropertyValue), which makes
writing tests easier as well as running them a lot faster (there is no
database setup). This is most noticeable in the ast_serialization test
which took a long time due to start up of a distributed database.
Reviewers: mtomic, llugovic
Reviewed By: mtomic
Subscribers: mferencevic, pullbot
Differential Revision: https://phabricator.memgraph.io/D1774
2019-01-14 21:41:37 +08:00
|
|
|
auto results = CollectProduce(*produce, &context);
|
2017-04-28 21:14:28 +08:00
|
|
|
ASSERT_EQ(4, results.size());
|
|
|
|
const std::vector<int> expected_x_card{3, 3, 3, 1};
|
|
|
|
auto expected_x_card_it = expected_x_card.begin();
|
2019-06-05 21:50:29 +08:00
|
|
|
const std::vector<TypedValue> expected_y{TypedValue(1), TypedValue(true),
|
|
|
|
TypedValue("x"), TypedValue("bla")};
|
2017-04-28 21:14:28 +08:00
|
|
|
auto expected_y_it = expected_y.begin();
|
|
|
|
for (const auto &row : results) {
|
|
|
|
ASSERT_EQ(2, row.size());
|
|
|
|
ASSERT_EQ(row[0].type(), TypedValue::Type::List);
|
2019-06-05 21:50:29 +08:00
|
|
|
EXPECT_EQ(row[0].ValueList().size(), *expected_x_card_it);
|
2017-04-28 21:14:28 +08:00
|
|
|
EXPECT_EQ(row[1].type(), expected_y_it->type());
|
|
|
|
expected_x_card_it++;
|
|
|
|
expected_y_it++;
|
|
|
|
}
|
|
|
|
}
|