2022-02-22 20:33:45 +08:00
|
|
|
// Copyright 2022 Memgraph Ltd.
|
2021-10-26 14:53:56 +08:00
|
|
|
//
|
|
|
|
// Use of this software is governed by the Business Source License
|
|
|
|
// included in the file licenses/BSL.txt; by using this file, you agree to be bound by the terms of the Business Source
|
|
|
|
// License, and you may not use this file except in compliance with the Business Source License.
|
|
|
|
//
|
|
|
|
// As of the Change Date specified in that file, in accordance with
|
|
|
|
// the Business Source License, use of this software will be governed
|
|
|
|
// by the Apache License, Version 2.0, included in the file
|
|
|
|
// licenses/APL.txt.
|
|
|
|
|
2017-04-11 21:11:48 +08:00
|
|
|
#include <algorithm>
|
|
|
|
#include <iterator>
|
|
|
|
#include <memory>
|
|
|
|
#include <vector>
|
|
|
|
|
|
|
|
#include "gmock/gmock.h"
|
|
|
|
#include "gtest/gtest.h"
|
|
|
|
|
|
|
|
#include "query/context.hpp"
|
|
|
|
#include "query/exceptions.hpp"
|
2017-04-13 16:01:16 +08:00
|
|
|
#include "query/plan/operator.hpp"
|
2017-04-11 21:11:48 +08:00
|
|
|
#include "query_plan_common.hpp"
|
|
|
|
|
2022-02-22 20:33:45 +08:00
|
|
|
using namespace memgraph::query;
|
|
|
|
using namespace memgraph::query::plan;
|
|
|
|
using memgraph::query::test_common::ToIntList;
|
|
|
|
using memgraph::query::test_common::ToIntMap;
|
2017-10-30 17:43:25 +08:00
|
|
|
using testing::UnorderedElementsAre;
|
2017-04-11 21:11:48 +08:00
|
|
|
|
|
|
|
TEST(QueryPlan, Accumulate) {
  // Simulates running the following two queries against an empty database:
  //   CREATE ({x:0})-[:T]->({x:0})
  //   MATCH (n)--(m) SET n.x = n.x + 1, m.x = m.x + 1 RETURN n.x, m.x
  // Without accumulation the expected rows are [[1, 1], [2, 2]],
  // with accumulation they are [[2, 2], [2, 2]].

  // NOTE: `storage` and `dba` must keep these exact names; the AST helper macros used below are defined outside
  // this file and appear to refer to them by name.
  const auto run_scenario = [](const bool accumulate) {
    memgraph::storage::Storage db;
    auto storage_dba = db.Access();
    memgraph::query::DbAccessor dba(&storage_dba);
    auto prop = dba.NameToProperty("x");

    // Two vertices with x = 0, connected by a single edge of type T.
    auto from_vertex = dba.InsertVertex();
    ASSERT_TRUE(from_vertex.SetProperty(prop, memgraph::storage::PropertyValue(0)).HasValue());
    auto to_vertex = dba.InsertVertex();
    ASSERT_TRUE(to_vertex.SetProperty(prop, memgraph::storage::PropertyValue(0)).HasValue());
    ASSERT_TRUE(dba.InsertEdge(&from_vertex, &to_vertex, dba.NameToEdgeType("T")).HasValue());
    dba.AdvanceCommand();

    AstStorage storage;
    SymbolTable symbol_table;

    // MATCH (n)--(m)
    auto scan_n = MakeScanAll(storage, symbol_table, "n");
    auto expand_m = MakeExpand(storage, symbol_table, scan_n.op_, scan_n.sym_, "r", EdgeAtom::Direction::BOTH, {},
                               "m", false, memgraph::storage::View::OLD);

    // SET n.x = n.x + 1, m.x = m.x + 1
    auto increment = LITERAL(1);
    auto n_x = PROPERTY_LOOKUP(IDENT("n")->MapTo(scan_n.sym_), prop);
    auto set_n_x = std::make_shared<plan::SetProperty>(expand_m.op_, prop, n_x, ADD(n_x, increment));
    auto m_x = PROPERTY_LOOKUP(IDENT("m")->MapTo(expand_m.node_sym_), prop);
    auto set_m_x = std::make_shared<plan::SetProperty>(set_n_x, prop, m_x, ADD(m_x, increment));

    // Optionally put an Accumulate between the updates and the Produce.
    std::shared_ptr<LogicalOperator> plan_tail = set_m_x;
    if (accumulate) {
      plan_tail = std::make_shared<Accumulate>(plan_tail, std::vector<Symbol>{scan_n.sym_, expand_m.node_sym_});
    }

    // RETURN n.x, m.x
    auto returned_n = NEXPR("n.p", n_x)->MapTo(symbol_table.CreateSymbol("n_p_ne", true));
    auto returned_m = NEXPR("m.p", m_x)->MapTo(symbol_table.CreateSymbol("m_p_ne", true));
    auto produce = MakeProduce(plan_tail, returned_n, returned_m);
    auto context = MakeContext(storage, symbol_table, &dba);
    auto results = CollectProduce(*produce, &context);

    // Flatten the rows into one sequence so a single matcher can check them.
    std::vector<int> results_data;
    for (const auto &row : results) {
      for (const auto &column : row) {
        results_data.emplace_back(column.ValueInt());
      }
    }

    const std::vector<int> expected = accumulate ? std::vector<int>{2, 2, 2, 2} : std::vector<int>{1, 1, 2, 2};
    EXPECT_THAT(results_data, testing::ElementsAreArray(expected));
  };

  run_scenario(false);
  run_scenario(true);
}
|
|
|
|
|
|
|
|
TEST(QueryPlan, AccumulateAdvance) {
  // Simulates 'CREATE (n) WITH n AS n MATCH (m) RETURN m'.
  // The scan only sees the freshly created node when Accumulate advances the command, so one row is expected
  // with `advance` set and none without it.
  for (const bool advance : {false, true}) {
    memgraph::storage::Storage db;
    auto storage_dba = db.Access();
    memgraph::query::DbAccessor dba(&storage_dba);
    AstStorage storage;
    SymbolTable symbol_table;

    // CREATE (n)
    NodeCreationInfo created_node;
    created_node.symbol = symbol_table.CreateSymbol("n", true);
    auto create_op = std::make_shared<CreateNode>(nullptr, created_node);

    // WITH n AS n (accumulation point), followed by MATCH (m)
    auto accumulate_op = std::make_shared<Accumulate>(create_op, std::vector<Symbol>{created_node.symbol}, advance);
    auto scan_m = MakeScanAll(storage, symbol_table, "m", accumulate_op);

    auto context = MakeContext(storage, symbol_table, &dba);
    const int expected_rows = advance ? 1 : 0;
    EXPECT_EQ(expected_rows, PullAll(*scan_m.op_, &context));
  }
}
|
|
|
|
|
2021-02-18 22:32:43 +08:00
|
|
|
std::shared_ptr<Produce> MakeAggregationProduce(std::shared_ptr<LogicalOperator> input, SymbolTable &symbol_table,
|
|
|
|
AstStorage &storage, const std::vector<Expression *> aggr_inputs,
|
|
|
|
const std::vector<Aggregation::Op> aggr_ops,
|
|
|
|
const std::vector<Expression *> group_by_exprs,
|
2022-12-03 19:48:44 +08:00
|
|
|
const std::vector<Symbol> remember, const bool distinct) {
|
2017-04-11 21:11:48 +08:00
|
|
|
// prepare all the aggregations
|
|
|
|
std::vector<Aggregate::Element> aggregates;
|
|
|
|
std::vector<NamedExpression *> named_expressions;
|
|
|
|
|
|
|
|
auto aggr_inputs_it = aggr_inputs.begin();
|
|
|
|
for (auto aggr_op : aggr_ops) {
|
|
|
|
// TODO change this from using IDENT to using AGGREGATION
|
|
|
|
// once AGGREGATION is handled properly in ExpressionEvaluation
|
2019-02-05 20:16:07 +08:00
|
|
|
auto aggr_sym = symbol_table.CreateSymbol("aggregation", true);
|
|
|
|
auto named_expr =
|
2021-02-18 22:32:43 +08:00
|
|
|
NEXPR("", IDENT("aggregation")->MapTo(aggr_sym))->MapTo(symbol_table.CreateSymbol("named_expression", true));
|
2017-04-11 21:11:48 +08:00
|
|
|
named_expressions.push_back(named_expr);
|
Collect Map added
Summary:
Tests are on the way. Please first comment if you're OK with this implementation, some points are discussable.
What works now:
```
bash:MEMGRAPH_ROOT/build/>./tests/manual/console 10
MG>MATCH (n) RETURN COLLECT("age_" + n.age, n.height)
+-----------------------------------------------------------------------------------------------------------------------------------+
| COLLECT("age_" + n.age, n.height) |
+-----------------------------------------------------------------------------------------------------------------------------------+
| {age_10: 176, age_13: 180, age_24: 172, age_25: 179, age_32: 123, age_33: 186, age_37: 147, age_43: 162, age_49: 126, age_6: 170} |
+-----------------------------------------------------------------------------------------------------------------------------------+
```
Reviewers: mislav.bradac, teon.banek, buda
Reviewed By: mislav.bradac, buda
Subscribers: pullbot
Differential Revision: https://phabricator.memgraph.io/D695
2017-08-23 16:43:45 +08:00
|
|
|
// the key expression is only used in COLLECT_MAP
|
2021-02-18 22:32:43 +08:00
|
|
|
Expression *key_expr_ptr = aggr_op == Aggregation::Op::COLLECT_MAP ? LITERAL("key") : nullptr;
|
2022-12-03 19:48:44 +08:00
|
|
|
aggregates.emplace_back(Aggregate::Element{*aggr_inputs_it++, key_expr_ptr, aggr_op, aggr_sym, distinct});
|
2017-04-11 21:11:48 +08:00
|
|
|
}
|
|
|
|
|
Collect Map added
Summary:
Tests are on the way. Please first comment if you're OK with this implementation, some points are discussable.
What works now:
```
bash:MEMGRAPH_ROOT/build/>./tests/manual/console 10
MG>MATCH (n) RETURN COLLECT("age_" + n.age, n.height)
+-----------------------------------------------------------------------------------------------------------------------------------+
| COLLECT("age_" + n.age, n.height) |
+-----------------------------------------------------------------------------------------------------------------------------------+
| {age_10: 176, age_13: 180, age_24: 172, age_25: 179, age_32: 123, age_33: 186, age_37: 147, age_43: 162, age_49: 126, age_6: 170} |
+-----------------------------------------------------------------------------------------------------------------------------------+
```
Reviewers: mislav.bradac, teon.banek, buda
Reviewed By: mislav.bradac, buda
Subscribers: pullbot
Differential Revision: https://phabricator.memgraph.io/D695
2017-08-23 16:43:45 +08:00
|
|
|
// Produce will also evaluate group_by expressions and return them after the
|
|
|
|
// aggregations.
|
2017-04-11 21:11:48 +08:00
|
|
|
for (auto group_by_expr : group_by_exprs) {
|
2021-02-18 22:32:43 +08:00
|
|
|
auto named_expr = NEXPR("", group_by_expr)->MapTo(symbol_table.CreateSymbol("named_expression", true));
|
2017-04-11 21:11:48 +08:00
|
|
|
named_expressions.push_back(named_expr);
|
|
|
|
}
|
2021-02-18 22:32:43 +08:00
|
|
|
auto aggregation = std::make_shared<Aggregate>(input, aggregates, group_by_exprs, remember);
|
2017-04-11 21:11:48 +08:00
|
|
|
return std::make_shared<Produce>(aggregation, named_expressions);
|
|
|
|
}
|
|
|
|
|
Collect Map added
Summary:
Tests are on the way. Please first comment if you're OK with this implementation, some points are discussable.
What works now:
```
bash:MEMGRAPH_ROOT/build/>./tests/manual/console 10
MG>MATCH (n) RETURN COLLECT("age_" + n.age, n.height)
+-----------------------------------------------------------------------------------------------------------------------------------+
| COLLECT("age_" + n.age, n.height) |
+-----------------------------------------------------------------------------------------------------------------------------------+
| {age_10: 176, age_13: 180, age_24: 172, age_25: 179, age_32: 123, age_33: 186, age_37: 147, age_43: 162, age_49: 126, age_6: 170} |
+-----------------------------------------------------------------------------------------------------------------------------------+
```
Reviewers: mislav.bradac, teon.banek, buda
Reviewed By: mislav.bradac, buda
Subscribers: pullbot
Differential Revision: https://phabricator.memgraph.io/D695
2017-08-23 16:43:45 +08:00
|
|
|
/** Test fixture for all the aggregation ops in one return. */
|
2017-05-30 15:37:24 +08:00
|
|
|
class QueryPlanAggregateOps : public ::testing::Test {
|
|
|
|
protected:
|
2022-02-22 20:33:45 +08:00
|
|
|
memgraph::storage::Storage db;
|
|
|
|
memgraph::storage::Storage::Accessor storage_dba{db.Access()};
|
|
|
|
memgraph::query::DbAccessor dba{&storage_dba};
|
|
|
|
memgraph::storage::PropertyId prop = db.NameToProperty("prop");
|
2017-04-11 21:11:48 +08:00
|
|
|
|
2018-05-22 22:45:52 +08:00
|
|
|
AstStorage storage;
|
2017-04-11 21:11:48 +08:00
|
|
|
SymbolTable symbol_table;
|
|
|
|
|
2017-05-30 15:37:24 +08:00
|
|
|
void AddData() {
|
|
|
|
// setup is several nodes most of which have an int property set
|
|
|
|
// we will take the sum, avg, min, max and count
|
|
|
|
// we won't group by anything
|
2022-02-22 20:33:45 +08:00
|
|
|
ASSERT_TRUE(dba.InsertVertex().SetProperty(prop, memgraph::storage::PropertyValue(5)).HasValue());
|
|
|
|
ASSERT_TRUE(dba.InsertVertex().SetProperty(prop, memgraph::storage::PropertyValue(7)).HasValue());
|
|
|
|
ASSERT_TRUE(dba.InsertVertex().SetProperty(prop, memgraph::storage::PropertyValue(12)).HasValue());
|
2022-12-03 19:48:44 +08:00
|
|
|
ASSERT_TRUE(dba.InsertVertex().SetProperty(prop, memgraph::storage::PropertyValue(5)).HasValue());
|
|
|
|
ASSERT_TRUE(dba.InsertVertex().SetProperty(prop, memgraph::storage::PropertyValue(5)).HasValue());
|
|
|
|
ASSERT_TRUE(dba.InsertVertex().SetProperty(prop, memgraph::storage::PropertyValue(12)).HasValue());
|
|
|
|
|
2017-05-30 15:37:24 +08:00
|
|
|
// a missing property (null) gets ignored by all aggregations except
|
|
|
|
// COUNT(*)
|
2017-10-30 17:43:25 +08:00
|
|
|
dba.InsertVertex();
|
|
|
|
dba.AdvanceCommand();
|
2017-05-30 15:37:24 +08:00
|
|
|
}
|
2017-04-11 21:11:48 +08:00
|
|
|
|
2022-12-03 19:48:44 +08:00
|
|
|
auto AggregationResults(bool with_group_by, bool distinct,
|
|
|
|
std::vector<Aggregation::Op> ops = {
|
|
|
|
Aggregation::Op::COUNT, Aggregation::Op::COUNT, Aggregation::Op::MIN,
|
|
|
|
Aggregation::Op::MAX, Aggregation::Op::SUM, Aggregation::Op::AVG,
|
|
|
|
Aggregation::Op::COLLECT_LIST, Aggregation::Op::COLLECT_MAP}) {
|
2017-05-30 15:37:24 +08:00
|
|
|
// match all nodes and perform aggregations
|
|
|
|
auto n = MakeScanAll(storage, symbol_table, "n");
|
2019-02-05 20:16:07 +08:00
|
|
|
auto n_p = PROPERTY_LOOKUP(IDENT("n")->MapTo(n.sym_), prop);
|
2017-05-30 15:37:24 +08:00
|
|
|
|
Collect Map added
Summary:
Tests are on the way. Please first comment if you're OK with this implementation, some points are discussable.
What works now:
```
bash:MEMGRAPH_ROOT/build/>./tests/manual/console 10
MG>MATCH (n) RETURN COLLECT("age_" + n.age, n.height)
+-----------------------------------------------------------------------------------------------------------------------------------+
| COLLECT("age_" + n.age, n.height) |
+-----------------------------------------------------------------------------------------------------------------------------------+
| {age_10: 176, age_13: 180, age_24: 172, age_25: 179, age_32: 123, age_33: 186, age_37: 147, age_43: 162, age_49: 126, age_6: 170} |
+-----------------------------------------------------------------------------------------------------------------------------------+
```
Reviewers: mislav.bradac, teon.banek, buda
Reviewed By: mislav.bradac, buda
Subscribers: pullbot
Differential Revision: https://phabricator.memgraph.io/D695
2017-08-23 16:43:45 +08:00
|
|
|
std::vector<Expression *> aggregation_expressions(ops.size(), n_p);
|
2017-05-30 15:37:24 +08:00
|
|
|
std::vector<Expression *> group_bys;
|
|
|
|
if (with_group_by) group_bys.push_back(n_p);
|
|
|
|
aggregation_expressions[0] = nullptr;
|
2022-12-03 19:48:44 +08:00
|
|
|
auto produce =
|
|
|
|
MakeAggregationProduce(n.op_, symbol_table, storage, aggregation_expressions, ops, group_bys, {}, distinct);
|
2019-11-22 01:38:01 +08:00
|
|
|
auto context = MakeContext(storage, symbol_table, &dba);
|
Remove GraphDbAccessor and storage types from Ast
Summary:
This diff removes the need for a database when parsing a query and
creating an Ast. Instead of storing storage::{Label,Property,EdgeType}
in Ast nodes, we store the name and an index into all of the names. This
allows for easy creation of a map from {Label,Property,EdgeType} index
into the concrete storage type. Obviously, this comes with a performance
penalty during execution, but it should be minor. The upside is that the
query/frontend minimally depends on storage (PropertyValue), which makes
writing tests easier as well as running them a lot faster (there is no
database setup). This is most noticeable in the ast_serialization test
which took a long time due to start up of a distributed database.
Reviewers: mtomic, llugovic
Reviewed By: mtomic
Subscribers: mferencevic, pullbot
Differential Revision: https://phabricator.memgraph.io/D1774
2019-01-14 21:41:37 +08:00
|
|
|
return CollectProduce(*produce, &context);
|
2017-05-30 15:37:24 +08:00
|
|
|
}
|
|
|
|
};
|
|
|
|
|
|
|
|
TEST_F(QueryPlanAggregateOps, WithData) {
|
|
|
|
AddData();
|
2022-12-03 19:48:44 +08:00
|
|
|
auto results = AggregationResults(false, false);
|
2017-04-11 21:11:48 +08:00
|
|
|
|
|
|
|
ASSERT_EQ(results.size(), 1);
|
Collect Map added
Summary:
Tests are on the way. Please first comment if you're OK with this implementation, some points are discussable.
What works now:
```
bash:MEMGRAPH_ROOT/build/>./tests/manual/console 10
MG>MATCH (n) RETURN COLLECT("age_" + n.age, n.height)
+-----------------------------------------------------------------------------------------------------------------------------------+
| COLLECT("age_" + n.age, n.height) |
+-----------------------------------------------------------------------------------------------------------------------------------+
| {age_10: 176, age_13: 180, age_24: 172, age_25: 179, age_32: 123, age_33: 186, age_37: 147, age_43: 162, age_49: 126, age_6: 170} |
+-----------------------------------------------------------------------------------------------------------------------------------+
```
Reviewers: mislav.bradac, teon.banek, buda
Reviewed By: mislav.bradac, buda
Subscribers: pullbot
Differential Revision: https://phabricator.memgraph.io/D695
2017-08-23 16:43:45 +08:00
|
|
|
ASSERT_EQ(results[0].size(), 8);
|
2017-05-06 23:57:39 +08:00
|
|
|
// count(*)
|
2017-04-11 21:11:48 +08:00
|
|
|
ASSERT_EQ(results[0][0].type(), TypedValue::Type::Int);
|
2022-12-03 19:48:44 +08:00
|
|
|
EXPECT_EQ(results[0][0].ValueInt(), 7);
|
2017-05-06 23:57:39 +08:00
|
|
|
// count
|
2017-04-11 21:11:48 +08:00
|
|
|
ASSERT_EQ(results[0][1].type(), TypedValue::Type::Int);
|
2022-12-03 19:48:44 +08:00
|
|
|
EXPECT_EQ(results[0][1].ValueInt(), 6);
|
2017-05-06 23:57:39 +08:00
|
|
|
// min
|
2017-04-11 21:11:48 +08:00
|
|
|
ASSERT_EQ(results[0][2].type(), TypedValue::Type::Int);
|
2019-08-22 20:50:57 +08:00
|
|
|
EXPECT_EQ(results[0][2].ValueInt(), 5);
|
2017-05-06 23:57:39 +08:00
|
|
|
// max
|
2017-04-11 21:11:48 +08:00
|
|
|
ASSERT_EQ(results[0][3].type(), TypedValue::Type::Int);
|
2019-08-22 20:50:57 +08:00
|
|
|
EXPECT_EQ(results[0][3].ValueInt(), 12);
|
2017-05-06 23:57:39 +08:00
|
|
|
// sum
|
|
|
|
ASSERT_EQ(results[0][4].type(), TypedValue::Type::Int);
|
2022-12-03 19:48:44 +08:00
|
|
|
EXPECT_EQ(results[0][4].ValueInt(), 46);
|
2017-04-11 21:11:48 +08:00
|
|
|
// avg
|
2017-05-06 23:57:39 +08:00
|
|
|
ASSERT_EQ(results[0][5].type(), TypedValue::Type::Double);
|
2022-12-03 19:48:44 +08:00
|
|
|
EXPECT_FLOAT_EQ(results[0][5].ValueDouble(), 46 / 6.0);
|
Collect Map added
Summary:
Tests are on the way. Please first comment if you're OK with this implementation, some points are discussable.
What works now:
```
bash:MEMGRAPH_ROOT/build/>./tests/manual/console 10
MG>MATCH (n) RETURN COLLECT("age_" + n.age, n.height)
+-----------------------------------------------------------------------------------------------------------------------------------+
| COLLECT("age_" + n.age, n.height) |
+-----------------------------------------------------------------------------------------------------------------------------------+
| {age_10: 176, age_13: 180, age_24: 172, age_25: 179, age_32: 123, age_33: 186, age_37: 147, age_43: 162, age_49: 126, age_6: 170} |
+-----------------------------------------------------------------------------------------------------------------------------------+
```
Reviewers: mislav.bradac, teon.banek, buda
Reviewed By: mislav.bradac, buda
Subscribers: pullbot
Differential Revision: https://phabricator.memgraph.io/D695
2017-08-23 16:43:45 +08:00
|
|
|
// collect list
|
2017-05-19 21:49:25 +08:00
|
|
|
ASSERT_EQ(results[0][6].type(), TypedValue::Type::List);
|
2022-12-03 19:48:44 +08:00
|
|
|
EXPECT_THAT(ToIntList(results[0][6]), UnorderedElementsAre(5, 7, 12, 5, 5, 12));
|
Collect Map added
Summary:
Tests are on the way. Please first comment if you're OK with this implementation, some points are discussable.
What works now:
```
bash:MEMGRAPH_ROOT/build/>./tests/manual/console 10
MG>MATCH (n) RETURN COLLECT("age_" + n.age, n.height)
+-----------------------------------------------------------------------------------------------------------------------------------+
| COLLECT("age_" + n.age, n.height) |
+-----------------------------------------------------------------------------------------------------------------------------------+
| {age_10: 176, age_13: 180, age_24: 172, age_25: 179, age_32: 123, age_33: 186, age_37: 147, age_43: 162, age_49: 126, age_6: 170} |
+-----------------------------------------------------------------------------------------------------------------------------------+
```
Reviewers: mislav.bradac, teon.banek, buda
Reviewed By: mislav.bradac, buda
Subscribers: pullbot
Differential Revision: https://phabricator.memgraph.io/D695
2017-08-23 16:43:45 +08:00
|
|
|
// collect map
|
|
|
|
ASSERT_EQ(results[0][7].type(), TypedValue::Type::Map);
|
2019-08-22 20:50:57 +08:00
|
|
|
auto map = ToIntMap(results[0][7]);
|
Collect Map added
Summary:
Tests are on the way. Please first comment if you're OK with this implementation, some points are discussable.
What works now:
```
bash:MEMGRAPH_ROOT/build/>./tests/manual/console 10
MG>MATCH (n) RETURN COLLECT("age_" + n.age, n.height)
+-----------------------------------------------------------------------------------------------------------------------------------+
| COLLECT("age_" + n.age, n.height) |
+-----------------------------------------------------------------------------------------------------------------------------------+
| {age_10: 176, age_13: 180, age_24: 172, age_25: 179, age_32: 123, age_33: 186, age_37: 147, age_43: 162, age_49: 126, age_6: 170} |
+-----------------------------------------------------------------------------------------------------------------------------------+
```
Reviewers: mislav.bradac, teon.banek, buda
Reviewed By: mislav.bradac, buda
Subscribers: pullbot
Differential Revision: https://phabricator.memgraph.io/D695
2017-08-23 16:43:45 +08:00
|
|
|
ASSERT_EQ(map.size(), 1);
|
|
|
|
EXPECT_EQ(map.begin()->first, "key");
|
|
|
|
EXPECT_FALSE(std::set<int>({5, 7, 12}).insert(map.begin()->second).second);
|
2017-04-11 21:11:48 +08:00
|
|
|
}
|
|
|
|
|
2017-05-30 15:37:24 +08:00
|
|
|
TEST_F(QueryPlanAggregateOps, WithoutDataWithGroupBy) {
  // Runs each aggregation on its own, grouped by n.prop, against an empty database and checks the single row it
  // produces. The row count is checked with ASSERT_* (not EXPECT_*) because the following lines index into
  // results[0]; a non-fatal check would let the test read out of bounds when the count is wrong.
  {
    auto results = AggregationResults(true, false, {Aggregation::Op::COUNT});
    ASSERT_EQ(results.size(), 1);
    ASSERT_EQ(results[0][0].type(), TypedValue::Type::Int);
    EXPECT_EQ(results[0][0].ValueInt(), 0);
  }
  {
    auto results = AggregationResults(true, false, {Aggregation::Op::SUM});
    ASSERT_EQ(results.size(), 1);
    ASSERT_EQ(results[0][0].type(), TypedValue::Type::Int);
    EXPECT_EQ(results[0][0].ValueInt(), 0);
  }
  {
    auto results = AggregationResults(true, false, {Aggregation::Op::AVG});
    ASSERT_EQ(results.size(), 1);
    EXPECT_EQ(results[0][0].type(), TypedValue::Type::Null);
  }
  {
    auto results = AggregationResults(true, false, {Aggregation::Op::MIN});
    ASSERT_EQ(results.size(), 1);
    EXPECT_EQ(results[0][0].type(), TypedValue::Type::Null);
  }
  {
    auto results = AggregationResults(true, false, {Aggregation::Op::MAX});
    ASSERT_EQ(results.size(), 1);
    EXPECT_EQ(results[0][0].type(), TypedValue::Type::Null);
  }
  {
    auto results = AggregationResults(true, false, {Aggregation::Op::COLLECT_LIST});
    ASSERT_EQ(results.size(), 1);
    EXPECT_EQ(results[0][0].type(), TypedValue::Type::List);
  }
  {
    auto results = AggregationResults(true, false, {Aggregation::Op::COLLECT_MAP});
    ASSERT_EQ(results.size(), 1);
    EXPECT_EQ(results[0][0].type(), TypedValue::Type::Map);
  }
}
|
|
|
|
|
|
|
|
TEST_F(QueryPlanAggregateOps, WithoutDataWithoutGroupBy) {
  // All aggregations over an empty database, without grouping: a single row with eight columns is expected.
  auto results = AggregationResults(false, false);
  ASSERT_EQ(results.size(), 1);
  ASSERT_EQ(results[0].size(), 8);
  const auto &row = results[0];

  // count(*) and count are both zero
  ASSERT_EQ(row[0].type(), TypedValue::Type::Int);
  EXPECT_EQ(row[0].ValueInt(), 0);
  ASSERT_EQ(row[1].type(), TypedValue::Type::Int);
  EXPECT_EQ(row[1].ValueInt(), 0);

  // min and max have nothing to pick from
  EXPECT_TRUE(row[2].IsNull());
  EXPECT_TRUE(row[3].IsNull());

  // sum of nothing is zero
  EXPECT_EQ(row[4].ValueInt(), 0);

  // avg of nothing is null
  EXPECT_TRUE(row[5].IsNull());

  // collect list yields an empty list
  ASSERT_EQ(row[6].type(), TypedValue::Type::List);
  EXPECT_TRUE(ToIntList(row[6]).empty());

  // collect map yields an empty map
  ASSERT_EQ(row[7].type(), TypedValue::Type::Map);
  EXPECT_TRUE(ToIntMap(row[7]).empty());
}
|
|
|
|
|
2017-04-11 21:11:48 +08:00
|
|
|
TEST(QueryPlan, AggregateGroupByValues) {
  // Tests that distinct groups are aggregated properly for values of all types.
  // Also test the "remember" part of the Aggregation API as final results are
  // obtained via a property lookup of a remembered node.
  memgraph::storage::Storage db;
  auto storage_dba = db.Access();
  memgraph::query::DbAccessor dba(&storage_dba);

  // Number of trailing entries in `group_by_vals` that compare equal to an
  // earlier entry and therefore must not produce a group of their own.
  // Keep this in sync with the "should NOT result in another group" entries.
  constexpr int kDuplicateVals = 2;

  // a vector of memgraph::storage::PropertyValue to be set as property values on vertices
  // most of them should result in a distinct group (commented where not)
  std::vector<memgraph::storage::PropertyValue> group_by_vals;
  group_by_vals.emplace_back(4);
  group_by_vals.emplace_back(7);
  group_by_vals.emplace_back(7.3);
  group_by_vals.emplace_back(7.2);
  group_by_vals.emplace_back("Johhny");
  group_by_vals.emplace_back("Jane");
  group_by_vals.emplace_back("1");
  group_by_vals.emplace_back(true);
  group_by_vals.emplace_back(false);
  group_by_vals.emplace_back(std::vector<memgraph::storage::PropertyValue>{memgraph::storage::PropertyValue(1)});
  group_by_vals.emplace_back(std::vector<memgraph::storage::PropertyValue>{memgraph::storage::PropertyValue(1),
                                                                           memgraph::storage::PropertyValue(2)});
  group_by_vals.emplace_back(std::vector<memgraph::storage::PropertyValue>{memgraph::storage::PropertyValue(2),
                                                                           memgraph::storage::PropertyValue(1)});
  group_by_vals.emplace_back(memgraph::storage::PropertyValue());
  // should NOT result in another group because 7.0 == 7
  group_by_vals.emplace_back(7.0);
  // should NOT result in another group
  group_by_vals.emplace_back(std::vector<memgraph::storage::PropertyValue>{memgraph::storage::PropertyValue(1),
                                                                           memgraph::storage::PropertyValue(2.0)});

  const auto expected_group_count = group_by_vals.size() - kDuplicateVals;

  // generate a lot of vertices and set props on them, cycling through the values
  auto prop = dba.NameToProperty("prop");
  for (int i = 0; i < 1000; ++i) {
    ASSERT_TRUE(dba.InsertVertex().SetProperty(prop, group_by_vals[i % group_by_vals.size()]).HasValue());
  }
  dba.AdvanceCommand();

  AstStorage storage;
  SymbolTable symbol_table;

  // match all nodes and perform aggregations
  auto n = MakeScanAll(storage, symbol_table, "n");
  auto n_p = PROPERTY_LOOKUP(IDENT("n")->MapTo(n.sym_), prop);

  auto produce =
      MakeAggregationProduce(n.op_, symbol_table, storage, {n_p}, {Aggregation::Op::COUNT}, {n_p}, {n.sym_}, false);

  auto context = MakeContext(storage, symbol_table, &dba);
  auto results = CollectProduce(*produce, &context);
  ASSERT_EQ(results.size(), expected_group_count);

  // Collect the group-by value (second column) of every row; the set
  // collapses values that compare equal under TypedValue::BoolEqual.
  std::unordered_set<TypedValue, TypedValue::Hash, TypedValue::BoolEqual> result_group_bys;
  for (const auto &row : results) {
    ASSERT_EQ(2, row.size());
    result_group_bys.insert(row[1]);
  }
  ASSERT_EQ(result_group_bys.size(), expected_group_count);

  std::vector<TypedValue> group_by_tvals;
  group_by_tvals.reserve(group_by_vals.size());
  for (const auto &v : group_by_vals) group_by_tvals.emplace_back(v);

  // Compare against the distinct inputs only (duplicates are at the tail).
  // The bounded overload is used so a size mismatch can never read past the
  // end of `result_group_bys`.
  EXPECT_TRUE(std::is_permutation(group_by_tvals.begin(), group_by_tvals.end() - kDuplicateVals,
                                  result_group_bys.begin(), result_group_bys.end(), TypedValue::BoolEqual{}));
}
|
|
|
|
|
|
|
|
TEST(QueryPlan, AggregateMultipleGroupBy) {
  // Three properties cycle with periods 2, 3 and 5 over the inserted
  // vertices. Grouping by all three at once is expected to yield one group
  // per vertex, i.e. 2 * 3 * 5 result rows.
  // NOTE(review): IDENT / PROPERTY_LOOKUP are macros defined outside this
  // chunk and presumably pick up `storage` / `dba` by name, so those locals
  // keep their names — confirm before renaming.
  constexpr int kVertexCount = 2 * 3 * 5;

  memgraph::storage::Storage db;
  auto storage_dba = db.Access();
  memgraph::query::DbAccessor dba(&storage_dba);

  auto prop1 = dba.NameToProperty("prop1");
  auto prop2 = dba.NameToProperty("prop2");
  auto prop3 = dba.NameToProperty("prop3");

  for (int i = 0; i < kVertexCount; ++i) {
    auto vertex = dba.InsertVertex();
    // prop1: bool, prop2: int in [0, 3), prop3: string "value0".."value4"
    ASSERT_TRUE(vertex.SetProperty(prop1, memgraph::storage::PropertyValue(static_cast<bool>(i % 2))).HasValue());
    ASSERT_TRUE(vertex.SetProperty(prop2, memgraph::storage::PropertyValue(i % 3)).HasValue());
    ASSERT_TRUE(
        vertex.SetProperty(prop3, memgraph::storage::PropertyValue("value" + std::to_string(i % 5))).HasValue());
  }
  dba.AdvanceCommand();

  AstStorage storage;
  SymbolTable symbol_table;

  // scan every vertex, then COUNT(n.prop1) grouped by (prop1, prop2, prop3)
  auto n = MakeScanAll(storage, symbol_table, "n");
  auto n_p1 = PROPERTY_LOOKUP(IDENT("n")->MapTo(n.sym_), prop1);
  auto n_p2 = PROPERTY_LOOKUP(IDENT("n")->MapTo(n.sym_), prop2);
  auto n_p3 = PROPERTY_LOOKUP(IDENT("n")->MapTo(n.sym_), prop3);

  auto produce = MakeAggregationProduce(n.op_, symbol_table, storage, {n_p1}, {Aggregation::Op::COUNT},
                                        {n_p1, n_p2, n_p3}, {n.sym_}, false);

  auto context = MakeContext(storage, symbol_table, &dba);
  auto results = CollectProduce(*produce, &context);
  EXPECT_EQ(results.size(), kVertexCount);
}
|
|
|
|
|
2017-04-13 22:47:11 +08:00
|
|
|
TEST(QueryPlan, AggregateNoInput) {
  // Aggregation built with a null input operator: COUNT over the literal 2
  // is expected to yield exactly one row holding the integer 1.
  memgraph::storage::Storage db;
  auto storage_dba = db.Access();
  memgraph::query::DbAccessor dba(&storage_dba);
  AstStorage storage;
  SymbolTable symbol_table;

  auto two = LITERAL(2);
  auto produce = MakeAggregationProduce(nullptr, symbol_table, storage, {two}, {Aggregation::Op::COUNT}, {}, {}, false);
  auto context = MakeContext(storage, symbol_table, &dba);
  auto results = CollectProduce(*produce, &context);

  // Fatal assertions: the checks below index into `results`, so continuing
  // after a size mismatch would read out of bounds.
  ASSERT_EQ(1, results.size());
  ASSERT_EQ(1, results[0].size());
  // Fatal as well: ValueInt() is only meaningful for an Int value.
  ASSERT_EQ(TypedValue::Type::Int, results[0][0].type());
  EXPECT_EQ(1, results[0][0].ValueInt());
}
|
|
|
|
|
2017-04-12 21:47:55 +08:00
|
|
|
TEST(QueryPlan, AggregateCountEdgeCases) {
  // Regression coverage for bugs detected in the COUNT aggregation.
  // COUNT(n.prop) must be correct when the database holds:
  //  - 0 vertices
  //  - 1 vertex, property not set
  //  - 1 vertex, property set
  //  - 2 vertices, property set on one
  //  - 2 vertices, property set on both
  // NOTE(review): IDENT / PROPERTY_LOOKUP are macros defined outside this
  // chunk and presumably pick up `storage` / `dba` by name, so those locals
  // keep their names — confirm before renaming.

  memgraph::storage::Storage db;
  auto storage_dba = db.Access();
  memgraph::query::DbAccessor dba(&storage_dba);
  auto prop = dba.NameToProperty("prop");

  AstStorage storage;
  SymbolTable symbol_table;

  auto n = MakeScanAll(storage, symbol_table, "n");
  auto n_p = PROPERTY_LOOKUP(IDENT("n")->MapTo(n.sym_), prop);

  // Runs MATCH (n) RETURN count(n.prop) against the current database state.
  // Yields -1 when the plan produces no rows at all, otherwise the single
  // integer found in the first row.
  auto run_count = [&]() {
    auto produce = MakeAggregationProduce(n.op_, symbol_table, storage, {n_p}, {Aggregation::Op::COUNT}, {}, {}, false);
    auto context = MakeContext(storage, symbol_table, &dba);
    auto results = CollectProduce(*produce, &context);
    if (results.size() == 0) return -1L;
    // Non-fatal checks only: ASSERT_* cannot be used in a value-returning lambda.
    EXPECT_EQ(1, results.size());
    EXPECT_EQ(1, results[0].size());
    EXPECT_EQ(TypedValue::Type::Int, results[0][0].type());
    return results[0][0].ValueInt();
  };

  // empty database
  EXPECT_EQ(0, run_count());

  // a single vertex without the property
  dba.InsertVertex();
  dba.AdvanceCommand();
  EXPECT_EQ(0, run_count());

  // a single vertex with the property
  for (auto vertex : dba.Vertices(memgraph::storage::View::OLD)) {
    ASSERT_TRUE(vertex.SetProperty(prop, memgraph::storage::PropertyValue(42)).HasValue());
  }
  dba.AdvanceCommand();
  EXPECT_EQ(1, run_count());

  // two vertices, only the first has the property
  dba.InsertVertex();
  dba.AdvanceCommand();
  EXPECT_EQ(1, run_count());

  // two vertices, both have the property
  for (auto vertex : dba.Vertices(memgraph::storage::View::OLD)) {
    ASSERT_TRUE(vertex.SetProperty(prop, memgraph::storage::PropertyValue(42)).HasValue());
  }
  dba.AdvanceCommand();
  EXPECT_EQ(2, run_count());
}
|
|
|
|
|
2017-04-14 23:14:14 +08:00
|
|
|
TEST(QueryPlan, AggregateFirstValueTypes) {
  // testing exceptions that get emitted by the first-value
  // type check
  //
  // The database holds a single vertex, so every aggregation below sees
  // exactly one input value.

  memgraph::storage::Storage db;
  auto storage_dba = db.Access();
  memgraph::query::DbAccessor dba(&storage_dba);

  auto v1 = dba.InsertVertex();
  auto prop_string = dba.NameToProperty("string");
  ASSERT_TRUE(v1.SetProperty(prop_string, memgraph::storage::PropertyValue("johhny")).HasValue());
  auto prop_int = dba.NameToProperty("int");
  ASSERT_TRUE(v1.SetProperty(prop_int, memgraph::storage::PropertyValue(12)).HasValue());
  dba.AdvanceCommand();

  AstStorage storage;
  SymbolTable symbol_table;

  auto n = MakeScanAll(storage, symbol_table, "n");
  auto n_prop_string = PROPERTY_LOOKUP(IDENT("n")->MapTo(n.sym_), prop_string);
  auto n_prop_int = PROPERTY_LOOKUP(IDENT("n")->MapTo(n.sym_), prop_int);
  // the expression the property lookup is applied to, i.e. `n` itself
  auto n_id = n_prop_string->expression_;

  // Builds and fully executes an aggregation of `aggr_op` over `expression`;
  // the produced rows are discarded, only a thrown exception matters here.
  auto aggregate = [&](Expression *expression, Aggregation::Op aggr_op) {
    auto produce = MakeAggregationProduce(n.op_, symbol_table, storage, {expression}, {aggr_op}, {}, {}, false);
    auto context = MakeContext(storage, symbol_table, &dba);
    CollectProduce(*produce, &context);
  };

  // Expected-success calls are wrapped in EXPECT_NO_THROW so an unexpected
  // exception is reported against the offending aggregation and the
  // remaining checks still run.

  // everything except for COUNT and COLLECT fails on a Vertex
  // (COLLECT on the vertex is not exercised in this test)
  EXPECT_NO_THROW(aggregate(n_id, Aggregation::Op::COUNT));
  EXPECT_THROW(aggregate(n_id, Aggregation::Op::MIN), QueryRuntimeException);
  EXPECT_THROW(aggregate(n_id, Aggregation::Op::MAX), QueryRuntimeException);
  EXPECT_THROW(aggregate(n_id, Aggregation::Op::AVG), QueryRuntimeException);
  EXPECT_THROW(aggregate(n_id, Aggregation::Op::SUM), QueryRuntimeException);

  // on strings AVG and SUM fail
  EXPECT_NO_THROW(aggregate(n_prop_string, Aggregation::Op::COUNT));
  EXPECT_NO_THROW(aggregate(n_prop_string, Aggregation::Op::MIN));
  EXPECT_NO_THROW(aggregate(n_prop_string, Aggregation::Op::MAX));
  EXPECT_THROW(aggregate(n_prop_string, Aggregation::Op::AVG), QueryRuntimeException);
  EXPECT_THROW(aggregate(n_prop_string, Aggregation::Op::SUM), QueryRuntimeException);

  // on ints nothing fails
  EXPECT_NO_THROW(aggregate(n_prop_int, Aggregation::Op::COUNT));
  EXPECT_NO_THROW(aggregate(n_prop_int, Aggregation::Op::MIN));
  EXPECT_NO_THROW(aggregate(n_prop_int, Aggregation::Op::MAX));
  EXPECT_NO_THROW(aggregate(n_prop_int, Aggregation::Op::AVG));
  EXPECT_NO_THROW(aggregate(n_prop_int, Aggregation::Op::SUM));
  EXPECT_NO_THROW(aggregate(n_prop_int, Aggregation::Op::COLLECT_LIST));
  EXPECT_NO_THROW(aggregate(n_prop_int, Aggregation::Op::COLLECT_MAP));
}
|
|
|
|
|
2017-04-11 21:11:48 +08:00
|
|
|
TEST(QueryPlan, AggregateTypes) {
|
|
|
|
// testing exceptions that can get emitted by an aggregation
|
|
|
|
// does not check all combinations that can result in an exception
|
|
|
|
// (that logic is defined and tested by TypedValue)
|
|
|
|
|
2022-02-22 20:33:45 +08:00
|
|
|
memgraph::storage::Storage db;
|
2019-11-22 01:38:01 +08:00
|
|
|
auto storage_dba = db.Access();
|
2022-02-22 20:33:45 +08:00
|
|
|
memgraph::query::DbAccessor dba(&storage_dba);
|
2019-11-22 01:38:01 +08:00
|
|
|
|
|
|
|
auto p1 = dba.NameToProperty("p1"); // has only string props
|
2022-02-22 20:33:45 +08:00
|
|
|
ASSERT_TRUE(dba.InsertVertex().SetProperty(p1, memgraph::storage::PropertyValue("string")).HasValue());
|
|
|
|
ASSERT_TRUE(dba.InsertVertex().SetProperty(p1, memgraph::storage::PropertyValue("str2")).HasValue());
|
2019-11-22 01:38:01 +08:00
|
|
|
auto p2 = dba.NameToProperty("p2"); // combines int and bool
|
2022-02-22 20:33:45 +08:00
|
|
|
ASSERT_TRUE(dba.InsertVertex().SetProperty(p2, memgraph::storage::PropertyValue(42)).HasValue());
|
|
|
|
ASSERT_TRUE(dba.InsertVertex().SetProperty(p2, memgraph::storage::PropertyValue(true)).HasValue());
|
2017-10-30 17:43:25 +08:00
|
|
|
dba.AdvanceCommand();
|
2017-04-11 21:11:48 +08:00
|
|
|
|
2018-05-22 22:45:52 +08:00
|
|
|
AstStorage storage;
|
2017-04-11 21:11:48 +08:00
|
|
|
SymbolTable symbol_table;
|
|
|
|
|
|
|
|
auto n = MakeScanAll(storage, symbol_table, "n");
|
2019-02-05 20:16:07 +08:00
|
|
|
auto n_p1 = PROPERTY_LOOKUP(IDENT("n")->MapTo(n.sym_), p1);
|
|
|
|
auto n_p2 = PROPERTY_LOOKUP(IDENT("n")->MapTo(n.sym_), p2);
|
2017-04-11 21:11:48 +08:00
|
|
|
|
|
|
|
auto aggregate = [&](Expression *expression, Aggregation::Op aggr_op) {
|
2022-12-03 19:48:44 +08:00
|
|
|
auto produce = MakeAggregationProduce(n.op_, symbol_table, storage, {expression}, {aggr_op}, {}, {}, false);
|
2019-11-22 01:38:01 +08:00
|
|
|
auto context = MakeContext(storage, symbol_table, &dba);
|
Remove GraphDbAccessor and storage types from Ast
Summary:
This diff removes the need for a database when parsing a query and
creating an Ast. Instead of storing storage::{Label,Property,EdgeType}
in Ast nodes, we store the name and an index into all of the names. This
allows for easy creation of a map from {Label,Property,EdgeType} index
into the concrete storage type. Obviously, this comes with a performance
penalty during execution, but it should be minor. The upside is that the
query/frontend minimally depends on storage (PropertyValue), which makes
writing tests easier as well as running them a lot faster (there is no
database setup). This is most noticeable in the ast_serialization test
which took a long time due to start up of a distributed database.
Reviewers: mtomic, llugovic
Reviewed By: mtomic
Subscribers: mferencevic, pullbot
Differential Revision: https://phabricator.memgraph.io/D1774
2019-01-14 21:41:37 +08:00
|
|
|
CollectProduce(*produce, &context);
|
2017-04-11 21:11:48 +08:00
|
|
|
};
|
|
|
|
|
Collect Map added
Summary:
Tests are on the way. Please first comment if you're OK with this implementation, some points are discussable.
What works now:
```
bash:MEMGRAPH_ROOT/build/>./tests/manual/console 10
MG>MATCH (n) RETURN COLLECT("age_" + n.age, n.height)
+-----------------------------------------------------------------------------------------------------------------------------------+
| COLLECT("age_" + n.age, n.height) |
+-----------------------------------------------------------------------------------------------------------------------------------+
| {age_10: 176, age_13: 180, age_24: 172, age_25: 179, age_32: 123, age_33: 186, age_37: 147, age_43: 162, age_49: 126, age_6: 170} |
+-----------------------------------------------------------------------------------------------------------------------------------+
```
Reviewers: mislav.bradac, teon.banek, buda
Reviewed By: mislav.bradac, buda
Subscribers: pullbot
Differential Revision: https://phabricator.memgraph.io/D695
2017-08-23 16:43:45 +08:00
|
|
|
// everything except for COUNT and COLLECT fails on a Vertex
|
2017-04-11 21:11:48 +08:00
|
|
|
auto n_id = n_p1->expression_;
|
|
|
|
aggregate(n_id, Aggregation::Op::COUNT);
|
Collect Map added
Summary:
Tests are on the way. Please first comment if you're OK with this implementation, some points are discussable.
What works now:
```
bash:MEMGRAPH_ROOT/build/>./tests/manual/console 10
MG>MATCH (n) RETURN COLLECT("age_" + n.age, n.height)
+-----------------------------------------------------------------------------------------------------------------------------------+
| COLLECT("age_" + n.age, n.height) |
+-----------------------------------------------------------------------------------------------------------------------------------+
| {age_10: 176, age_13: 180, age_24: 172, age_25: 179, age_32: 123, age_33: 186, age_37: 147, age_43: 162, age_49: 126, age_6: 170} |
+-----------------------------------------------------------------------------------------------------------------------------------+
```
Reviewers: mislav.bradac, teon.banek, buda
Reviewed By: mislav.bradac, buda
Subscribers: pullbot
Differential Revision: https://phabricator.memgraph.io/D695
2017-08-23 16:43:45 +08:00
|
|
|
aggregate(n_id, Aggregation::Op::COLLECT_LIST);
|
|
|
|
aggregate(n_id, Aggregation::Op::COLLECT_MAP);
|
2017-06-12 21:12:31 +08:00
|
|
|
EXPECT_THROW(aggregate(n_id, Aggregation::Op::MIN), QueryRuntimeException);
|
|
|
|
EXPECT_THROW(aggregate(n_id, Aggregation::Op::MAX), QueryRuntimeException);
|
|
|
|
EXPECT_THROW(aggregate(n_id, Aggregation::Op::AVG), QueryRuntimeException);
|
|
|
|
EXPECT_THROW(aggregate(n_id, Aggregation::Op::SUM), QueryRuntimeException);
|
2017-04-11 21:11:48 +08:00
|
|
|
|
|
|
|
// on strings AVG and SUM fail
|
|
|
|
aggregate(n_p1, Aggregation::Op::COUNT);
|
Collect Map added
Summary:
Tests are on the way. Please first comment if you're OK with this implementation, some points are discussable.
What works now:
```
bash:MEMGRAPH_ROOT/build/>./tests/manual/console 10
MG>MATCH (n) RETURN COLLECT("age_" + n.age, n.height)
+-----------------------------------------------------------------------------------------------------------------------------------+
| COLLECT("age_" + n.age, n.height) |
+-----------------------------------------------------------------------------------------------------------------------------------+
| {age_10: 176, age_13: 180, age_24: 172, age_25: 179, age_32: 123, age_33: 186, age_37: 147, age_43: 162, age_49: 126, age_6: 170} |
+-----------------------------------------------------------------------------------------------------------------------------------+
```
Reviewers: mislav.bradac, teon.banek, buda
Reviewed By: mislav.bradac, buda
Subscribers: pullbot
Differential Revision: https://phabricator.memgraph.io/D695
2017-08-23 16:43:45 +08:00
|
|
|
aggregate(n_p1, Aggregation::Op::COLLECT_LIST);
|
|
|
|
aggregate(n_p1, Aggregation::Op::COLLECT_MAP);
|
2017-04-11 21:11:48 +08:00
|
|
|
aggregate(n_p1, Aggregation::Op::MIN);
|
|
|
|
aggregate(n_p1, Aggregation::Op::MAX);
|
2017-06-12 21:12:31 +08:00
|
|
|
EXPECT_THROW(aggregate(n_p1, Aggregation::Op::AVG), QueryRuntimeException);
|
|
|
|
EXPECT_THROW(aggregate(n_p1, Aggregation::Op::SUM), QueryRuntimeException);
|
2017-04-11 21:11:48 +08:00
|
|
|
|
Collect Map added
Summary:
Tests are on the way. Please first comment if you're OK with this implementation, some points are discussable.
What works now:
```
bash:MEMGRAPH_ROOT/build/>./tests/manual/console 10
MG>MATCH (n) RETURN COLLECT("age_" + n.age, n.height)
+-----------------------------------------------------------------------------------------------------------------------------------+
| COLLECT("age_" + n.age, n.height) |
+-----------------------------------------------------------------------------------------------------------------------------------+
| {age_10: 176, age_13: 180, age_24: 172, age_25: 179, age_32: 123, age_33: 186, age_37: 147, age_43: 162, age_49: 126, age_6: 170} |
+-----------------------------------------------------------------------------------------------------------------------------------+
```
Reviewers: mislav.bradac, teon.banek, buda
Reviewed By: mislav.bradac, buda
Subscribers: pullbot
Differential Revision: https://phabricator.memgraph.io/D695
2017-08-23 16:43:45 +08:00
|
|
|
// combination of int and bool, everything except COUNT and COLLECT fails
|
2017-04-11 21:11:48 +08:00
|
|
|
aggregate(n_p2, Aggregation::Op::COUNT);
|
Collect Map added
Summary:
Tests are on the way. Please first comment if you're OK with this implementation, some points are discussable.
What works now:
```
bash:MEMGRAPH_ROOT/build/>./tests/manual/console 10
MG>MATCH (n) RETURN COLLECT("age_" + n.age, n.height)
+-----------------------------------------------------------------------------------------------------------------------------------+
| COLLECT("age_" + n.age, n.height) |
+-----------------------------------------------------------------------------------------------------------------------------------+
| {age_10: 176, age_13: 180, age_24: 172, age_25: 179, age_32: 123, age_33: 186, age_37: 147, age_43: 162, age_49: 126, age_6: 170} |
+-----------------------------------------------------------------------------------------------------------------------------------+
```
Reviewers: mislav.bradac, teon.banek, buda
Reviewed By: mislav.bradac, buda
Subscribers: pullbot
Differential Revision: https://phabricator.memgraph.io/D695
2017-08-23 16:43:45 +08:00
|
|
|
aggregate(n_p2, Aggregation::Op::COLLECT_LIST);
|
|
|
|
aggregate(n_p2, Aggregation::Op::COLLECT_MAP);
|
2017-06-12 21:12:31 +08:00
|
|
|
EXPECT_THROW(aggregate(n_p2, Aggregation::Op::MIN), QueryRuntimeException);
|
|
|
|
EXPECT_THROW(aggregate(n_p2, Aggregation::Op::MAX), QueryRuntimeException);
|
|
|
|
EXPECT_THROW(aggregate(n_p2, Aggregation::Op::AVG), QueryRuntimeException);
|
|
|
|
EXPECT_THROW(aggregate(n_p2, Aggregation::Op::SUM), QueryRuntimeException);
|
2017-04-11 21:11:48 +08:00
|
|
|
}
|
2017-04-28 21:14:28 +08:00
|
|
|
|
|
|
|
TEST(QueryPlan, Unwind) {
  // Runs a two-level UNWIND over a literal list of lists and verifies, row by
  // row, the cardinality of the outer element and the type of the inner one.
  memgraph::storage::Storage db;
  auto storage_dba = db.Access();
  memgraph::query::DbAccessor dba(&storage_dba);
  AstStorage storage;
  SymbolTable symbol_table;

  using PropVal = memgraph::storage::PropertyValue;

  // UNWIND [ [1, true, "x"], [], ["bla"] ] AS x UNWIND x as y RETURN x, y
  auto input_expr = storage.Create<PrimitiveLiteral>(
      std::vector<PropVal>{PropVal(std::vector<PropVal>{PropVal(1), PropVal(true), PropVal("x")}),
                           PropVal(std::vector<PropVal>{}), PropVal(std::vector<PropVal>{PropVal("bla")})});

  // Outer unwind: every inner list is bound to x.
  auto outer_sym = symbol_table.CreateSymbol("x", true);
  auto outer_unwind = std::make_shared<plan::Unwind>(nullptr, input_expr, outer_sym);
  auto outer_ident = IDENT("x")->MapTo(outer_sym);

  // Inner unwind: every element of x is bound to y.
  auto inner_sym = symbol_table.CreateSymbol("y", true);
  auto inner_unwind = std::make_shared<plan::Unwind>(outer_unwind, outer_ident, inner_sym);

  auto returned_x = NEXPR("x", outer_ident)->MapTo(symbol_table.CreateSymbol("x_ne", true));
  auto inner_ident = IDENT("y")->MapTo(inner_sym);
  auto returned_y = NEXPR("y", inner_ident)->MapTo(symbol_table.CreateSymbol("y_ne", true));
  auto produce = MakeProduce(inner_unwind, returned_x, returned_y);

  auto context = MakeContext(storage, symbol_table, &dba);
  auto results = CollectProduce(*produce, &context);
  ASSERT_EQ(4, results.size());

  // Expectations per produced row; the empty inner list contributes no rows.
  const std::vector<int> expected_x_card{3, 3, 3, 1};
  const std::vector<TypedValue> expected_y{TypedValue(1), TypedValue(true), TypedValue("x"), TypedValue("bla")};
  for (size_t row_index = 0; row_index < results.size(); ++row_index) {
    const auto &row = results[row_index];
    ASSERT_EQ(2, row.size());
    ASSERT_EQ(row[0].type(), TypedValue::Type::List);
    EXPECT_EQ(row[0].ValueList().size(), expected_x_card[row_index]);
    EXPECT_EQ(row[1].type(), expected_y[row_index].type());
  }
}
|
2022-12-03 19:48:44 +08:00
|
|
|
|
|
|
|
TEST_F(QueryPlanAggregateOps, WithDataDistinct) {
  // Populates the fixture data, then checks every column of the single row
  // returned by AggregationResults(false, true).
  // NOTE(review): the two flags presumably mean "no group-by" and "distinct",
  // judging by the sibling test names - confirm against the fixture.
  AddData();
  auto results = AggregationResults(false, true);

  ASSERT_EQ(results.size(), 1);
  auto &row = results[0];
  ASSERT_EQ(row.size(), 8);

  // column 0: count(*)
  ASSERT_EQ(row[0].type(), TypedValue::Type::Int);
  EXPECT_EQ(row[0].ValueInt(), 7);

  // column 1: count
  ASSERT_EQ(row[1].type(), TypedValue::Type::Int);
  EXPECT_EQ(row[1].ValueInt(), 3);

  // column 2: min
  ASSERT_EQ(row[2].type(), TypedValue::Type::Int);
  EXPECT_EQ(row[2].ValueInt(), 5);

  // column 3: max
  ASSERT_EQ(row[3].type(), TypedValue::Type::Int);
  EXPECT_EQ(row[3].ValueInt(), 12);

  // column 4: sum
  ASSERT_EQ(row[4].type(), TypedValue::Type::Int);
  EXPECT_EQ(row[4].ValueInt(), 24);

  // column 5: avg
  ASSERT_EQ(row[5].type(), TypedValue::Type::Double);
  EXPECT_FLOAT_EQ(row[5].ValueDouble(), 24 / 3.0);

  // column 6: collect list
  ASSERT_EQ(row[6].type(), TypedValue::Type::List);
  EXPECT_THAT(ToIntList(row[6]), UnorderedElementsAre(5, 7, 12));

  // column 7: collect map; the single "key" entry may hold any collected value
  ASSERT_EQ(row[7].type(), TypedValue::Type::Map);
  auto collected = ToIntMap(row[7]);
  ASSERT_EQ(collected.size(), 1);
  EXPECT_EQ(collected.begin()->first, "key");
  const std::set<int> allowed_values{5, 7, 12};
  EXPECT_EQ(allowed_values.count(collected.begin()->second), 1);
}
|
|
|
|
|
|
|
|
TEST_F(QueryPlanAggregateOps, WithoutDataWithDistinctAndWithGroupBy) {
  // Runs each aggregation on its own via AggregationResults(true, true, {op})
  // without adding any data first, and checks the type of the single produced
  // value. Int results (COUNT and SUM) must additionally be zero.
  //
  // The size checks are fatal (ASSERT_*), because results[0][0] is indexed
  // right after them; a non-fatal EXPECT_* would let a failing run continue
  // into an out-of-bounds access.
  struct AggregationCase {
    Aggregation::Op op;
    TypedValue::Type expected_type;
  };
  const std::vector<AggregationCase> cases{
      {Aggregation::Op::COUNT, TypedValue::Type::Int},         {Aggregation::Op::SUM, TypedValue::Type::Int},
      {Aggregation::Op::AVG, TypedValue::Type::Null},          {Aggregation::Op::MIN, TypedValue::Type::Null},
      {Aggregation::Op::MAX, TypedValue::Type::Null},          {Aggregation::Op::COLLECT_LIST, TypedValue::Type::List},
      {Aggregation::Op::COLLECT_MAP, TypedValue::Type::Map},
  };

  for (size_t case_index = 0; case_index < cases.size(); ++case_index) {
    // Identifies the failing case, since all cases share the same source lines.
    SCOPED_TRACE("aggregation case #" + std::to_string(case_index));
    const auto &aggregation_case = cases[case_index];

    auto results = AggregationResults(true, true, {aggregation_case.op});
    ASSERT_EQ(results.size(), 1);
    ASSERT_FALSE(results[0].empty());

    const auto &value = results[0][0];
    EXPECT_EQ(value.type(), aggregation_case.expected_type);
    // Only read the integer when the type matched, so a type mismatch is
    // reported once instead of also raising from ValueInt().
    if (aggregation_case.expected_type == TypedValue::Type::Int && value.type() == TypedValue::Type::Int) {
      EXPECT_EQ(value.ValueInt(), 0);
    }
  }
}
|
|
|
|
|
|
|
|
TEST_F(QueryPlanAggregateOps, WithoutDataWithDistinctAndWithoutGroupBy) {
  // No data is added before aggregating. A single row with all eight
  // aggregation columns is still expected, holding "empty" values.
  auto results = AggregationResults(false, true);
  ASSERT_EQ(results.size(), 1);
  auto &row = results[0];
  ASSERT_EQ(row.size(), 8);

  // column 0: count(*)
  ASSERT_EQ(row[0].type(), TypedValue::Type::Int);
  EXPECT_EQ(row[0].ValueInt(), 0);

  // column 1: count
  ASSERT_EQ(row[1].type(), TypedValue::Type::Int);
  EXPECT_EQ(row[1].ValueInt(), 0);

  // column 2: min
  EXPECT_TRUE(row[2].IsNull());

  // column 3: max
  EXPECT_TRUE(row[3].IsNull());

  // column 4: sum
  EXPECT_EQ(row[4].ValueInt(), 0);

  // column 5: avg
  EXPECT_TRUE(row[5].IsNull());

  // column 6: collect list
  ASSERT_EQ(row[6].type(), TypedValue::Type::List);
  EXPECT_EQ(ToIntList(row[6]).size(), 0);

  // column 7: collect map
  ASSERT_EQ(row[7].type(), TypedValue::Type::Map);
  EXPECT_EQ(ToIntMap(row[7]).size(), 0);
}
|
|
|
|
|
|
|
|
TEST(QueryPlan, AggregateGroupByValuesWithDistinct) {
  // Groups vertices by a property that takes values of many different types
  // and checks that each distinct value forms its own group. The "remember"
  // part of the Aggregation API is exercised as well, because the returned
  // group-by value is obtained via a property lookup on the remembered node.
  memgraph::storage::Storage db;
  auto storage_dba = db.Access();
  memgraph::query::DbAccessor dba(&storage_dba);

  using PropVal = memgraph::storage::PropertyValue;

  // Property values to assign to vertices. Each one should produce a distinct
  // group, except for the last two entries (see the comments next to them).
  std::vector<PropVal> prop_values;
  prop_values.emplace_back(4);
  prop_values.emplace_back(7);
  prop_values.emplace_back(7.3);
  prop_values.emplace_back(7.2);
  prop_values.emplace_back("Johhny");
  prop_values.emplace_back("Jane");
  prop_values.emplace_back("1");
  prop_values.emplace_back(true);
  prop_values.emplace_back(false);
  prop_values.emplace_back(std::vector<PropVal>{PropVal(1)});
  prop_values.emplace_back(std::vector<PropVal>{PropVal(1), PropVal(2)});
  prop_values.emplace_back(std::vector<PropVal>{PropVal(2), PropVal(1)});
  prop_values.emplace_back(PropVal());
  // must NOT open a new group, because 7.0 == 7
  prop_values.emplace_back(7.0);
  // must NOT open a new group either
  prop_values.emplace_back(std::vector<PropVal>{PropVal(1), PropVal(2.0)});

  // Create many vertices, cycling through the values above.
  auto prop = dba.NameToProperty("prop");
  for (int vertex_index = 0; vertex_index < 1000; ++vertex_index) {
    const auto &value = prop_values[vertex_index % prop_values.size()];
    ASSERT_TRUE(dba.InsertVertex().SetProperty(prop, value).HasValue());
  }
  dba.AdvanceCommand();

  AstStorage storage;
  SymbolTable symbol_table;

  // Scan all vertices; count distinct n.prop, grouped by n.prop.
  auto scan = MakeScanAll(storage, symbol_table, "n");
  auto prop_lookup = PROPERTY_LOOKUP(IDENT("n")->MapTo(scan.sym_), prop);
  auto produce = MakeAggregationProduce(scan.op_, symbol_table, storage, {prop_lookup}, {Aggregation::Op::COUNT},
                                        {prop_lookup}, {scan.sym_}, true);

  auto context = MakeContext(storage, symbol_table, &dba);
  auto results = CollectProduce(*produce, &context);

  // The two trailing duplicates do not contribute groups of their own.
  const auto expected_group_count = prop_values.size() - 2;
  ASSERT_EQ(results.size(), expected_group_count);

  std::unordered_set<TypedValue, TypedValue::Hash, TypedValue::BoolEqual> seen_group_bys;
  for (const auto &row : results) {
    ASSERT_EQ(2, row.size());
    const auto &count_value = row[0];
    const auto &group_value = row[1];
    // The count is only checked for non-null group keys.
    if (!group_value.IsNull()) {
      ASSERT_EQ(1, count_value.ValueInt());
    }
    seen_group_bys.insert(group_value);
  }
  ASSERT_EQ(seen_group_bys.size(), expected_group_count);

  std::vector<TypedValue> expected_group_bys;
  expected_group_bys.reserve(prop_values.size());
  for (const auto &value : prop_values) {
    expected_group_bys.emplace_back(value);
  }
  // Compare against everything but the two trailing duplicates.
  EXPECT_TRUE(std::is_permutation(expected_group_bys.begin(), expected_group_bys.end() - 2, seen_group_bys.begin(),
                                  TypedValue::BoolEqual{}));
}
|
|
|
|
|
|
|
|
TEST(QueryPlan, AggregateMultipleGroupByWithDistinct) {
  // Vertices get three properties whose values repeat with different periods
  // (2, 3 and 5). The aggregation counts distinct prop1 values grouped by
  // (prop1, prop2) and the test asserts both the number of groups and the
  // count reported for each of them.
  memgraph::storage::Storage db;
  auto storage_dba = db.Access();
  memgraph::query::DbAccessor dba(&storage_dba);

  auto prop1 = dba.NameToProperty("prop1");
  auto prop2 = dba.NameToProperty("prop2");
  // prop3 is set on every vertex but is not used by the aggregation below.
  auto prop3 = dba.NameToProperty("prop3");
  for (int i = 0; i < 2 * 3 * 5; ++i) {
    auto v = dba.InsertVertex();
    ASSERT_TRUE(v.SetProperty(prop1, memgraph::storage::PropertyValue(static_cast<bool>(i % 2))).HasValue());
    ASSERT_TRUE(v.SetProperty(prop2, memgraph::storage::PropertyValue(i % 3)).HasValue());
    ASSERT_TRUE(v.SetProperty(prop3, memgraph::storage::PropertyValue("value" + std::to_string(i % 5))).HasValue());
  }
  dba.AdvanceCommand();

  AstStorage storage;
  SymbolTable symbol_table;

  // match all nodes and perform aggregations
  auto n = MakeScanAll(storage, symbol_table, "n");
  auto n_p1 = PROPERTY_LOOKUP(IDENT("n")->MapTo(n.sym_), prop1);
  auto n_p2 = PROPERTY_LOOKUP(IDENT("n")->MapTo(n.sym_), prop2);

  auto produce = MakeAggregationProduce(n.op_, symbol_table, storage, {n_p1}, {Aggregation::Op::COUNT}, {n_p1, n_p2},
                                        {n.sym_}, true);

  auto context = MakeContext(storage, symbol_table, &dba);
  auto results = CollectProduce(*produce, &context);

  // Without this check the loop below would pass vacuously on an empty result.
  // prop1 takes 2 values and prop2 takes 3; i in [0, 30) hits every pairing,
  // so one row per (prop1, prop2) combination is expected.
  ASSERT_EQ(results.size(), 2 * 3);
  for (const auto &row : results) {
    ASSERT_FALSE(row.empty());
    // prop1 is constant within a group, hence exactly one distinct value.
    ASSERT_EQ(1, row[0].ValueInt());
  }
}
|
|
|
|
|
|
|
|
TEST(QueryPlan, AggregateNoInputWithDistinct) {
  // Aggregates COUNT (distinct) over the literal 2 with no input operator
  // (nullptr) and no group-by; a single row holding the integer 1 is expected.
  memgraph::storage::Storage db;
  auto storage_dba = db.Access();
  memgraph::query::DbAccessor dba(&storage_dba);
  AstStorage storage;
  SymbolTable symbol_table;

  auto two = LITERAL(2);
  auto produce = MakeAggregationProduce(nullptr, symbol_table, storage, {two}, {Aggregation::Op::COUNT}, {}, {}, true);
  auto context = MakeContext(storage, symbol_table, &dba);
  auto results = CollectProduce(*produce, &context);

  // Fatal assertions: results[0][0] is indexed below, so the test must stop
  // here if the shape is wrong instead of reading out of bounds.
  ASSERT_EQ(1, results.size());
  ASSERT_EQ(1, results[0].size());
  ASSERT_EQ(TypedValue::Type::Int, results[0][0].type());
  EXPECT_EQ(1, results[0][0].ValueInt());
}
|
|
|
|
|
|
|
|
TEST(QueryPlan, AggregateCountEdgeCasesWithDistinct) {
  // Regression coverage for bugs found in COUNT aggregation. The distinct
  // COUNT of n.prop is checked after each of these database states:
  //  - no vertices
  //  - one vertex without the property
  //  - one vertex with the property
  //  - two vertices, property on one of them
  //  - two vertices, property on both (same value)
  memgraph::storage::Storage db;
  auto storage_dba = db.Access();
  memgraph::query::DbAccessor dba(&storage_dba);
  auto prop = dba.NameToProperty("prop");

  AstStorage storage;
  SymbolTable symbol_table;

  auto scan = MakeScanAll(storage, symbol_table, "n");
  auto prop_lookup = PROPERTY_LOOKUP(IDENT("n")->MapTo(scan.sym_), prop);

  // Evaluates MATCH (n) RETURN count(n.prop) with the distinct flag set.
  // Yields -1 if the plan produced no rows at all.
  auto distinct_count = [&]() {
    auto produce =
        MakeAggregationProduce(scan.op_, symbol_table, storage, {prop_lookup}, {Aggregation::Op::COUNT}, {}, {}, true);
    auto context = MakeContext(storage, symbol_table, &dba);
    auto rows = CollectProduce(*produce, &context);
    if (rows.empty()) return -1L;
    EXPECT_EQ(1, rows.size());
    EXPECT_EQ(1, rows[0].size());
    EXPECT_EQ(TypedValue::Type::Int, rows[0][0].type());
    return rows[0][0].ValueInt();
  };

  // State 1: empty database.
  EXPECT_EQ(0, distinct_count());

  // State 2: a single vertex, property missing.
  dba.InsertVertex();
  dba.AdvanceCommand();
  EXPECT_EQ(0, distinct_count());

  // State 3: a single vertex, property present.
  for (auto vertex : dba.Vertices(memgraph::storage::View::OLD)) {
    ASSERT_TRUE(vertex.SetProperty(prop, memgraph::storage::PropertyValue(42)).HasValue());
  }
  dba.AdvanceCommand();
  EXPECT_EQ(1, distinct_count());

  // State 4: two vertices, property present on one only.
  dba.InsertVertex();
  dba.AdvanceCommand();
  EXPECT_EQ(1, distinct_count());

  // State 5: two vertices, both holding the same property value.
  for (auto vertex : dba.Vertices(memgraph::storage::View::OLD)) {
    ASSERT_TRUE(vertex.SetProperty(prop, memgraph::storage::PropertyValue(42)).HasValue());
  }
  dba.AdvanceCommand();
  EXPECT_EQ(1, distinct_count());
}
|
|
|
|
|
|
|
|
TEST(QueryPlan, AggregateFirstValueTypesWithDistinct) {
  // Checks which aggregations raise QueryRuntimeException from the type check
  // on the first aggregated value, using a single vertex that carries one
  // string property and one int property.
  memgraph::storage::Storage db;
  auto storage_dba = db.Access();
  memgraph::query::DbAccessor dba(&storage_dba);

  auto vertex = dba.InsertVertex();
  auto prop_string = dba.NameToProperty("string");
  ASSERT_TRUE(vertex.SetProperty(prop_string, memgraph::storage::PropertyValue("johhny")).HasValue());
  auto prop_int = dba.NameToProperty("int");
  ASSERT_TRUE(vertex.SetProperty(prop_int, memgraph::storage::PropertyValue(12)).HasValue());
  dba.AdvanceCommand();

  AstStorage storage;
  SymbolTable symbol_table;

  auto scan = MakeScanAll(storage, symbol_table, "n");
  auto string_lookup = PROPERTY_LOOKUP(IDENT("n")->MapTo(scan.sym_), prop_string);
  auto int_lookup = PROPERTY_LOOKUP(IDENT("n")->MapTo(scan.sym_), prop_int);
  // The expression under the property lookup, i.e. the vertex itself.
  auto vertex_expr = string_lookup->expression_;

  // Builds and runs a distinct, ungrouped aggregation of `aggr_op` over `input`.
  auto run_aggregation = [&](Expression *input, Aggregation::Op aggr_op) {
    auto produce = MakeAggregationProduce(scan.op_, symbol_table, storage, {input}, {aggr_op}, {}, {}, true);
    auto context = MakeContext(storage, symbol_table, &dba);
    CollectProduce(*produce, &context);
  };

  // Vertex input: only COUNT is accepted here; MIN, MAX, AVG and SUM throw.
  run_aggregation(vertex_expr, Aggregation::Op::COUNT);
  EXPECT_THROW(run_aggregation(vertex_expr, Aggregation::Op::MIN), QueryRuntimeException);
  EXPECT_THROW(run_aggregation(vertex_expr, Aggregation::Op::MAX), QueryRuntimeException);
  EXPECT_THROW(run_aggregation(vertex_expr, Aggregation::Op::AVG), QueryRuntimeException);
  EXPECT_THROW(run_aggregation(vertex_expr, Aggregation::Op::SUM), QueryRuntimeException);

  // String input: AVG and SUM throw, the rest succeed.
  run_aggregation(string_lookup, Aggregation::Op::COUNT);
  run_aggregation(string_lookup, Aggregation::Op::MIN);
  run_aggregation(string_lookup, Aggregation::Op::MAX);
  EXPECT_THROW(run_aggregation(string_lookup, Aggregation::Op::AVG), QueryRuntimeException);
  EXPECT_THROW(run_aggregation(string_lookup, Aggregation::Op::SUM), QueryRuntimeException);

  // Int input: every aggregation succeeds.
  run_aggregation(int_lookup, Aggregation::Op::COUNT);
  run_aggregation(int_lookup, Aggregation::Op::MIN);
  run_aggregation(int_lookup, Aggregation::Op::MAX);
  run_aggregation(int_lookup, Aggregation::Op::AVG);
  run_aggregation(int_lookup, Aggregation::Op::SUM);
  run_aggregation(int_lookup, Aggregation::Op::COLLECT_LIST);
  run_aggregation(int_lookup, Aggregation::Op::COLLECT_MAP);
}
|
|
|
|
|
|
|
|
TEST(QueryPlan, AggregateTypesWithDistinct) {
  // Exercises exceptions an aggregation can raise depending on input types.
  // Not every failing combination is covered here; that logic is defined and
  // tested by TypedValue.
  memgraph::storage::Storage db;
  auto storage_dba = db.Access();
  memgraph::query::DbAccessor dba(&storage_dba);

  // p1 only ever holds strings.
  auto p1 = dba.NameToProperty("p1");
  ASSERT_TRUE(dba.InsertVertex().SetProperty(p1, memgraph::storage::PropertyValue("string")).HasValue());
  ASSERT_TRUE(dba.InsertVertex().SetProperty(p1, memgraph::storage::PropertyValue("str2")).HasValue());
  // p2 mixes an int with a bool.
  auto p2 = dba.NameToProperty("p2");
  ASSERT_TRUE(dba.InsertVertex().SetProperty(p2, memgraph::storage::PropertyValue(42)).HasValue());
  ASSERT_TRUE(dba.InsertVertex().SetProperty(p2, memgraph::storage::PropertyValue(true)).HasValue());
  dba.AdvanceCommand();

  AstStorage storage;
  SymbolTable symbol_table;

  auto scan = MakeScanAll(storage, symbol_table, "n");
  auto strings_lookup = PROPERTY_LOOKUP(IDENT("n")->MapTo(scan.sym_), p1);
  auto mixed_lookup = PROPERTY_LOOKUP(IDENT("n")->MapTo(scan.sym_), p2);

  // Builds and runs a distinct, ungrouped aggregation of `aggr_op` over `input`.
  auto run_aggregation = [&](Expression *input, Aggregation::Op aggr_op) {
    auto produce = MakeAggregationProduce(scan.op_, symbol_table, storage, {input}, {aggr_op}, {}, {}, true);
    auto context = MakeContext(storage, symbol_table, &dba);
    CollectProduce(*produce, &context);
  };

  // Vertex input: COUNT and both COLLECT variants succeed, the rest throw.
  auto vertex_expr = strings_lookup->expression_;
  run_aggregation(vertex_expr, Aggregation::Op::COUNT);
  run_aggregation(vertex_expr, Aggregation::Op::COLLECT_LIST);
  run_aggregation(vertex_expr, Aggregation::Op::COLLECT_MAP);
  EXPECT_THROW(run_aggregation(vertex_expr, Aggregation::Op::MIN), QueryRuntimeException);
  EXPECT_THROW(run_aggregation(vertex_expr, Aggregation::Op::MAX), QueryRuntimeException);
  EXPECT_THROW(run_aggregation(vertex_expr, Aggregation::Op::AVG), QueryRuntimeException);
  EXPECT_THROW(run_aggregation(vertex_expr, Aggregation::Op::SUM), QueryRuntimeException);

  // String input: only AVG and SUM throw.
  run_aggregation(strings_lookup, Aggregation::Op::COUNT);
  run_aggregation(strings_lookup, Aggregation::Op::COLLECT_LIST);
  run_aggregation(strings_lookup, Aggregation::Op::COLLECT_MAP);
  run_aggregation(strings_lookup, Aggregation::Op::MIN);
  run_aggregation(strings_lookup, Aggregation::Op::MAX);
  EXPECT_THROW(run_aggregation(strings_lookup, Aggregation::Op::AVG), QueryRuntimeException);
  EXPECT_THROW(run_aggregation(strings_lookup, Aggregation::Op::SUM), QueryRuntimeException);

  // Mixed int/bool input: COUNT and both COLLECT variants succeed, the rest throw.
  run_aggregation(mixed_lookup, Aggregation::Op::COUNT);
  run_aggregation(mixed_lookup, Aggregation::Op::COLLECT_LIST);
  run_aggregation(mixed_lookup, Aggregation::Op::COLLECT_MAP);
  EXPECT_THROW(run_aggregation(mixed_lookup, Aggregation::Op::MIN), QueryRuntimeException);
  EXPECT_THROW(run_aggregation(mixed_lookup, Aggregation::Op::MAX), QueryRuntimeException);
  EXPECT_THROW(run_aggregation(mixed_lookup, Aggregation::Op::AVG), QueryRuntimeException);
  EXPECT_THROW(run_aggregation(mixed_lookup, Aggregation::Op::SUM), QueryRuntimeException);
}
|