2016-02-03 07:18:20 +08:00
|
|
|
#pragma once
|
|
|
|
|
2016-07-05 20:20:33 +08:00
|
|
|
#include <iostream>
|
2016-02-03 07:18:20 +08:00
|
|
|
#include <string>
|
2016-02-04 09:45:12 +08:00
|
|
|
#include <tuple>
|
2016-02-22 05:21:15 +08:00
|
|
|
#include <unordered_map>
|
2016-06-06 17:29:52 +08:00
|
|
|
#include <utility>
|
2016-02-03 07:18:20 +08:00
|
|
|
|
|
|
|
#include "cypher/cypher.h"
|
2016-11-02 23:05:02 +08:00
|
|
|
#include "logging/loggable.hpp"
|
|
|
|
#include "query/language/cypher/tokenizer/cypher_lexer.hpp"
|
|
|
|
#include "query/strip/stripped.hpp"
|
2016-06-06 17:29:52 +08:00
|
|
|
#include "storage/model/properties/all.hpp"
|
2016-07-24 10:47:48 +08:00
|
|
|
#include "utils/hashing/fnv.hpp"
|
2016-06-06 17:29:52 +08:00
|
|
|
#include "utils/string/transform.hpp"
|
|
|
|
#include "utils/variadic/variadic.hpp"
|
2016-02-03 07:18:20 +08:00
|
|
|
|
2016-09-05 17:02:48 +08:00
|
|
|
// TODO: Maybe std::move(v) is faster, but it must be cheked for validity.
|
2016-06-06 17:29:52 +08:00
|
|
|
template <class T, class V>
|
2016-11-02 23:05:02 +08:00
|
|
|
void store_query_param(plan_args_t &arguments, V &&v)
|
2016-02-22 05:21:15 +08:00
|
|
|
{
|
2016-09-05 17:02:48 +08:00
|
|
|
arguments.emplace_back(Property(T(std::move(v)), T::type));
|
2016-02-22 05:21:15 +08:00
|
|
|
}
|
|
|
|
|
2016-06-06 17:29:52 +08:00
|
|
|
template <typename... Ts>
|
2016-11-02 23:05:02 +08:00
|
|
|
class QueryStripper : public Loggable
|
2016-02-03 07:18:20 +08:00
|
|
|
{
|
|
|
|
public:
|
2016-11-02 23:05:02 +08:00
|
|
|
QueryStripper(Ts &&... strip_types) : Loggable("QueryStripper"),
|
2016-08-30 12:34:08 +08:00
|
|
|
strip_types(std::make_tuple(std::forward<Ts>(strip_types)...)),
|
2016-06-06 17:29:52 +08:00
|
|
|
lexer(std::make_unique<CypherLexer>())
|
|
|
|
{
|
|
|
|
}
|
2016-02-03 07:18:20 +08:00
|
|
|
|
2016-06-06 17:29:52 +08:00
|
|
|
QueryStripper(QueryStripper &other) = delete;
|
2016-02-22 05:21:15 +08:00
|
|
|
|
2016-11-02 23:05:02 +08:00
|
|
|
QueryStripper(QueryStripper &&other) : Loggable("QueryStripper"),
|
|
|
|
strip_types(std::move(other.strip_types)),
|
2016-06-06 17:29:52 +08:00
|
|
|
lexer(std::move(other.lexer))
|
|
|
|
{
|
|
|
|
}
|
2016-02-03 07:18:20 +08:00
|
|
|
|
2016-07-24 10:47:48 +08:00
|
|
|
auto strip_space(const std::string &query)
|
|
|
|
{
|
2016-11-02 23:05:02 +08:00
|
|
|
return strip(query, " ");
|
2016-07-24 10:47:48 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
auto strip(const std::string &query, const std::string &separator = "")
|
2016-02-03 07:18:20 +08:00
|
|
|
{
|
2016-03-20 15:56:13 +08:00
|
|
|
// TODO write this more optimal (resplace string
|
2016-02-22 05:21:15 +08:00
|
|
|
// concatenation with something smarter)
|
|
|
|
// TODO: in place substring replacement
|
|
|
|
|
2016-02-06 20:45:45 +08:00
|
|
|
auto tokenizer = lexer->tokenize(query);
|
2016-02-22 05:21:15 +08:00
|
|
|
|
|
|
|
// TMP size of supported token types
|
2016-02-04 09:45:12 +08:00
|
|
|
constexpr auto size = std::tuple_size<decltype(strip_types)>::value;
|
2016-02-22 05:21:15 +08:00
|
|
|
|
|
|
|
int counter = 0;
|
2016-11-02 23:05:02 +08:00
|
|
|
plan_args_t stripped_arguments;
|
2016-02-22 05:21:15 +08:00
|
|
|
std::string stripped_query;
|
|
|
|
stripped_query.reserve(query.size());
|
|
|
|
|
2016-11-02 23:05:02 +08:00
|
|
|
while (auto token = tokenizer.lookup())
|
|
|
|
{
|
|
|
|
if (_or(token.id, strip_types, std::make_index_sequence<size>{}))
|
|
|
|
{
|
2016-02-22 05:21:15 +08:00
|
|
|
auto index = counter++;
|
|
|
|
switch (token.id) {
|
2016-07-24 10:47:48 +08:00
|
|
|
case TK_LONG:
|
|
|
|
store_query_param<Int64>(stripped_arguments,
|
|
|
|
std::stol(token.value));
|
2016-06-06 17:29:52 +08:00
|
|
|
break;
|
|
|
|
case TK_STR:
|
2016-08-30 12:34:08 +08:00
|
|
|
// TODO: remove quotes view lexertl
|
|
|
|
token.value.erase(0, 1);
|
|
|
|
token.value.erase(token.value.length() - 1, 1);
|
|
|
|
// TODO: remove
|
2016-06-06 17:29:52 +08:00
|
|
|
store_query_param<String>(stripped_arguments, token.value);
|
|
|
|
break;
|
|
|
|
case TK_BOOL: {
|
|
|
|
bool value = token.value[0] == 'T' || token.value[0] == 't';
|
|
|
|
store_query_param<Bool>(stripped_arguments, value);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
case TK_FLOAT:
|
|
|
|
store_query_param<Float>(stripped_arguments,
|
|
|
|
std::stof(token.value));
|
|
|
|
break;
|
2016-09-05 17:02:48 +08:00
|
|
|
default:
|
2016-11-02 23:05:02 +08:00
|
|
|
// TODO: other properties
|
2016-09-05 17:02:48 +08:00
|
|
|
assert(false);
|
2016-02-22 05:21:15 +08:00
|
|
|
}
|
2016-07-24 10:47:48 +08:00
|
|
|
stripped_query += std::to_string(index) + separator;
|
2016-02-03 07:18:20 +08:00
|
|
|
} else {
|
2016-03-13 03:16:19 +08:00
|
|
|
// TODO: lowercase only keywords like (MATCH, CREATE, ...)
|
2016-07-24 10:47:48 +08:00
|
|
|
stripped_query += token.value + separator;
|
2016-02-03 07:18:20 +08:00
|
|
|
}
|
|
|
|
}
|
2016-02-22 05:21:15 +08:00
|
|
|
|
2016-11-02 23:05:02 +08:00
|
|
|
auto hash = fnv(stripped_query);
|
|
|
|
return QueryStripped(std::move(stripped_query),
|
|
|
|
std::move(stripped_arguments),
|
|
|
|
hash);
|
2016-02-03 07:18:20 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
private:
|
2016-02-04 09:45:12 +08:00
|
|
|
std::tuple<Ts...> strip_types;
|
2016-02-06 20:45:45 +08:00
|
|
|
CypherLexer::uptr lexer;
|
2016-02-04 09:45:12 +08:00
|
|
|
|
2016-06-06 17:29:52 +08:00
|
|
|
template <typename Value, typename Tuple, std::size_t... index>
|
|
|
|
bool _or(Value &&value, Tuple &&tuple, std::index_sequence<index...>)
|
2016-02-04 09:45:12 +08:00
|
|
|
{
|
|
|
|
return or_vargs(std::forward<Value>(value),
|
|
|
|
std::get<index>(std::forward<Tuple>(tuple))...);
|
|
|
|
}
|
2016-02-03 07:18:20 +08:00
|
|
|
};
|
2016-02-06 20:45:45 +08:00
|
|
|
|
2016-06-06 17:29:52 +08:00
|
|
|
template <typename... Ts>
|
|
|
|
decltype(auto) make_query_stripper(Ts &&... ts)
|
|
|
|
{
|
2016-02-06 20:45:45 +08:00
|
|
|
return QueryStripper<Ts...>(std::forward<Ts>(ts)...);
|
|
|
|
}
|