2016-08-23 02:03:45 +08:00
|
|
|
#pragma once
|
|
|
|
|
|
|
|
#include <algorithm>
|
|
|
|
#include <chrono>
|
|
|
|
#include <cstring>
|
|
|
|
#include <ctime>
|
|
|
|
#include <fstream>
|
|
|
|
#include <iostream>
|
|
|
|
#include <queue>
|
|
|
|
#include <regex>
|
|
|
|
#include <sstream>
|
|
|
|
#include <string>
|
|
|
|
#include <vector>
|
|
|
|
|
|
|
|
#include "import/element_skeleton.hpp"
|
|
|
|
#include "import/fillings/filler.hpp"
|
2016-09-13 03:13:04 +08:00
|
|
|
#include "logging/default.hpp"
|
2016-08-23 02:03:45 +08:00
|
|
|
#include "storage/model/properties/flags.hpp"
|
|
|
|
#include "storage/vertex_accessor.hpp"
|
|
|
|
#include "utils/option.hpp"
|
|
|
|
|
|
|
|
using namespace std;
|
|
|
|
|
2016-08-25 22:29:45 +08:00
|
|
|
static Option<VertexAccessor> empty_op_vacc;
|
2016-08-23 02:03:45 +08:00
|
|
|
|
|
|
|
// Base importer with common facilities.
|
|
|
|
class BaseImporter
|
|
|
|
{
|
|
|
|
|
|
|
|
public:
|
2016-09-13 03:13:04 +08:00
|
|
|
BaseImporter(DbAccessor &db, Logger &&logger)
|
|
|
|
: db(db), logger(std::move(logger))
|
2016-08-23 02:03:45 +08:00
|
|
|
{
|
|
|
|
}
|
|
|
|
|
|
|
|
char *cstr(string &str) { return &str[0]; }
|
|
|
|
|
|
|
|
bool split(string &str, char mark, vector<char *> &sub_str)
|
|
|
|
{
|
|
|
|
return split(cstr(str), mark, sub_str);
|
|
|
|
}
|
|
|
|
|
|
|
|
// Occurances of mark are changed with '\0'. sub_str is filled with
|
|
|
|
// pointers to parts of str splited by mark in ascending order. Empty
|
|
|
|
// sub_str are included. Doesn't split inside quotations and
|
|
|
|
// open_bracket,closed_bracket.
|
|
|
|
// Returns true if it was succesfully parsed.
|
|
|
|
bool split(char *str, char mark, vector<char *> &sub_str)
|
|
|
|
{
|
|
|
|
|
|
|
|
int head = 0;
|
|
|
|
bool in_text = false;
|
|
|
|
bool in_array = false;
|
|
|
|
|
|
|
|
for (int i = 0; str[i] != '\0'; i++) {
|
|
|
|
char &c = str[i];
|
|
|
|
|
|
|
|
// IN TEXT check
|
|
|
|
if (c == quotations_mark) {
|
|
|
|
in_text = !in_text;
|
|
|
|
if (in_text && head == i) {
|
|
|
|
c = '\0';
|
|
|
|
head = i + 1;
|
|
|
|
} else if (!in_text && !in_array) {
|
|
|
|
c = '\0';
|
|
|
|
}
|
|
|
|
continue;
|
|
|
|
} else if (in_text) {
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
// IN ARRAY check
|
|
|
|
if (c == open_bracket) {
|
|
|
|
if (in_array) {
|
2016-09-13 03:13:04 +08:00
|
|
|
logger.error("Nested arrays aren't supported.");
|
2016-08-23 02:03:45 +08:00
|
|
|
return false;
|
|
|
|
}
|
|
|
|
in_array = true;
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
if (in_array) {
|
|
|
|
if (c == closed_bracket) {
|
|
|
|
in_array = false;
|
|
|
|
}
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
// SPLIT CHECK
|
|
|
|
if (c == mark) {
|
|
|
|
c = '\0';
|
|
|
|
sub_str.push_back(&str[head]);
|
|
|
|
head = i + 1;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
sub_str.push_back(&str[head]);
|
|
|
|
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
2016-09-19 06:22:36 +08:00
|
|
|
// Extracts parts of str while stripping parts of array chars and qutation
|
|
|
|
// marks. Parts are separated with delimiter.
|
2016-08-23 02:03:45 +08:00
|
|
|
void extract(char *str, const char delimiter, vector<char *> &sub_str)
|
|
|
|
{
|
|
|
|
int head = 0;
|
|
|
|
bool in_text = false;
|
|
|
|
|
|
|
|
for (int i = 0; str[i] != '\0'; i++) {
|
|
|
|
char &c = str[i];
|
|
|
|
|
|
|
|
// IN TEXT check
|
|
|
|
if (c == quotations_mark) {
|
|
|
|
in_text = !in_text;
|
|
|
|
if (in_text) {
|
|
|
|
} else {
|
|
|
|
c = '\0';
|
|
|
|
sub_str.push_back(&str[head]);
|
|
|
|
head = i + 1;
|
|
|
|
}
|
|
|
|
head = i + 1;
|
|
|
|
continue;
|
|
|
|
} else if (in_text) {
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
// IN ARRAY check
|
|
|
|
if (c == open_bracket) {
|
|
|
|
head = i + 1;
|
|
|
|
continue;
|
|
|
|
} else if (c == closed_bracket) {
|
|
|
|
c = '\0';
|
|
|
|
if (i > head) {
|
|
|
|
sub_str.push_back(&str[head]);
|
|
|
|
}
|
|
|
|
head = i + 1;
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
// SPLIT CHECK
|
|
|
|
if (c == delimiter) {
|
|
|
|
c = '\0';
|
|
|
|
if (i > head) {
|
|
|
|
sub_str.push_back(&str[head]);
|
|
|
|
}
|
|
|
|
head = i + 1;
|
|
|
|
} else if (c == ' ' && i == head) {
|
|
|
|
head++;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
sub_str.push_back(&str[head]);
|
|
|
|
}
|
|
|
|
|
2016-09-19 06:22:36 +08:00
|
|
|
// Optionaly return vertex with given import local id if it exists.
|
2016-08-25 22:29:45 +08:00
|
|
|
Option<VertexAccessor> const &get_vertex(size_t id)
|
2016-08-23 02:03:45 +08:00
|
|
|
{
|
|
|
|
if (vertices.size() > id) {
|
|
|
|
return vertices[id];
|
|
|
|
} else {
|
|
|
|
cout << vertices.size() << " -> " << id << endl;
|
|
|
|
return empty_op_vacc;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
public:
|
|
|
|
DbAccessor &db;
|
2016-09-13 03:13:04 +08:00
|
|
|
Logger logger;
|
2016-08-23 02:03:45 +08:00
|
|
|
|
2016-09-19 06:22:36 +08:00
|
|
|
// Varius marks and delimiters. They can be freely changed here and
|
|
|
|
// everything will work.
|
2016-08-23 02:03:45 +08:00
|
|
|
char parts_mark = ',';
|
|
|
|
char parts_array_mark = ',';
|
|
|
|
char type_mark = ':';
|
|
|
|
char quotations_mark = '"';
|
|
|
|
char open_bracket = '[';
|
|
|
|
char closed_bracket = ']';
|
|
|
|
|
|
|
|
protected:
|
2016-09-19 06:22:36 +08:00
|
|
|
// All created vertices which have import local id.
|
2016-08-25 22:29:45 +08:00
|
|
|
vector<Option<VertexAccessor>> vertices;
|
2016-08-23 02:03:45 +08:00
|
|
|
};
|