// memgraph/tests/unit/slk_streams.cpp
// Copyright 2023 Memgraph Ltd.
//
// Use of this software is governed by the Business Source License
// included in the file licenses/BSL.txt; by using this file, you agree to be bound by the terms of the Business Source
// License, and you may not use this file except in compliance with the Business Source License.
//
// As of the Change Date specified in that file, in accordance with
// the Business Source License, use of this software will be governed
// by the Apache License, Version 2.0, included in the file
// licenses/APL.txt.
#include <gtest/gtest.h>
#include <cstring>
#include <memory>
#include <random>
#include <vector>
#include "slk/streams.hpp"
/// Owning, fixed-size byte buffer used by the tests to slice and compare raw stream contents.
class BinaryData {
 public:
  /// Creates a buffer holding a private copy of the `size` bytes starting at `data`.
  BinaryData(const uint8_t *data, size_t size) : data_(new uint8_t[size]), size_(size) {
    // Skip the copy for an empty buffer: handing memcpy a null source pointer is undefined
    // behaviour even when the length is zero.
    if (size_ != 0) std::memcpy(data_.get(), data, size_);
  }

  /// Adopts an already allocated array of `size` bytes without copying it.
  BinaryData(std::unique_ptr<uint8_t[]> data, size_t size) : data_(std::move(data)), size_(size) {}

  /// Read-only pointer to the first stored byte.
  const uint8_t *data() const { return data_.get(); }

  /// Number of stored bytes.
  size_t size() const { return size_; }

  /// Two buffers are equal when they have the same length and identical bytes.
  bool operator==(const BinaryData &other) const {
    if (size_ != other.size_) return false;
    // Empty buffers compare equal without touching the (possibly null) storage.
    return size_ == 0 || std::memcmp(data_.get(), other.data_.get(), size_) == 0;
  }

 private:
  std::unique_ptr<uint8_t[]> data_;
  size_t size_;
};
/// Concatenation: yields a new buffer holding the bytes of `a` immediately followed by those of `b`.
BinaryData operator+(const BinaryData &a, const BinaryData &b) {
  const size_t total = a.size() + b.size();
  std::unique_ptr<uint8_t[]> joined(new uint8_t[total]);
  uint8_t *const head = joined.get();
  uint8_t *const tail = head + a.size();
  memcpy(head, a.data(), a.size());
  memcpy(tail, b.data(), b.size());
  return BinaryData(std::move(joined), total);
}
/// Returns a buffer of `size` random bytes. The generator is seeded from `std::random_device`
/// on every call, so the contents are not reproducible between calls or test runs.
BinaryData GetRandomData(size_t size) {
  std::mt19937 gen(std::random_device{}());
  // `std::uniform_int_distribution` is only specified for short/int/long/long long and their
  // unsigned counterparts; instantiating it with `uint8_t` is undefined behaviour (and rejected by
  // some standard libraries). Draw a wider integer in [0, 255] and narrow it instead.
  std::uniform_int_distribution<unsigned int> dis(0, 255);
  std::unique_ptr<uint8_t[]> ret(new uint8_t[size]);
  for (size_t i = 0; i < size; ++i) {
    ret[i] = static_cast<uint8_t>(dis(gen));
  }
  return BinaryData(std::move(ret), size);
}
std::vector<BinaryData> BufferToBinaryData(const uint8_t *data, size_t size, std::vector<size_t> sizes) {
std::vector<BinaryData> ret;
ret.reserve(sizes.size());
size_t pos = 0;
for (size_t i = 0; i < sizes.size(); ++i) {
EXPECT_GE(size, pos + sizes[i]);
ret.emplace_back(data + pos, sizes[i]);
pos += sizes[i];
}
return ret;
}
2022-02-22 20:33:45 +08:00
BinaryData SizeToBinaryData(memgraph::slk::SegmentSize size) {
return BinaryData(reinterpret_cast<const uint8_t *>(&size), sizeof(memgraph::slk::SegmentSize));
}
// Saving a 5-byte payload must produce exactly: a size header, the payload bytes and a zero-size
// footer.
TEST(Builder, SingleSegment) {
  std::vector<uint8_t> buffer;
  // Sink that appends every chunk handed over by the builder to `buffer`.
  memgraph::slk::Builder builder([&buffer](const uint8_t *data, size_t size, bool /*have_more*/) {
    buffer.insert(buffer.end(), data, data + size);
  });

  auto input = GetRandomData(5);
  builder.Save(input.data(), input.size());
  builder.Finalize();

  // One header plus one footer surround the payload.
  ASSERT_EQ(buffer.size(), input.size() + 2 * sizeof(memgraph::slk::SegmentSize));

  auto splits =
      BufferToBinaryData(buffer.data(), buffer.size(),
                         {sizeof(memgraph::slk::SegmentSize), input.size(), sizeof(memgraph::slk::SegmentSize)});

  auto header_expected = SizeToBinaryData(input.size());
  ASSERT_EQ(splits[0], header_expected);
  ASSERT_EQ(splits[1], input);

  auto footer_expected = SizeToBinaryData(0);
  ASSERT_EQ(splits[2], footer_expected);
}
// A payload of kSegmentMaxDataSize + 100 bytes must be split into a full segment followed by a
// 100-byte segment, each preceded by its size header, and terminated by a zero-size footer.
TEST(Builder, MultipleSegments) {
  std::vector<uint8_t> buffer;
  // Sink that appends every chunk handed over by the builder to `buffer`.
  memgraph::slk::Builder builder([&buffer](const uint8_t *data, size_t size, bool /*have_more*/) {
    buffer.insert(buffer.end(), data, data + size);
  });

  auto input = GetRandomData(memgraph::slk::kSegmentMaxDataSize + 100);
  builder.Save(input.data(), input.size());
  builder.Finalize();

  // Two segment headers plus the footer surround the payload.
  ASSERT_EQ(buffer.size(), input.size() + 3 * sizeof(memgraph::slk::SegmentSize));

  // Expected layout of the produced stream: header, data, header, data, footer.
  auto splits = BufferToBinaryData(
      buffer.data(), buffer.size(),
      {sizeof(memgraph::slk::SegmentSize), memgraph::slk::kSegmentMaxDataSize, sizeof(memgraph::slk::SegmentSize),
       input.size() - memgraph::slk::kSegmentMaxDataSize, sizeof(memgraph::slk::SegmentSize)});

  // The same cut points applied to the original payload.
  auto datas =
      BufferToBinaryData(input.data(), input.size(),
                         {memgraph::slk::kSegmentMaxDataSize, input.size() - memgraph::slk::kSegmentMaxDataSize});

  auto header1_expected = SizeToBinaryData(memgraph::slk::kSegmentMaxDataSize);
  ASSERT_EQ(splits[0], header1_expected);
  ASSERT_EQ(splits[1], datas[0]);

  auto header2_expected = SizeToBinaryData(input.size() - memgraph::slk::kSegmentMaxDataSize);
  ASSERT_EQ(splits[2], header2_expected);
  ASSERT_EQ(splits[3], datas[1]);

  auto footer_expected = SizeToBinaryData(0);
  ASSERT_EQ(splits[4], footer_expected);
}
// Exercises memgraph::slk::Reader on a stream built from a 5-byte payload: truncated input,
// complete input, trailing garbage, over-reading, under-reading, byte-wise reading and a
// corrupted end mark.
TEST(Reader, SingleSegment) {
  std::vector<uint8_t> buffer;
  // Sink that appends every chunk handed over by the builder to `buffer`.
  memgraph::slk::Builder builder([&buffer](const uint8_t *data, size_t size, bool /*have_more*/) {
    buffer.insert(buffer.end(), data, data + size);
  });

  auto input = GetRandomData(5);
  builder.Save(input.data(), input.size());
  builder.Finalize();

  // test with missing data: every strict prefix of the stream must make Load/Finalize throw
  for (size_t i = 0; i < buffer.size(); ++i) {
    memgraph::slk::Reader reader(buffer.data(), i);
    uint8_t block[memgraph::slk::kSegmentMaxDataSize];
    ASSERT_THROW(
        {
          reader.Load(block, input.size());
          reader.Finalize();
        },
        memgraph::slk::SlkReaderException);
  }

  // test with complete data
  {
    memgraph::slk::Reader reader(buffer.data(), buffer.size());
    uint8_t block[memgraph::slk::kSegmentMaxDataSize];
    reader.Load(block, input.size());
    reader.Finalize();
    auto output = BinaryData(block, input.size());
    ASSERT_EQ(output, input);
  }

  // test with leftover data: bytes after the end of the stream must not disturb the reader
  {
    auto extended_buffer = BinaryData(buffer.data(), buffer.size()) + GetRandomData(5);
    memgraph::slk::Reader reader(extended_buffer.data(), extended_buffer.size());
    uint8_t block[memgraph::slk::kSegmentMaxDataSize];
    reader.Load(block, input.size());
    reader.Finalize();
    auto output = BinaryData(block, input.size());
    ASSERT_EQ(output, input);
  }

  // read more data than there is in the stream
  {
    memgraph::slk::Reader reader(buffer.data(), buffer.size());
    uint8_t block[memgraph::slk::kSegmentMaxDataSize];
    ASSERT_THROW(reader.Load(block, memgraph::slk::kSegmentMaxDataSize), memgraph::slk::SlkReaderException);
  }

  // don't consume all data from the stream
  {
    memgraph::slk::Reader reader(buffer.data(), buffer.size());
    uint8_t block[memgraph::slk::kSegmentMaxDataSize];
    reader.Load(block, input.size() / 2);
    ASSERT_THROW(reader.Finalize(), memgraph::slk::SlkReaderException);
  }

  // read data with several loads (one byte at a time)
  {
    memgraph::slk::Reader reader(buffer.data(), buffer.size());
    uint8_t block[memgraph::slk::kSegmentMaxDataSize];
    for (size_t i = 0; i < input.size(); ++i) {
      reader.Load(block + i, 1);
    }
    reader.Finalize();
    auto output = BinaryData(block, input.size());
    ASSERT_EQ(output, input);
  }

  // modify the end mark: overwrite the last byte of the stream so that Finalize must fail
  buffer[buffer.size() - 1] = 1;
  {
    memgraph::slk::Reader reader(buffer.data(), buffer.size());
    uint8_t block[memgraph::slk::kSegmentMaxDataSize];
    reader.Load(block, input.size());
    ASSERT_THROW(reader.Finalize(), memgraph::slk::SlkReaderException);
  }
}
// Same scenarios as the single-segment reader test, but with a payload of
// kSegmentMaxDataSize + 100 bytes so that the stream spans more than one segment.
TEST(Reader, MultipleSegments) {
  std::vector<uint8_t> buffer;
  // Sink that appends every chunk handed over by the builder to `buffer`.
  memgraph::slk::Builder builder([&buffer](const uint8_t *data, size_t size, bool /*have_more*/) {
    buffer.insert(buffer.end(), data, data + size);
  });

  auto input = GetRandomData(memgraph::slk::kSegmentMaxDataSize + 100);
  builder.Save(input.data(), input.size());
  builder.Finalize();

  // test with missing data: every strict prefix of the stream must make Load/Finalize throw
  for (size_t i = 0; i < buffer.size(); ++i) {
    memgraph::slk::Reader reader(buffer.data(), i);
    uint8_t block[memgraph::slk::kSegmentMaxDataSize * 2];
    ASSERT_THROW(
        {
          reader.Load(block, input.size());
          reader.Finalize();
        },
        memgraph::slk::SlkReaderException);
  }

  // test with complete data
  {
    memgraph::slk::Reader reader(buffer.data(), buffer.size());
    uint8_t block[memgraph::slk::kSegmentMaxDataSize * 2];
    reader.Load(block, input.size());
    reader.Finalize();
    auto output = BinaryData(block, input.size());
    ASSERT_EQ(output, input);
  }

  // test with leftover data: bytes after the end of the stream must not disturb the reader
  {
    auto extended_buffer = BinaryData(buffer.data(), buffer.size()) + GetRandomData(5);
    memgraph::slk::Reader reader(extended_buffer.data(), extended_buffer.size());
    uint8_t block[memgraph::slk::kSegmentMaxDataSize * 2];
    reader.Load(block, input.size());
    reader.Finalize();
    auto output = BinaryData(block, input.size());
    ASSERT_EQ(output, input);
  }

  // read more data than there is in the stream
  {
    memgraph::slk::Reader reader(buffer.data(), buffer.size());
    uint8_t block[memgraph::slk::kSegmentMaxDataSize * 2];
    ASSERT_THROW(reader.Load(block, memgraph::slk::kSegmentMaxDataSize * 2), memgraph::slk::SlkReaderException);
  }

  // don't consume all data from the stream
  {
    memgraph::slk::Reader reader(buffer.data(), buffer.size());
    uint8_t block[memgraph::slk::kSegmentMaxDataSize * 2];
    reader.Load(block, input.size() / 2);
    ASSERT_THROW(reader.Finalize(), memgraph::slk::SlkReaderException);
  }

  // read data with several loads (one byte at a time)
  {
    memgraph::slk::Reader reader(buffer.data(), buffer.size());
    uint8_t block[memgraph::slk::kSegmentMaxDataSize * 2];
    for (size_t i = 0; i < input.size(); ++i) {
      reader.Load(block + i, 1);
    }
    reader.Finalize();
    auto output = BinaryData(block, input.size());
    ASSERT_EQ(output, input);
  }

  // modify the end mark: overwrite the last byte of the stream so that Finalize must fail
  buffer[buffer.size() - 1] = 1;
  {
    memgraph::slk::Reader reader(buffer.data(), buffer.size());
    uint8_t block[memgraph::slk::kSegmentMaxDataSize * 2];
    reader.Load(block, input.size());
    ASSERT_THROW(reader.Finalize(), memgraph::slk::SlkReaderException);
  }
}
// Checks the (status, stream_size, data_size) triple reported by CheckStreamComplete for every
// prefix length of a stream built from a 5-byte payload, and for the stream with trailing bytes.
TEST(CheckStreamComplete, SingleSegment) {
  std::vector<uint8_t> buffer;
  // Sink that appends every chunk handed over by the builder to `buffer`.
  memgraph::slk::Builder builder([&buffer](const uint8_t *data, size_t size, bool /*have_more*/) {
    buffer.insert(buffer.end(), data, data + size);
  });

  auto input = GetRandomData(5);
  builder.Save(input.data(), input.size());
  builder.Finalize();

  // test with missing data
  // Prefix shorter than the segment header.
  for (size_t i = 0; i < sizeof(memgraph::slk::SegmentSize); ++i) {
    auto [status, stream_size, data_size] = memgraph::slk::CheckStreamComplete(buffer.data(), i);
    ASSERT_EQ(status, memgraph::slk::StreamStatus::PARTIAL);
    ASSERT_EQ(stream_size, memgraph::slk::kSegmentMaxTotalSize);
    ASSERT_EQ(data_size, 0);
  }

  // Header present, payload incomplete.
  for (size_t i = sizeof(memgraph::slk::SegmentSize); i < sizeof(memgraph::slk::SegmentSize) + input.size(); ++i) {
    auto [status, stream_size, data_size] = memgraph::slk::CheckStreamComplete(buffer.data(), i);
    ASSERT_EQ(status, memgraph::slk::StreamStatus::PARTIAL);
    ASSERT_EQ(stream_size, memgraph::slk::kSegmentMaxTotalSize + sizeof(memgraph::slk::SegmentSize));
    ASSERT_EQ(data_size, 0);
  }

  // Header and payload present, footer incomplete.
  for (size_t i = sizeof(memgraph::slk::SegmentSize) + input.size(); i < buffer.size(); ++i) {
    auto [status, stream_size, data_size] = memgraph::slk::CheckStreamComplete(buffer.data(), i);
    ASSERT_EQ(status, memgraph::slk::StreamStatus::PARTIAL);
    ASSERT_EQ(stream_size,
              memgraph::slk::kSegmentMaxTotalSize + sizeof(memgraph::slk::SegmentSize) + input.size());
    ASSERT_EQ(data_size, input.size());
  }

  // test with complete data
  {
    auto [status, stream_size, data_size] = memgraph::slk::CheckStreamComplete(buffer.data(), buffer.size());
    ASSERT_EQ(status, memgraph::slk::StreamStatus::COMPLETE);
    ASSERT_EQ(stream_size, buffer.size());
    ASSERT_EQ(data_size, input.size());
  }

  // test with leftover data: the reported sizes must not include the trailing bytes
  {
    auto extended_buffer = BinaryData(buffer.data(), buffer.size()) + GetRandomData(5);
    auto [status, stream_size, data_size] =
        memgraph::slk::CheckStreamComplete(extended_buffer.data(), extended_buffer.size());
    ASSERT_EQ(status, memgraph::slk::StreamStatus::COMPLETE);
    ASSERT_EQ(stream_size, buffer.size());
    ASSERT_EQ(data_size, input.size());
  }
}
// Checks the (status, stream_size, data_size) triple reported by CheckStreamComplete for every
// prefix length of a stream built from kSegmentMaxDataSize + 100 bytes (more than one segment),
// and for the stream with trailing bytes.
TEST(CheckStreamComplete, MultipleSegments) {
  std::vector<uint8_t> buffer;
  // Sink that appends every chunk handed over by the builder to `buffer`.
  memgraph::slk::Builder builder([&buffer](const uint8_t *data, size_t size, bool /*have_more*/) {
    buffer.insert(buffer.end(), data, data + size);
  });

  auto input = GetRandomData(memgraph::slk::kSegmentMaxDataSize + 100);
  builder.Save(input.data(), input.size());
  builder.Finalize();

  // test with missing data
  // Prefix shorter than the first segment header.
  for (size_t i = 0; i < sizeof(memgraph::slk::SegmentSize); ++i) {
    auto [status, stream_size, data_size] = memgraph::slk::CheckStreamComplete(buffer.data(), i);
    ASSERT_EQ(status, memgraph::slk::StreamStatus::PARTIAL);
    ASSERT_EQ(stream_size, memgraph::slk::kSegmentMaxTotalSize);
    ASSERT_EQ(data_size, 0);
  }

  // First header present, first segment's data incomplete.
  for (size_t i = sizeof(memgraph::slk::SegmentSize);
       i < sizeof(memgraph::slk::SegmentSize) + memgraph::slk::kSegmentMaxDataSize; ++i) {
    auto [status, stream_size, data_size] = memgraph::slk::CheckStreamComplete(buffer.data(), i);
    ASSERT_EQ(status, memgraph::slk::StreamStatus::PARTIAL);
    ASSERT_EQ(stream_size, memgraph::slk::kSegmentMaxTotalSize + sizeof(memgraph::slk::SegmentSize));
    ASSERT_EQ(data_size, 0);
  }

  // First segment complete, second header incomplete.
  for (size_t i = sizeof(memgraph::slk::SegmentSize) + memgraph::slk::kSegmentMaxDataSize;
       i < sizeof(memgraph::slk::SegmentSize) * 2 + memgraph::slk::kSegmentMaxDataSize; ++i) {
    auto [status, stream_size, data_size] = memgraph::slk::CheckStreamComplete(buffer.data(), i);
    ASSERT_EQ(status, memgraph::slk::StreamStatus::PARTIAL);
    ASSERT_EQ(stream_size, sizeof(memgraph::slk::SegmentSize) + memgraph::slk::kSegmentMaxDataSize +
                               memgraph::slk::kSegmentMaxTotalSize);
    ASSERT_EQ(data_size, memgraph::slk::kSegmentMaxDataSize);
  }

  // Second header present, second segment's data incomplete.
  for (size_t i = sizeof(memgraph::slk::SegmentSize) * 2 + memgraph::slk::kSegmentMaxDataSize;
       i < sizeof(memgraph::slk::SegmentSize) * 2 + input.size(); ++i) {
    auto [status, stream_size, data_size] = memgraph::slk::CheckStreamComplete(buffer.data(), i);
    ASSERT_EQ(status, memgraph::slk::StreamStatus::PARTIAL);
    ASSERT_EQ(stream_size, sizeof(memgraph::slk::SegmentSize) * 2 + memgraph::slk::kSegmentMaxDataSize +
                               memgraph::slk::kSegmentMaxTotalSize);
    ASSERT_EQ(data_size, memgraph::slk::kSegmentMaxDataSize);
  }

  // Both segments complete, footer incomplete.
  for (size_t i = sizeof(memgraph::slk::SegmentSize) * 2 + input.size(); i < buffer.size(); ++i) {
    auto [status, stream_size, data_size] = memgraph::slk::CheckStreamComplete(buffer.data(), i);
    ASSERT_EQ(status, memgraph::slk::StreamStatus::PARTIAL);
    ASSERT_EQ(stream_size,
              memgraph::slk::kSegmentMaxTotalSize + sizeof(memgraph::slk::SegmentSize) * 2 + input.size());
    ASSERT_EQ(data_size, input.size());
  }

  // test with complete data
  {
    auto [status, stream_size, data_size] = memgraph::slk::CheckStreamComplete(buffer.data(), buffer.size());
    ASSERT_EQ(status, memgraph::slk::StreamStatus::COMPLETE);
    ASSERT_EQ(stream_size, buffer.size());
    ASSERT_EQ(data_size, input.size());
  }

  // test with leftover data: the reported sizes must not include the trailing bytes
  {
    auto extended_buffer = BinaryData(buffer.data(), buffer.size()) + GetRandomData(5);
    auto [status, stream_size, data_size] =
        memgraph::slk::CheckStreamComplete(extended_buffer.data(), extended_buffer.size());
    ASSERT_EQ(status, memgraph::slk::StreamStatus::COMPLETE);
    ASSERT_EQ(stream_size, buffer.size());
    ASSERT_EQ(data_size, input.size());
  }
}
// A stream consisting solely of a zero segment size (an end mark with no preceding segment) must
// be reported as INVALID, with both sizes zero.
TEST(CheckStreamComplete, InvalidSegment) {
  auto input = SizeToBinaryData(0);
  auto [status, stream_size, data_size] = memgraph::slk::CheckStreamComplete(input.data(), input.size());
  ASSERT_EQ(status, memgraph::slk::StreamStatus::INVALID);
  ASSERT_EQ(stream_size, 0);
  ASSERT_EQ(data_size, 0);
}