#include "gmock/gmock.h" #include "gtest/gtest.h" #include "utils/csv_parsing.hpp" #include "utils/string.hpp" class CsvReaderTest : public ::testing::Test { protected: const std::filesystem::path csv_directory{std::filesystem::temp_directory_path() / "csv_testing"}; void SetUp() override { Clear(); CreateCsvDir(); } void TearDown() override { Clear(); } private: void CreateCsvDir() { if (!std::filesystem::exists(csv_directory)) { std::filesystem::create_directory(csv_directory); } } void Clear() { if (!std::filesystem::exists(csv_directory)) return; std::filesystem::remove_all(csv_directory); } }; namespace { class FileWriter { public: explicit FileWriter(const std::filesystem::path path) { stream_.open(path); } FileWriter(const FileWriter &) = delete; FileWriter &operator=(const FileWriter &) = delete; FileWriter(FileWriter &&) = delete; FileWriter &operator=(FileWriter &&) = delete; void Close() { stream_.close(); } size_t WriteLine(const std::string_view line) { if (!stream_.is_open()) { return 0; } stream_ << line << std::endl; // including the newline character return line.size() + 1; } private: std::ofstream stream_; }; std::string CreateRow(const std::vector &columns, const std::string_view delim) { return utils::Join(columns, delim); } auto ToPmrColumns(const std::vector &columns) { utils::pmr::vector pmr_columns(utils::NewDeleteResource()); for (const auto &col : columns) { pmr_columns.emplace_back(col); } return pmr_columns; } } // namespace TEST_F(CsvReaderTest, CommaDelimiter) { // create a file with a single valid row; const auto filepath = csv_directory / "bla.csv"; auto writer = FileWriter(filepath); const std::vector columns{"A", "B", "C"}; writer.WriteLine(CreateRow(columns, ",")); writer.Close(); utils::MemoryResource *mem{utils::NewDeleteResource()}; bool with_header = false; bool ignore_bad = false; utils::pmr::string delimiter{",", mem}; utils::pmr::string quote{"\"", mem}; csv::Reader::Config cfg{with_header, ignore_bad, delimiter, quote}; auto reader = csv::Reader(filepath, cfg, mem); auto parsed_row = reader.GetNextRow(); ASSERT_EQ(parsed_row, ToPmrColumns(columns)); } TEST_F(CsvReaderTest, SemicolonDelimiter) { const auto filepath = csv_directory / "bla.csv"; auto writer = FileWriter(filepath); utils::MemoryResource *mem(utils::NewDeleteResource()); const utils::pmr::string delimiter{";", mem}; const utils::pmr::string quote{"\"", mem}; const std::vector columns{"A", "B", "C"}; writer.WriteLine(CreateRow(columns, delimiter)); writer.Close(); const bool with_header = false; const bool ignore_bad = false; const csv::Reader::Config cfg{with_header, ignore_bad, delimiter, quote}; auto reader = csv::Reader(filepath, cfg, mem); auto parsed_row = reader.GetNextRow(); ASSERT_EQ(parsed_row, ToPmrColumns(columns)); } TEST_F(CsvReaderTest, SkipBad) { // create a file with invalid first two rows (containing a string with a // missing closing quote); // the last row is valid; const auto filepath = csv_directory / "bla.csv"; auto writer = FileWriter(filepath); utils::MemoryResource *mem(utils::NewDeleteResource()); const utils::pmr::string delimiter{";", mem}; const utils::pmr::string quote{"\"", mem}; const std::vector columns_bad{"A", "B", "\"\"C"}; writer.WriteLine(CreateRow(columns_bad, delimiter)); writer.WriteLine(CreateRow(columns_bad, delimiter)); const std::vector columns_good{"A", "B", "C"}; writer.WriteLine(CreateRow(columns_good, delimiter)); writer.Close(); { // we set the 'ignore_bad' flag in the read configuration to 'true'; // parser's output should be solely the valid row; const bool with_header = false; const bool ignore_bad = true; const csv::Reader::Config cfg{with_header, ignore_bad, delimiter, quote}; auto reader = csv::Reader(filepath, cfg, mem); auto parsed_row = reader.GetNextRow(); ASSERT_EQ(parsed_row, ToPmrColumns(columns_good)); } { // we set the 'ignore_bad' flag in the read configuration to 'false'; // an exception must be thrown; const bool with_header = false; const bool ignore_bad = false; const csv::Reader::Config cfg{with_header, ignore_bad, delimiter, quote}; auto reader = csv::Reader(filepath, cfg, mem); EXPECT_THROW(reader.GetNextRow(), csv::CsvReadException); } } TEST_F(CsvReaderTest, AllRowsValid) { // create a file with all rows valid; // parser should return 'std::nullopt' const auto filepath = csv_directory / "bla.csv"; auto writer = FileWriter(filepath); utils::MemoryResource *mem(utils::NewDeleteResource()); const utils::pmr::string delimiter{",", mem}; const utils::pmr::string quote{"\"", mem}; std::vector columns{"A", "B", "C"}; writer.WriteLine(CreateRow(columns, delimiter)); writer.WriteLine(CreateRow(columns, delimiter)); writer.WriteLine(CreateRow(columns, delimiter)); writer.Close(); const bool with_header = false; const bool ignore_bad = false; const csv::Reader::Config cfg{with_header, ignore_bad, delimiter, quote}; auto reader = csv::Reader(filepath, cfg); const auto pmr_columns = ToPmrColumns(columns); while (auto parsed_row = reader.GetNextRow()) { ASSERT_EQ(parsed_row, pmr_columns); } } TEST_F(CsvReaderTest, SkipAllRows) { // create a file with all rows invalid (containing a string with a missing closing quote); // parser should return 'std::nullopt' const auto filepath = csv_directory / "bla.csv"; auto writer = FileWriter(filepath); utils::MemoryResource *mem(utils::NewDeleteResource()); const utils::pmr::string delimiter{",", mem}; const utils::pmr::string quote{"\"", mem}; const std::vector columns_bad{"A", "B", "\"\"C"}; writer.WriteLine(CreateRow(columns_bad, delimiter)); writer.WriteLine(CreateRow(columns_bad, delimiter)); writer.WriteLine(CreateRow(columns_bad, delimiter)); writer.Close(); const bool with_header = false; const bool ignore_bad = true; const csv::Reader::Config cfg{with_header, ignore_bad, delimiter, quote}; auto reader = csv::Reader(filepath, cfg); auto parsed_row = reader.GetNextRow(); ASSERT_EQ(parsed_row, std::nullopt); } TEST_F(CsvReaderTest, WithHeader) { const auto filepath = csv_directory / "bla.csv"; auto writer = FileWriter(filepath); utils::MemoryResource *mem(utils::NewDeleteResource()); const utils::pmr::string delimiter{",", mem}; const utils::pmr::string quote{"\"", mem}; const std::vector header{"A", "B", "C"}; const std::vector columns{"1", "2", "3"}; writer.WriteLine(CreateRow(header, delimiter)); writer.WriteLine(CreateRow(columns, delimiter)); writer.WriteLine(CreateRow(columns, delimiter)); writer.WriteLine(CreateRow(columns, delimiter)); writer.Close(); const bool with_header = true; const bool ignore_bad = false; const csv::Reader::Config cfg(with_header, ignore_bad, delimiter, quote); auto reader = csv::Reader(filepath, cfg); const auto pmr_header = ToPmrColumns(header); ASSERT_EQ(reader.GetHeader(), pmr_header); const auto pmr_columns = ToPmrColumns(columns); while (auto parsed_row = reader.GetNextRow()) { ASSERT_EQ(parsed_row, pmr_columns); } }