2021-01-23 21:39:18 +01:00
|
|
|
#include "test_helpers.hpp"
|
2020-12-10 19:26:56 +01:00
|
|
|
#include <algorithm>
|
|
|
|
#include <filesystem>
|
2021-01-19 20:26:36 +01:00
|
|
|
#include <fstream>
|
2021-02-23 01:02:15 +01:00
|
|
|
#include <iomanip>
|
2023-07-29 20:41:31 +02:00
|
|
|
#include <iostream>
|
2021-01-19 20:26:36 +01:00
|
|
|
#include <ss/parser.hpp>
|
2021-02-23 01:02:15 +01:00
|
|
|
#include <sstream>
|
2023-07-25 00:56:38 +02:00
|
|
|
#include <unordered_map>
|
|
|
|
#include <unordered_set>
|
2021-02-23 01:02:15 +01:00
|
|
|
|
2023-07-29 20:41:31 +02:00
|
|
|
namespace {
|
|
|
|
/// Replaces every occurrence of `from` inside `s` with `to`.
///
/// The search proceeds left to right and resumes right after each inserted
/// `to`, so replacement text is never rescanned. An empty `from` is a no-op.
[[maybe_unused]] void replace_all(std::string& s, const std::string& from,
                                  const std::string& to) {
    if (from.empty()) {
        return;
    }

    for (size_t pos = s.find(from); pos != std::string::npos;
         pos = s.find(from, pos + to.length())) {
        s.replace(pos, from.length(), to);
    }
}
|
|
|
|
|
2023-08-05 13:49:10 +02:00
|
|
|
template <typename... Ts>
|
|
|
|
void expect_error_on_command(ss::parser<Ts...>& p,
|
|
|
|
const std::function<void()> command) {
|
|
|
|
if (ss::setup<Ts...>::throw_on_error) {
|
|
|
|
try {
|
|
|
|
command();
|
|
|
|
} catch (const std::exception& e) {
|
|
|
|
CHECK_FALSE(std::string{e.what()}.empty());
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
command();
|
|
|
|
CHECK(!p.valid());
|
|
|
|
if constexpr (ss::setup<Ts...>::string_error) {
|
|
|
|
CHECK_FALSE(p.error_msg().empty());
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2024-02-17 00:55:36 +01:00
|
|
|
/// On Windows builds, rewrites every "\r\n" in `s` to "\n".
/// On every other platform `s` is left untouched.
[[maybe_unused]] void update_if_crlf(std::string& s) {
#ifndef _WIN32
    // Nothing to do here; the cast only marks the parameter as used.
    static_cast<void>(s);
#else
    replace_all(s, "\r\n", "\n");
#endif
}
|
|
|
|
|
2020-12-10 19:26:56 +01:00
|
|
|
/// Record type (int, double, string) used as sample CSV data in these tests.
struct X {
    // Column separator used when serializing a record.
    constexpr static auto delim = ",";
    // Sentinel string value: a record carrying it serializes to an empty line.
    constexpr static auto empty = "_EMPTY_";

    int i;
    double d;
    std::string s;

    /// Serializes the record as "<i><delim><d><delim><s>", or as an empty
    /// string when `s` equals the `empty` sentinel.
    std::string to_string() const {
        if (s == empty) {
            return "";
        }

        std::string line = std::to_string(i);
        line += delim;
        line += std::to_string(d);
        line += delim;
        line += s;
        return line;
    }

    /// Tuple of const references to the members, in declaration order.
    auto tied() const {
        return std::tie(i, d, s);
    }
};
|
|
|
|
|
|
|
|
template <typename T>
|
|
|
|
std::enable_if_t<ss::has_m_tied_t<T>, bool> operator==(const T& lhs,
|
|
|
|
const T& rhs) {
|
2020-12-26 00:46:42 +01:00
|
|
|
return lhs.tied() == rhs.tied();
|
2020-12-10 19:26:56 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
/// Writes `data` (and an optional header row) to the file `file_name`.
///
/// Header fields are joined with `T::delim`. Each record is written via its
/// `to_string()` followed by a line ending: always "\n" on Windows builds,
/// alternating "\n" / "\r\n" elsewhere so both styles end up in the file.
///
/// @param file_name  path of the file to create/overwrite
/// @param data       records to serialize, one per line
/// @param header     optional column names written as the first line
template <typename T>
static void make_and_write(const std::string& file_name,
                           const std::vector<T>& data,
                           const std::vector<std::string>& header = {}) {
    std::ofstream out{file_name};

#ifdef _WIN32
    std::vector<const char*> line_endings = {"\n"};
#else
    std::vector<const char*> line_endings = {"\n", "\r\n"};
#endif

    if (!header.empty()) {
        out << header.front();
        for (size_t column = 1; column < header.size(); ++column) {
            out << T::delim;
            out << header[column];
        }
        out << line_endings.front();
    }

    size_t row = 0;
    for (const auto& record : data) {
        out << record.to_string() << line_endings[row % line_endings.size()];
        ++row;
    }
}
|
2024-02-17 00:55:36 +01:00
|
|
|
|
|
|
|
/// Loads the complete contents of `file_name` into a string, byte for byte.
///
/// The file is opened in binary mode, so line endings are kept exactly as
/// stored. A file that cannot be opened yields an empty string.
///
/// @param file_name  path of the file to read
/// @return the raw file contents
std::string make_buffer(const std::string& file_name) {
    std::ifstream in{file_name, std::ios::binary};
    std::string out;

    // Reserve more than the size of the string object itself so that the
    // characters are stored in a separate allocation.
    // NOTE(review): presumably this keeps `data()` stable when make_parser
    // moves the returned string after passing `data()` to the parser —
    // confirm before removing.
    out.reserve(sizeof(out) + 1);

    // Copy raw bytes. Token-wise extraction (`in >> word`) skips whitespace,
    // which would drop spaces/tabs and collapse consecutive line breaks.
    for (char c; in.get(c);) {
        out.push_back(c);
    }
    return out;
}
|
|
|
|
|
|
|
|
template <bool buffer_mode, typename... Ts>
|
|
|
|
std::tuple<ss::parser<Ts...>, std::string> make_parser(
|
|
|
|
const std::string& file_name, const std::string& delim) {
|
|
|
|
if (buffer_mode) {
|
|
|
|
auto buffer = make_buffer(file_name);
|
|
|
|
return {ss::parser<Ts...>{buffer.data(), buffer.size(), delim},
|
|
|
|
std::move(buffer)};
|
|
|
|
} else {
|
|
|
|
return {ss::parser<Ts...>{file_name, delim}, std::string{}};
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-07-29 20:41:31 +02:00
|
|
|
} /* namespace */
|
2021-02-24 22:08:11 +01:00
|
|
|
|
2023-08-04 16:48:07 +02:00
|
|
|
// Constructing a parser for f.name (nothing is written to it in this test)
// must report an error in every error-handling mode.
TEST_CASE("test file not found") {
    unique_file_name f{"test_parser"};

    // Default setup: the parser is simply invalid.
    {
        ss::parser parser{f.name, ","};
        CHECK_FALSE(parser.valid());
    }

    // string_error setup: the parser is invalid as well.
    {
        ss::parser<ss::string_error> parser{f.name, ","};
        CHECK_FALSE(parser.valid());
    }

    // throw_on_error setup: construction itself must throw.
    try {
        ss::parser<ss::throw_on_error> parser{f.name, ","};
        FAIL("Expected exception...");
    } catch (const std::exception& error) {
        CHECK_FALSE(std::string{error.what()}.empty());
    }
}
|
|
|
|
|
2024-02-17 00:55:36 +01:00
|
|
|
template <bool buffer_mode, typename... Ts>
|
2023-08-04 16:48:07 +02:00
|
|
|
void test_various_cases() {
|
2023-07-29 20:41:31 +02:00
|
|
|
unique_file_name f{"test_parser"};
|
2020-12-26 00:46:42 +01:00
|
|
|
std::vector<X> data = {{1, 2, "x"}, {3, 4, "y"}, {5, 6, "z"},
|
|
|
|
{7, 8, "u"}, {9, 10, "v"}, {11, 12, "w"}};
|
|
|
|
make_and_write(f.name, data);
|
2024-02-17 00:55:36 +01:00
|
|
|
auto csv_data_buffer = make_buffer(f.name);
|
2020-12-26 00:46:42 +01:00
|
|
|
{
|
2024-02-17 00:55:36 +01:00
|
|
|
auto [p, _] = make_parser<buffer_mode, Ts...>(f.name, ",");
|
2022-03-27 21:41:46 +02:00
|
|
|
ss::parser p0{std::move(p)};
|
|
|
|
p = std::move(p0);
|
2020-12-26 00:46:42 +01:00
|
|
|
std::vector<X> i;
|
2020-12-10 19:26:56 +01:00
|
|
|
|
2024-02-17 00:55:36 +01:00
|
|
|
auto [p2, __] = make_parser<buffer_mode, Ts...>(f.name, ",");
|
2021-02-28 19:22:54 +01:00
|
|
|
std::vector<X> i2;
|
|
|
|
|
2024-02-17 00:55:36 +01:00
|
|
|
auto move_rotate = [&p = p, &p0 = p0] {
|
2023-08-05 12:05:17 +02:00
|
|
|
auto p1 = std::move(p);
|
|
|
|
p0 = std::move(p1);
|
|
|
|
p = std::move(p0);
|
|
|
|
};
|
|
|
|
|
2020-12-26 00:46:42 +01:00
|
|
|
while (!p.eof()) {
|
2023-08-05 12:05:17 +02:00
|
|
|
move_rotate();
|
2023-08-04 16:48:07 +02:00
|
|
|
auto a = p.template get_next<int, double, std::string>();
|
2020-12-26 00:46:42 +01:00
|
|
|
i.emplace_back(ss::to_object<X>(a));
|
2020-12-10 19:26:56 +01:00
|
|
|
}
|
|
|
|
|
2024-02-17 00:55:36 +01:00
|
|
|
for (const auto& a : p2.template iterate<int, double, std::string>()) {
|
2021-02-28 19:22:54 +01:00
|
|
|
i2.emplace_back(ss::to_object<X>(a));
|
|
|
|
}
|
|
|
|
|
2021-02-27 13:53:06 +01:00
|
|
|
CHECK_EQ(i, data);
|
2021-02-28 19:22:54 +01:00
|
|
|
CHECK_EQ(i2, data);
|
2020-12-26 00:46:42 +01:00
|
|
|
}
|
2020-12-10 19:26:56 +01:00
|
|
|
|
2020-12-26 00:46:42 +01:00
|
|
|
{
|
2024-02-17 00:55:36 +01:00
|
|
|
auto [p, _] = make_parser<buffer_mode, Ts...>(f.name, ",");
|
2020-12-26 00:46:42 +01:00
|
|
|
std::vector<X> i;
|
2021-02-28 19:22:54 +01:00
|
|
|
|
2024-02-17 00:55:36 +01:00
|
|
|
auto [p2, __] = make_parser<buffer_mode, Ts...>(f.name, ",");
|
2021-02-28 19:22:54 +01:00
|
|
|
std::vector<X> i2;
|
|
|
|
|
2024-02-17 00:55:36 +01:00
|
|
|
auto [p3, ___] = make_parser<buffer_mode, Ts...>(f.name, ",");
|
2021-02-28 19:22:54 +01:00
|
|
|
std::vector<X> i3;
|
|
|
|
|
2021-02-21 02:49:23 +01:00
|
|
|
std::vector<X> expected = {std::begin(data) + 1, std::end(data)};
|
2021-02-28 19:22:54 +01:00
|
|
|
using tup = std::tuple<int, double, std::string>;
|
2020-12-10 19:26:56 +01:00
|
|
|
|
2020-12-26 00:46:42 +01:00
|
|
|
p.ignore_next();
|
|
|
|
while (!p.eof()) {
|
2024-02-17 00:55:36 +01:00
|
|
|
auto a = p.template get_next<tup>();
|
2020-12-26 00:46:42 +01:00
|
|
|
i.emplace_back(ss::to_object<X>(a));
|
2020-12-10 19:26:56 +01:00
|
|
|
}
|
|
|
|
|
2021-02-28 19:22:54 +01:00
|
|
|
p2.ignore_next();
|
2024-02-17 00:55:36 +01:00
|
|
|
for (const auto& a : p2.template iterate<tup>()) {
|
2021-02-28 19:22:54 +01:00
|
|
|
i2.emplace_back(ss::to_object<X>(a));
|
|
|
|
}
|
|
|
|
|
|
|
|
p3.ignore_next();
|
2024-02-17 00:55:36 +01:00
|
|
|
for (auto it = p3.template iterate<tup>().begin();
|
|
|
|
it != p3.template iterate<tup>().end(); ++it) {
|
2021-02-28 19:22:54 +01:00
|
|
|
i3.emplace_back(ss::to_object<X>(*it));
|
|
|
|
}
|
|
|
|
|
2021-02-21 02:49:23 +01:00
|
|
|
CHECK_EQ(i, expected);
|
2021-02-28 19:22:54 +01:00
|
|
|
CHECK_EQ(i2, expected);
|
|
|
|
CHECK_EQ(i3, expected);
|
2020-12-26 00:46:42 +01:00
|
|
|
}
|
2020-12-10 19:26:56 +01:00
|
|
|
|
2020-12-26 00:46:42 +01:00
|
|
|
{
|
2024-02-17 00:55:36 +01:00
|
|
|
auto [p, _] = make_parser<buffer_mode, Ts...>(f.name, ",");
|
2020-12-26 00:46:42 +01:00
|
|
|
std::vector<X> i;
|
2024-02-17 00:55:36 +01:00
|
|
|
auto [p2, __] = make_parser<buffer_mode, Ts...>(f.name, ",");
|
2021-02-28 19:22:54 +01:00
|
|
|
std::vector<X> i2;
|
2020-12-10 19:26:56 +01:00
|
|
|
|
2020-12-26 00:46:42 +01:00
|
|
|
while (!p.eof()) {
|
2024-02-17 00:55:36 +01:00
|
|
|
i.push_back(p.template get_object<X, int, double, std::string>());
|
2020-12-10 19:26:56 +01:00
|
|
|
}
|
|
|
|
|
2024-02-17 00:55:36 +01:00
|
|
|
for (auto&& a :
|
|
|
|
p2.template iterate_object<X, int, double, std::string>()) {
|
2021-02-28 19:22:54 +01:00
|
|
|
i2.push_back(std::move(a));
|
|
|
|
}
|
|
|
|
|
2021-02-20 15:53:18 +01:00
|
|
|
CHECK_EQ(i, data);
|
2021-02-28 19:22:54 +01:00
|
|
|
CHECK_EQ(i2, data);
|
2020-12-26 00:46:42 +01:00
|
|
|
}
|
2020-12-26 00:36:08 +01:00
|
|
|
|
2020-12-26 00:46:42 +01:00
|
|
|
{
|
2024-02-17 00:55:36 +01:00
|
|
|
auto [p, _] = make_parser<buffer_mode, Ts...>(f.name, ",");
|
2020-12-26 00:46:42 +01:00
|
|
|
std::vector<X> i;
|
2020-12-26 00:36:08 +01:00
|
|
|
|
2024-02-17 00:55:36 +01:00
|
|
|
for (auto&& a :
|
|
|
|
p.template iterate_object<X, int, double, std::string>()) {
|
2021-02-28 19:22:54 +01:00
|
|
|
i.push_back(std::move(a));
|
|
|
|
}
|
|
|
|
|
|
|
|
CHECK_EQ(i, data);
|
|
|
|
}
|
|
|
|
|
|
|
|
{
|
2024-02-17 00:55:36 +01:00
|
|
|
auto [p, _] = make_parser<buffer_mode, Ts...>(f.name, ",");
|
2021-02-28 19:22:54 +01:00
|
|
|
std::vector<X> i;
|
|
|
|
|
2024-02-17 00:55:36 +01:00
|
|
|
auto [p2, __] = make_parser<buffer_mode, Ts...>(f.name, ",");
|
2021-02-28 19:22:54 +01:00
|
|
|
std::vector<X> i2;
|
|
|
|
|
|
|
|
using tup = std::tuple<int, double, std::string>;
|
2020-12-26 00:46:42 +01:00
|
|
|
while (!p.eof()) {
|
2024-02-17 00:55:36 +01:00
|
|
|
i.push_back(p.template get_object<X, tup>());
|
2020-12-26 00:36:08 +01:00
|
|
|
}
|
|
|
|
|
2024-02-17 00:55:36 +01:00
|
|
|
for (auto it = p2.template iterate_object<X, tup>().begin();
|
|
|
|
it != p2.template iterate_object<X, tup>().end(); it++) {
|
2021-02-28 19:22:54 +01:00
|
|
|
i2.push_back({it->i, it->d, it->s});
|
|
|
|
}
|
|
|
|
|
|
|
|
CHECK_EQ(i, data);
|
|
|
|
CHECK_EQ(i2, data);
|
|
|
|
}
|
|
|
|
|
|
|
|
{
|
2024-02-17 00:55:36 +01:00
|
|
|
auto [p, _] = make_parser<buffer_mode, Ts...>(f.name, ",");
|
2021-02-28 19:22:54 +01:00
|
|
|
std::vector<X> i;
|
|
|
|
|
|
|
|
using tup = std::tuple<int, double, std::string>;
|
2024-02-17 00:55:36 +01:00
|
|
|
for (auto&& a : p.template iterate_object<X, tup>()) {
|
2021-02-28 19:22:54 +01:00
|
|
|
i.push_back(std::move(a));
|
|
|
|
}
|
|
|
|
|
2021-02-20 15:53:18 +01:00
|
|
|
CHECK_EQ(i, data);
|
2020-12-26 00:46:42 +01:00
|
|
|
}
|
2020-12-10 19:26:56 +01:00
|
|
|
|
2020-12-26 00:46:42 +01:00
|
|
|
{
|
2024-02-17 00:55:36 +01:00
|
|
|
auto [p, _] = make_parser<buffer_mode, Ts...>(f.name, ",");
|
2020-12-26 00:46:42 +01:00
|
|
|
std::vector<X> i;
|
2020-12-10 19:26:56 +01:00
|
|
|
|
2020-12-26 00:46:42 +01:00
|
|
|
while (!p.eof()) {
|
2024-02-17 00:55:36 +01:00
|
|
|
i.push_back(p.template get_next<X>());
|
2020-12-10 19:26:56 +01:00
|
|
|
}
|
|
|
|
|
2021-02-20 15:53:18 +01:00
|
|
|
CHECK_EQ(i, data);
|
2020-12-26 00:46:42 +01:00
|
|
|
}
|
2020-12-10 19:26:56 +01:00
|
|
|
|
2021-02-28 19:22:54 +01:00
|
|
|
{
|
2024-02-17 00:55:36 +01:00
|
|
|
auto [p, _] = make_parser<buffer_mode, Ts...>(f.name, ",");
|
2021-02-28 19:22:54 +01:00
|
|
|
std::vector<X> i;
|
|
|
|
|
2024-02-17 00:55:36 +01:00
|
|
|
for (auto&& a : p.template iterate<X>()) {
|
2021-02-28 19:22:54 +01:00
|
|
|
i.push_back(std::move(a));
|
|
|
|
}
|
|
|
|
|
|
|
|
CHECK_EQ(i, data);
|
|
|
|
}
|
|
|
|
|
2020-12-26 00:46:42 +01:00
|
|
|
{
|
|
|
|
constexpr int excluded = 3;
|
2024-02-17 00:55:36 +01:00
|
|
|
auto [p, _] = make_parser<buffer_mode, Ts...>(f.name, ",");
|
2020-12-26 00:46:42 +01:00
|
|
|
std::vector<X> i;
|
|
|
|
|
2024-02-17 00:55:36 +01:00
|
|
|
auto [p2, __] = make_parser<buffer_mode, Ts...>(f.name, ",");
|
2021-02-28 19:22:54 +01:00
|
|
|
std::vector<X> i2;
|
|
|
|
|
2020-12-26 00:46:42 +01:00
|
|
|
while (!p.eof()) {
|
2024-02-17 00:55:36 +01:00
|
|
|
try {
|
|
|
|
auto a = p.template get_object<X, ss::ax<int, excluded>, double,
|
|
|
|
std::string>();
|
|
|
|
if (p.valid()) {
|
|
|
|
i.push_back(a);
|
|
|
|
}
|
|
|
|
} catch (...) {
|
|
|
|
// ignore
|
|
|
|
};
|
2020-12-26 00:46:42 +01:00
|
|
|
}
|
2021-02-21 02:49:23 +01:00
|
|
|
|
2024-02-17 00:55:36 +01:00
|
|
|
if (!ss::setup<Ts...>::throw_on_error) {
|
|
|
|
for (auto&& a : p2.template iterate_object<X, ss::ax<int, excluded>,
|
|
|
|
double, std::string>()) {
|
|
|
|
if (p2.valid()) {
|
|
|
|
i2.push_back(std::move(a));
|
|
|
|
}
|
2021-02-28 19:22:54 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-02-21 02:49:23 +01:00
|
|
|
std::vector<X> expected;
|
|
|
|
for (auto& x : data) {
|
|
|
|
if (x.i != excluded) {
|
|
|
|
expected.push_back(x);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
std::copy_if(data.begin(), data.end(), expected.begin(),
|
2023-07-29 16:51:34 +02:00
|
|
|
[&](const X& x) { return x.i != excluded; });
|
2021-02-21 02:49:23 +01:00
|
|
|
CHECK_EQ(i, expected);
|
2024-02-17 00:55:36 +01:00
|
|
|
|
|
|
|
if (!ss::setup<Ts...>::throw_on_error) {
|
|
|
|
CHECK_EQ(i2, expected);
|
|
|
|
}
|
2020-12-26 00:46:42 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
{
|
2024-02-17 00:55:36 +01:00
|
|
|
auto [p, _] = make_parser<buffer_mode, Ts...>(f.name, ",");
|
2020-12-26 00:46:42 +01:00
|
|
|
std::vector<X> i;
|
|
|
|
|
2024-02-17 00:55:36 +01:00
|
|
|
auto [p2, __] = make_parser<buffer_mode, Ts...>(f.name, ",");
|
2021-02-28 19:22:54 +01:00
|
|
|
std::vector<X> i2;
|
|
|
|
|
2020-12-26 00:46:42 +01:00
|
|
|
while (!p.eof()) {
|
2024-02-17 00:55:36 +01:00
|
|
|
try {
|
|
|
|
auto a = p.template get_object<X, ss::nx<int, 3>, double,
|
|
|
|
std::string>();
|
|
|
|
if (p.valid()) {
|
|
|
|
i.push_back(a);
|
|
|
|
}
|
|
|
|
} catch (...) {
|
|
|
|
// ignore
|
2020-12-26 00:46:42 +01:00
|
|
|
}
|
2020-12-10 19:26:56 +01:00
|
|
|
}
|
2021-02-28 19:22:54 +01:00
|
|
|
|
2024-02-17 00:55:36 +01:00
|
|
|
if (!ss::setup<Ts...>::throw_on_error) {
|
|
|
|
for (auto&& a : p2.template iterate_object<X, ss::nx<int, 3>,
|
|
|
|
double, std::string>()) {
|
|
|
|
if (p2.valid()) {
|
|
|
|
i2.push_back(std::move(a));
|
|
|
|
}
|
2021-02-28 19:22:54 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-12-26 00:46:42 +01:00
|
|
|
std::vector<X> expected = {{3, 4, "y"}};
|
2021-02-21 02:49:23 +01:00
|
|
|
CHECK_EQ(i, expected);
|
2024-02-17 00:55:36 +01:00
|
|
|
if (!ss::setup<Ts...>::throw_on_error) {
|
|
|
|
CHECK_EQ(i2, expected);
|
|
|
|
}
|
2020-12-26 00:46:42 +01:00
|
|
|
}
|
2020-12-10 19:26:56 +01:00
|
|
|
|
2020-12-26 00:46:42 +01:00
|
|
|
{
|
2023-07-29 20:41:31 +02:00
|
|
|
unique_file_name empty_f{"test_parser"};
|
2020-12-26 00:46:42 +01:00
|
|
|
std::vector<X> empty_data = {};
|
2021-02-28 19:22:54 +01:00
|
|
|
|
2020-12-26 00:46:42 +01:00
|
|
|
make_and_write(empty_f.name, empty_data);
|
2020-12-10 19:26:56 +01:00
|
|
|
|
2024-02-17 00:55:36 +01:00
|
|
|
auto [p, _] = make_parser<buffer_mode, Ts...>(empty_f.name, ",");
|
2020-12-26 00:46:42 +01:00
|
|
|
std::vector<X> i;
|
2020-12-10 19:26:56 +01:00
|
|
|
|
2024-02-17 00:55:36 +01:00
|
|
|
auto [p2, __] = make_parser<buffer_mode, Ts...>(empty_f.name, ",");
|
2021-02-28 19:22:54 +01:00
|
|
|
std::vector<X> i2;
|
|
|
|
|
2020-12-26 00:46:42 +01:00
|
|
|
while (!p.eof()) {
|
2024-02-17 00:55:36 +01:00
|
|
|
i.push_back(p.template get_next<X>());
|
2020-12-10 19:26:56 +01:00
|
|
|
}
|
2021-02-28 19:22:54 +01:00
|
|
|
|
2024-02-17 00:55:36 +01:00
|
|
|
for (auto&& a : p2.template iterate<X>()) {
|
2021-02-28 19:22:54 +01:00
|
|
|
i2.push_back(std::move(a));
|
|
|
|
}
|
|
|
|
|
2020-12-26 00:46:42 +01:00
|
|
|
CHECK(i.empty());
|
2021-02-28 19:22:54 +01:00
|
|
|
CHECK(i2.empty());
|
2020-12-26 00:46:42 +01:00
|
|
|
}
|
2020-12-10 19:26:56 +01:00
|
|
|
}
|
|
|
|
|
2023-08-04 16:48:07 +02:00
|
|
|
// Runs test_various_cases for each visible combination of input mode
// (file = false, buffer = true) and error-handling setup.
TEST_CASE("parser test various cases") {
    // File mode.
    test_various_cases<false>();
    test_various_cases<false, ss::string_error>();
    test_various_cases<false, ss::throw_on_error>();

    // Buffer mode.
    test_various_cases<true>();
    test_various_cases<true, ss::string_error>();
    test_various_cases<true, ss::throw_on_error>();
}
|
|
|
|
|
2020-12-26 00:36:08 +01:00
|
|
|
using test_tuple = std::tuple<double, char, double>;
|
|
|
|
/// Plain (int, double, char) record used by the composite conversion tests.
struct test_struct {
    int i;
    double d;
    char c;

    /// Tuple of mutable references to the members, in declaration order.
    std::tuple<int&, double&, char&> tied() {
        return std::tie(i, d, c);
    }
};
|
|
|
|
|
2023-07-29 20:41:31 +02:00
|
|
|
/// No-op callback accepting a `test_struct`; it is passed to
/// `or_else<test_struct>(...)` in the composite conversion test.
static inline void expect_test_struct(const test_struct&) {
    // Intentionally empty.
}
|
2020-12-26 00:36:08 +01:00
|
|
|
|
2024-02-17 00:55:36 +01:00
|
|
|
template <bool buffer_mode, typename... Ts>
|
2023-08-04 16:48:07 +02:00
|
|
|
void test_composite_conversion() {
|
2023-07-29 20:41:31 +02:00
|
|
|
unique_file_name f{"test_parser"};
|
2020-12-26 00:46:42 +01:00
|
|
|
{
|
|
|
|
std::ofstream out{f.name};
|
2021-01-01 23:52:14 +01:00
|
|
|
for (auto& i :
|
|
|
|
{"10,a,11.1", "10,20,11.1", "junk", "10,11.1", "1,11.1,a", "junk",
|
2021-01-03 17:27:21 +01:00
|
|
|
"10,junk", "11,junk", "10,11.1,c", "10,20", "10,22.2,f"}) {
|
2020-12-26 00:46:42 +01:00
|
|
|
out << i << std::endl;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2024-02-17 00:55:36 +01:00
|
|
|
auto [p, _] = make_parser<buffer_mode, Ts...>(f.name, ",");
|
2020-12-26 00:46:42 +01:00
|
|
|
auto fail = [] { FAIL(""); };
|
|
|
|
auto expect_error = [](auto error) { CHECK(!error.empty()); };
|
2023-08-04 16:48:07 +02:00
|
|
|
auto ignore_error = [] {};
|
2020-12-26 00:46:42 +01:00
|
|
|
|
|
|
|
REQUIRE(p.valid());
|
2021-02-20 15:53:18 +01:00
|
|
|
REQUIRE_FALSE(p.eof());
|
2020-12-26 00:46:42 +01:00
|
|
|
|
|
|
|
{
|
|
|
|
constexpr static auto expectedData = std::tuple{10, 'a', 11.1};
|
|
|
|
|
|
|
|
auto [d1, d2, d3, d4] =
|
2023-08-04 16:48:07 +02:00
|
|
|
p.template try_next<int, int, double>(fail)
|
|
|
|
.template or_else<test_struct>(fail)
|
|
|
|
.template or_else<int, char, double>(
|
2023-07-29 16:51:34 +02:00
|
|
|
[&](auto&& data) { CHECK_EQ(data, expectedData); })
|
2020-12-26 00:46:42 +01:00
|
|
|
.on_error(fail)
|
2023-08-04 16:48:07 +02:00
|
|
|
.template or_else<test_tuple>(fail)
|
2020-12-26 00:46:42 +01:00
|
|
|
.values();
|
2020-12-26 00:36:08 +01:00
|
|
|
|
2020-12-26 00:46:42 +01:00
|
|
|
REQUIRE(p.valid());
|
2021-02-20 15:53:18 +01:00
|
|
|
REQUIRE_FALSE(d1);
|
|
|
|
REQUIRE_FALSE(d2);
|
2020-12-26 00:46:42 +01:00
|
|
|
REQUIRE(d3);
|
2021-02-20 15:53:18 +01:00
|
|
|
REQUIRE_FALSE(d4);
|
|
|
|
CHECK_EQ(*d3, expectedData);
|
2020-12-26 00:46:42 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
{
|
|
|
|
REQUIRE(!p.eof());
|
|
|
|
constexpr static auto expectedData = std::tuple{10, 20, 11.1};
|
|
|
|
|
|
|
|
auto [d1, d2, d3, d4] =
|
2023-08-04 16:48:07 +02:00
|
|
|
p.template try_next<int, int, double>(
|
|
|
|
[&](auto& i1, auto i2, double d) {
|
|
|
|
CHECK_EQ(std::tie(i1, i2, d), expectedData);
|
|
|
|
})
|
2020-12-26 00:46:42 +01:00
|
|
|
.on_error(fail)
|
2023-08-04 16:48:07 +02:00
|
|
|
.template or_object<test_struct, int, double, char>(fail)
|
2020-12-26 00:46:42 +01:00
|
|
|
.on_error(fail)
|
2023-08-04 16:48:07 +02:00
|
|
|
.template or_else<test_tuple>(fail)
|
2020-12-26 00:46:42 +01:00
|
|
|
.on_error(fail)
|
2023-08-04 16:48:07 +02:00
|
|
|
.template or_else<int, char, double>(fail)
|
2020-12-26 00:46:42 +01:00
|
|
|
.values();
|
2020-12-26 00:36:08 +01:00
|
|
|
|
|
|
|
REQUIRE(p.valid());
|
2020-12-26 00:46:42 +01:00
|
|
|
REQUIRE(d1);
|
2021-02-20 15:53:18 +01:00
|
|
|
REQUIRE_FALSE(d2);
|
|
|
|
REQUIRE_FALSE(d3);
|
|
|
|
REQUIRE_FALSE(d4);
|
2021-02-21 02:49:23 +01:00
|
|
|
CHECK_EQ(*d1, expectedData);
|
2020-12-26 00:46:42 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
{
|
2020-12-26 00:36:08 +01:00
|
|
|
REQUIRE(!p.eof());
|
|
|
|
|
2020-12-26 00:46:42 +01:00
|
|
|
auto [d1, d2, d3, d4, d5] =
|
2023-08-04 16:48:07 +02:00
|
|
|
p.template try_object<test_struct, int, double, char>(fail)
|
2020-12-26 00:46:42 +01:00
|
|
|
.on_error(expect_error)
|
2023-08-04 16:48:07 +02:00
|
|
|
.template or_else<int, char, char>(fail)
|
|
|
|
.template or_else<test_struct>(fail)
|
|
|
|
.template or_else<test_tuple>(fail)
|
|
|
|
.template or_else<int, char, double>(fail)
|
2020-12-26 00:46:42 +01:00
|
|
|
.values();
|
|
|
|
|
2021-02-20 15:53:18 +01:00
|
|
|
REQUIRE_FALSE(p.valid());
|
|
|
|
REQUIRE_FALSE(d1);
|
|
|
|
REQUIRE_FALSE(d2);
|
|
|
|
REQUIRE_FALSE(d3);
|
|
|
|
REQUIRE_FALSE(d4);
|
|
|
|
REQUIRE_FALSE(d5);
|
2020-12-26 00:46:42 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
{
|
|
|
|
REQUIRE(!p.eof());
|
2020-12-26 00:36:08 +01:00
|
|
|
|
2020-12-26 00:46:42 +01:00
|
|
|
auto [d1, d2] =
|
2023-08-04 16:48:07 +02:00
|
|
|
p.template try_next<int, double>([](auto& i, auto& d) {
|
2021-02-21 02:49:23 +01:00
|
|
|
REQUIRE_EQ(std::tie(i, d), std::tuple{10, 11.1});
|
2020-12-26 00:46:42 +01:00
|
|
|
})
|
2023-08-04 16:48:07 +02:00
|
|
|
.template or_else<int, double>([](auto&, auto&) { FAIL(""); })
|
2020-12-26 00:46:42 +01:00
|
|
|
.values();
|
2020-12-26 00:36:08 +01:00
|
|
|
|
2020-12-26 00:46:42 +01:00
|
|
|
REQUIRE(p.valid());
|
|
|
|
REQUIRE(d1);
|
2021-02-20 15:53:18 +01:00
|
|
|
REQUIRE_FALSE(d2);
|
2020-12-26 00:46:42 +01:00
|
|
|
}
|
2020-12-26 00:36:08 +01:00
|
|
|
|
2020-12-26 00:46:42 +01:00
|
|
|
{
|
|
|
|
REQUIRE(!p.eof());
|
2020-12-26 00:36:08 +01:00
|
|
|
|
2023-08-04 16:48:07 +02:00
|
|
|
auto [d1, d2] =
|
|
|
|
p.template try_next<int, double>([](auto&, auto&) { FAIL(""); })
|
|
|
|
.template or_else<test_struct>(expect_test_struct)
|
|
|
|
.values();
|
2020-12-26 00:36:08 +01:00
|
|
|
|
2020-12-26 00:46:42 +01:00
|
|
|
REQUIRE(p.valid());
|
2021-02-20 15:53:18 +01:00
|
|
|
REQUIRE_FALSE(d1);
|
2020-12-26 00:46:42 +01:00
|
|
|
REQUIRE(d2);
|
2021-02-20 15:53:18 +01:00
|
|
|
CHECK_EQ(d2->tied(), std::tuple{1, 11.1, 'a'});
|
2020-12-26 00:46:42 +01:00
|
|
|
}
|
2020-12-26 00:36:08 +01:00
|
|
|
|
2020-12-26 00:46:42 +01:00
|
|
|
{
|
|
|
|
REQUIRE(!p.eof());
|
2020-12-26 00:36:08 +01:00
|
|
|
|
2020-12-26 00:46:42 +01:00
|
|
|
auto [d1, d2, d3, d4, d5] =
|
2023-08-04 16:48:07 +02:00
|
|
|
p.template try_next<int, int, double>(fail)
|
|
|
|
.template or_object<test_struct, int, double, char>()
|
|
|
|
.template or_else<test_struct>(expect_test_struct)
|
|
|
|
.template or_else<test_tuple>(fail)
|
|
|
|
.template or_else<std::tuple<int, double>>(fail)
|
|
|
|
.on_error(ignore_error)
|
2020-12-26 00:46:42 +01:00
|
|
|
.on_error(expect_error)
|
|
|
|
.values();
|
|
|
|
|
2021-02-20 15:53:18 +01:00
|
|
|
REQUIRE_FALSE(p.valid());
|
|
|
|
REQUIRE_FALSE(d1);
|
|
|
|
REQUIRE_FALSE(d2);
|
|
|
|
REQUIRE_FALSE(d3);
|
|
|
|
REQUIRE_FALSE(d4);
|
|
|
|
REQUIRE_FALSE(d5);
|
2020-12-26 00:46:42 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
{
|
|
|
|
REQUIRE(!p.eof());
|
2020-12-26 00:36:08 +01:00
|
|
|
|
2023-08-04 16:48:07 +02:00
|
|
|
auto [d1, d2] =
|
|
|
|
p.template try_next<int, std::optional<int>>()
|
|
|
|
.on_error(ignore_error)
|
|
|
|
.on_error(fail)
|
|
|
|
.template or_else<std::tuple<int, std::string>>(fail)
|
|
|
|
.on_error(ignore_error)
|
|
|
|
.on_error(fail)
|
|
|
|
.on_error(ignore_error)
|
|
|
|
.values();
|
2020-12-26 00:36:08 +01:00
|
|
|
|
2020-12-26 00:46:42 +01:00
|
|
|
REQUIRE(p.valid());
|
|
|
|
REQUIRE(d1);
|
2021-02-20 15:53:18 +01:00
|
|
|
REQUIRE_FALSE(d2);
|
|
|
|
CHECK_EQ(*d1, std::tuple{10, std::nullopt});
|
2020-12-26 00:46:42 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
{
|
2021-02-20 15:53:18 +01:00
|
|
|
REQUIRE_FALSE(p.eof());
|
2020-12-26 00:46:42 +01:00
|
|
|
|
2023-08-04 16:48:07 +02:00
|
|
|
auto [d1, d2] =
|
|
|
|
p.template try_next<int, std::variant<int, std::string>>()
|
|
|
|
.on_error(fail)
|
|
|
|
.template or_else<std::tuple<int, std::string>>(fail)
|
|
|
|
.on_error(fail)
|
|
|
|
.values();
|
2020-12-26 00:46:42 +01:00
|
|
|
|
|
|
|
REQUIRE(p.valid());
|
|
|
|
REQUIRE(d1);
|
2021-02-20 15:53:18 +01:00
|
|
|
REQUIRE_FALSE(d2);
|
|
|
|
CHECK_EQ(*d1, std::tuple{11, std::variant<int, std::string>{"junk"}});
|
2020-12-26 00:46:42 +01:00
|
|
|
}
|
2021-01-01 23:52:14 +01:00
|
|
|
|
|
|
|
{
|
|
|
|
REQUIRE(!p.eof());
|
|
|
|
|
2023-08-04 16:48:07 +02:00
|
|
|
auto [d1, d2] = p.template try_object<test_struct, int, double, char>()
|
|
|
|
.template or_else<int>(fail)
|
2021-01-01 23:52:14 +01:00
|
|
|
.values();
|
|
|
|
REQUIRE(p.valid());
|
|
|
|
REQUIRE(d1);
|
2021-02-20 15:53:18 +01:00
|
|
|
REQUIRE_FALSE(d2);
|
|
|
|
CHECK_EQ(d1->tied(), std::tuple{10, 11.1, 'c'});
|
2021-01-01 23:52:14 +01:00
|
|
|
}
|
|
|
|
|
2021-01-03 17:27:21 +01:00
|
|
|
{
|
2021-02-20 15:53:18 +01:00
|
|
|
REQUIRE_FALSE(p.eof());
|
2021-01-03 17:27:21 +01:00
|
|
|
|
|
|
|
auto [d1, d2, d3, d4] =
|
2023-08-04 16:48:07 +02:00
|
|
|
p.template try_next<int, int>([] { return false; })
|
|
|
|
.template or_else<int, double>([](auto&) { return false; })
|
|
|
|
.template or_else<int, int>()
|
|
|
|
.template or_else<int, int>(fail)
|
2021-01-03 17:27:21 +01:00
|
|
|
.values();
|
|
|
|
|
|
|
|
REQUIRE(p.valid());
|
2021-02-20 15:53:18 +01:00
|
|
|
REQUIRE_FALSE(d1);
|
|
|
|
REQUIRE_FALSE(d2);
|
2021-01-03 17:27:21 +01:00
|
|
|
REQUIRE(d3);
|
2021-02-20 15:53:18 +01:00
|
|
|
REQUIRE_FALSE(d4);
|
|
|
|
CHECK_EQ(d3.value(), std::tuple{10, 20});
|
2021-01-03 17:27:21 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
{
|
|
|
|
REQUIRE(!p.eof());
|
|
|
|
|
|
|
|
auto [d1, d2, d3, d4] =
|
2023-08-04 16:48:07 +02:00
|
|
|
p.template try_object<test_struct, int, double, char>(
|
|
|
|
[] { return false; })
|
|
|
|
.template or_else<int, double>([](auto&) { return false; })
|
|
|
|
.template or_object<test_struct, int, double, char>()
|
|
|
|
.template or_else<int, int>(fail)
|
2021-01-03 17:27:21 +01:00
|
|
|
.values();
|
|
|
|
|
|
|
|
REQUIRE(p.valid());
|
2021-02-20 15:53:18 +01:00
|
|
|
REQUIRE_FALSE(d1);
|
|
|
|
REQUIRE_FALSE(d2);
|
2021-01-03 17:27:21 +01:00
|
|
|
REQUIRE(d3);
|
2021-02-20 15:53:18 +01:00
|
|
|
REQUIRE_FALSE(d4);
|
|
|
|
CHECK_EQ(d3->tied(), std::tuple{10, 22.2, 'f'});
|
2021-01-03 17:27:21 +01:00
|
|
|
}
|
|
|
|
|
2021-01-01 23:52:14 +01:00
|
|
|
CHECK(p.eof());
|
2020-12-26 00:36:08 +01:00
|
|
|
}
|
|
|
|
|
2023-08-04 16:48:07 +02:00
|
|
|
// various scenarios
|
|
|
|
TEST_CASE("parser test composite conversion") {
|
2024-02-17 00:55:36 +01:00
|
|
|
test_composite_conversion<false, ss::string_error>();
|
|
|
|
test_composite_conversion<true, ss::string_error>();
|
2023-08-04 16:48:07 +02:00
|
|
|
}
|
|
|
|
|
2020-12-10 19:26:56 +01:00
|
|
|
/// Minimal move-only string that owns a `new[]`-allocated character buffer.
/// Used to verify that parsed values are moved, never copied.
struct my_string {
    // Owned buffer; nullptr when empty or moved-from.
    char* data{nullptr};

    my_string() = default;

    ~my_string() {
        delete[] data;
    }

    // make sure no object is copied
    my_string(const my_string&) = delete;
    my_string& operator=(const my_string&) = delete;

    /// Takes over `other`'s buffer and leaves `other` empty.
    my_string(my_string&& other) noexcept : data{other.data} {
        other.data = nullptr;
    }

    /// Releases the current buffer, takes over `other`'s buffer and leaves
    /// `other` empty. Self-assignment is a no-op.
    my_string& operator=(my_string&& other) noexcept {
        if (this != &other) {
            // Free what we own first, otherwise it would leak.
            delete[] data;
            data = other.data;
            // Without this both objects would delete[] the same buffer.
            other.data = nullptr;
        }
        return *this;
    }
};
|
|
|
|
|
|
|
|
template <>
|
|
|
|
inline bool ss::extract(const char* begin, const char* end, my_string& s) {
|
2020-12-26 00:46:42 +01:00
|
|
|
size_t size = end - begin;
|
|
|
|
s.data = new char[size + 1];
|
|
|
|
strncpy(s.data, begin, size);
|
|
|
|
s.data[size] = '\0';
|
|
|
|
return true;
|
2020-12-10 19:26:56 +01:00
|
|
|
}
|
|
|
|
|
2020-12-26 00:36:08 +01:00
|
|
|
struct xyz {
|
2020-12-26 00:46:42 +01:00
|
|
|
my_string x;
|
|
|
|
my_string y;
|
|
|
|
my_string z;
|
2022-03-27 21:04:02 +02:00
|
|
|
auto tied() {
|
|
|
|
return std::tie(x, y, z);
|
|
|
|
}
|
2020-12-10 19:26:56 +01:00
|
|
|
};
|
|
|
|
|
2024-02-17 00:55:36 +01:00
|
|
|
template <bool buffer_mode, typename... Ts>
|
2023-08-04 16:48:07 +02:00
|
|
|
void test_moving_of_parsed_composite_values() {
|
2020-12-26 00:46:42 +01:00
|
|
|
// to compile is enough
|
|
|
|
return;
|
2023-08-04 16:48:07 +02:00
|
|
|
ss::parser<Ts...> p{"", ""};
|
|
|
|
p.template try_next<my_string, my_string, my_string>()
|
|
|
|
.template or_else<my_string, my_string, my_string, my_string>(
|
|
|
|
[](auto&&) {})
|
|
|
|
.template or_else<my_string>([](auto&) {})
|
|
|
|
.template or_else<xyz>([](auto&&) {})
|
|
|
|
.template or_object<xyz, my_string, my_string, my_string>([](auto&&) {})
|
|
|
|
.template or_else<std::tuple<my_string, my_string, my_string>>(
|
2020-12-26 00:46:42 +01:00
|
|
|
[](auto&, auto&, auto&) {});
|
2020-12-26 00:36:08 +01:00
|
|
|
}
|
2020-12-27 16:51:59 +01:00
|
|
|
|
2023-08-04 16:48:07 +02:00
|
|
|
// Instantiates the move-only conversion check for both input modes, with
// the default setup and with string_error.
TEST_CASE("parser test the moving of parsed composite values") {
    // File mode.
    test_moving_of_parsed_composite_values<false>();
    test_moving_of_parsed_composite_values<false, ss::string_error>();

    // Buffer mode.
    test_moving_of_parsed_composite_values<true>();
    test_moving_of_parsed_composite_values<true, ss::string_error>();
}
|
|
|
|
|
2021-02-07 21:24:41 +01:00
|
|
|
// With string_error, a failed conversion must invalidate the parser and
// leave a non-empty error message — in file mode and in buffer mode.
TEST_CASE("parser test error mode") {
    unique_file_name f{"test_parser"};
    {
        // Two lines that cannot be converted to int.
        std::ofstream out{f.name};
        out << "junk" << std::endl;
        out << "junk" << std::endl;
    }

    // File mode.
    {
        auto [parser, _] = make_parser<false, ss::string_error>(f.name, ",");

        REQUIRE_FALSE(parser.eof());
        parser.get_next<int>();
        CHECK_FALSE(parser.valid());
        CHECK_FALSE(parser.error_msg().empty());
    }

    // Buffer mode.
    {
        auto [parser, _] = make_parser<true, ss::string_error>(f.name, ",");

        REQUIRE_FALSE(parser.eof());
        parser.get_next<int>();
        CHECK_FALSE(parser.valid());
        CHECK_FALSE(parser.error_msg().empty());
    }
}
|
2021-01-31 23:08:46 +01:00
|
|
|
|
2023-08-04 16:48:07 +02:00
|
|
|
// With throw_on_error, a failed conversion must throw a std::exception
// carrying a non-empty message — in file mode and in buffer mode.
TEST_CASE("parser throw on error mode") {
    unique_file_name f{"test_parser"};
    {
        // Two lines that cannot be converted to int.
        std::ofstream out{f.name};
        out << "junk" << std::endl;
        out << "junk" << std::endl;
    }

    // File mode.
    {
        auto [parser, _] = make_parser<false, ss::throw_on_error>(f.name, ",");

        REQUIRE_FALSE(parser.eof());
        try {
            parser.get_next<int>();
            FAIL("Expected exception...");
        } catch (const std::exception& error) {
            CHECK_FALSE(std::string{error.what()}.empty());
        }
    }

    // Buffer mode.
    {
        auto [parser, _] = make_parser<true, ss::throw_on_error>(f.name, ",");

        REQUIRE_FALSE(parser.eof());
        try {
            parser.get_next<int>();
            FAIL("Expected exception...");
        } catch (const std::exception& error) {
            CHECK_FALSE(std::string{error.what()}.empty());
        }
    }
}
|
|
|
|
|
2023-07-29 20:41:31 +02:00
|
|
|
// Returns `s` without its first and last character when `s` starts with a
// double quote and is at least two characters long; otherwise returns `s`
// unchanged.
//
// The length check matters: for a string consisting of a single '"' the
// "skip first, drop last" range would be [end, begin), which is not a valid
// iterator range. Such a string is returned as-is.
static inline std::string no_quote(const std::string& s) {
    if (s.size() < 2 || s.front() != '"') {
        return s;
    }
    // Drop exactly one character from each end.
    return s.substr(1, s.size() - 2);
}
|
|
|
|
|
2024-02-17 17:43:33 +01:00
|
|
|
template <bool buffer_mode, typename... Ts>
|
2023-08-05 13:30:14 +02:00
|
|
|
void test_quote_multiline() {
|
2023-07-29 20:41:31 +02:00
|
|
|
unique_file_name f{"test_parser"};
|
2021-02-23 01:02:15 +01:00
|
|
|
std::vector<X> data = {{1, 2, "\"x\r\nx\nx\""},
|
|
|
|
{3, 4, "\"y\ny\r\ny\""},
|
|
|
|
{5, 6, "\"z\nz\""},
|
|
|
|
{7, 8, "\"u\"\"\""},
|
|
|
|
{9, 10, "v"},
|
|
|
|
{11, 12, "\"w\n\""}};
|
|
|
|
for (auto& [_, __, s] : data) {
|
|
|
|
update_if_crlf(s);
|
|
|
|
}
|
|
|
|
|
2021-01-31 23:08:46 +01:00
|
|
|
make_and_write(f.name, data);
|
|
|
|
for (auto& [_, __, s] : data) {
|
|
|
|
s = no_quote(s);
|
|
|
|
if (s[0] == 'u') {
|
|
|
|
s = "u\"";
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2024-02-17 17:43:33 +01:00
|
|
|
auto [p, buff] =
|
|
|
|
make_parser<buffer_mode, ss::multiline, ss::quote<'"'>, Ts...>(f.name,
|
|
|
|
",");
|
|
|
|
|
2021-01-31 23:08:46 +01:00
|
|
|
std::vector<X> i;
|
|
|
|
|
|
|
|
while (!p.eof()) {
|
2023-08-05 13:30:14 +02:00
|
|
|
auto a = p.template get_next<int, double, std::string>();
|
2021-01-31 23:08:46 +01:00
|
|
|
i.emplace_back(ss::to_object<X>(a));
|
|
|
|
}
|
|
|
|
|
2021-02-23 01:02:15 +01:00
|
|
|
for (auto& [_, __, s] : i) {
|
|
|
|
update_if_crlf(s);
|
|
|
|
}
|
2021-02-20 15:53:18 +01:00
|
|
|
CHECK_EQ(i, data);
|
2021-02-13 01:14:25 +01:00
|
|
|
|
2024-02-17 17:43:33 +01:00
|
|
|
auto [p_no_multiline, __] =
|
|
|
|
make_parser<buffer_mode, ss::quote<'"'>, Ts...>(f.name, ",");
|
2021-02-13 01:14:25 +01:00
|
|
|
while (!p.eof()) {
|
2024-02-17 17:43:33 +01:00
|
|
|
auto command = [&p_no_multiline = p_no_multiline] {
|
2023-08-05 13:30:14 +02:00
|
|
|
p_no_multiline.template get_next<int, double, std::string>();
|
|
|
|
};
|
|
|
|
expect_error_on_command(p_no_multiline, command);
|
2021-02-13 01:14:25 +01:00
|
|
|
}
|
2021-01-31 23:08:46 +01:00
|
|
|
}
|
|
|
|
|
2023-08-05 13:30:14 +02:00
|
|
|
// Runs test_quote_multiline for buffer_mode false and true, each with the
// default setup, ss::string_error and ss::throw_on_error.
TEST_CASE("parser test csv on multiple lines with quotes") {
    // buffer_mode == false
    test_quote_multiline<false>();
    test_quote_multiline<false, ss::string_error>();
    test_quote_multiline<false, ss::throw_on_error>();

    // buffer_mode == true
    test_quote_multiline<true>();
    test_quote_multiline<true, ss::string_error>();
    test_quote_multiline<true, ss::throw_on_error>();
}
|
|
|
|
|
2023-07-29 20:41:31 +02:00
|
|
|
// Removes every backslash from `s` in place and returns a copy of the
// stripped string. Note that the argument itself is modified.
static inline std::string no_escape(std::string& s) {
    const auto stripped_end = std::remove(s.begin(), s.end(), '\\');
    s.erase(stripped_end, s.end());
    return s;
}
|
|
|
|
|
2023-08-05 18:11:13 +02:00
|
|
|
template <typename... Ts>
|
|
|
|
void test_escape_multiline() {
|
2023-07-29 20:41:31 +02:00
|
|
|
unique_file_name f{"test_parser"};
|
2021-02-23 01:02:15 +01:00
|
|
|
std::vector<X> data = {{1, 2, "x\\\nx\\\r\nx"},
|
|
|
|
{5, 6, "z\\\nz\\\nz"},
|
|
|
|
{7, 8, "u"},
|
|
|
|
{3, 4, "y\\\ny\\\ny"},
|
|
|
|
{9, 10, "v\\\\"},
|
|
|
|
{11, 12, "w\\\n"}};
|
|
|
|
for (auto& [_, __, s] : data) {
|
|
|
|
update_if_crlf(s);
|
|
|
|
}
|
2021-01-31 23:08:46 +01:00
|
|
|
|
|
|
|
make_and_write(f.name, data);
|
|
|
|
for (auto& [_, __, s] : data) {
|
|
|
|
s = no_escape(s);
|
|
|
|
if (s == "v") {
|
|
|
|
s = "v\\";
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-08-05 18:11:13 +02:00
|
|
|
ss::parser<ss::multiline, ss::escape<'\\'>, Ts...> p{f.name, ","};
|
2021-01-31 23:08:46 +01:00
|
|
|
std::vector<X> i;
|
|
|
|
|
|
|
|
while (!p.eof()) {
|
2023-08-05 18:11:13 +02:00
|
|
|
auto a = p.template get_next<int, double, std::string>();
|
2021-01-31 23:08:46 +01:00
|
|
|
i.emplace_back(ss::to_object<X>(a));
|
|
|
|
}
|
|
|
|
|
2021-02-23 01:02:15 +01:00
|
|
|
for (auto& [_, __, s] : i) {
|
|
|
|
update_if_crlf(s);
|
|
|
|
}
|
2021-02-20 15:53:18 +01:00
|
|
|
CHECK_EQ(i, data);
|
2021-02-13 01:14:25 +01:00
|
|
|
|
2023-08-05 18:11:13 +02:00
|
|
|
ss::parser<ss::escape<'\\'>, Ts...> p_no_multiline{f.name, ","};
|
2021-02-13 01:14:25 +01:00
|
|
|
while (!p.eof()) {
|
2023-08-05 18:11:13 +02:00
|
|
|
auto command = [&] {
|
|
|
|
auto a =
|
|
|
|
p_no_multiline.template get_next<int, double, std::string>();
|
|
|
|
};
|
|
|
|
expect_error_on_command(p_no_multiline, command);
|
2021-02-20 15:53:18 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-08-05 18:11:13 +02:00
|
|
|
// Runs test_escape_multiline with the default setup, with ss::string_error
// and with ss::throw_on_error.
TEST_CASE("parser test csv on multiple lines with escapes") {
    test_escape_multiline();                      // default error handling
    test_escape_multiline<ss::string_error>();    // error message mode
    test_escape_multiline<ss::throw_on_error>();  // exception mode
}
|
|
|
|
|
|
|
|
template <typename... Ts>
|
|
|
|
void test_quote_escape_multiline() {
|
2023-07-29 20:41:31 +02:00
|
|
|
unique_file_name f{"test_parser"};
|
2021-02-20 15:53:18 +01:00
|
|
|
{
|
|
|
|
std::ofstream out{f.name};
|
2021-02-21 02:49:23 +01:00
|
|
|
out << "1,2,\"just\\\n\nstrings\"" << std::endl;
|
2021-02-23 01:02:15 +01:00
|
|
|
#ifndef _WIN32
|
|
|
|
out << "3,4,\"just\r\nsome\\\r\n\n\\\nstrings\"" << std::endl;
|
|
|
|
out << "5,6,\"just\\\n\\\r\n\r\n\nstrings" << std::endl;
|
|
|
|
#else
|
2021-02-21 02:49:23 +01:00
|
|
|
out << "3,4,\"just\nsome\\\n\n\\\nstrings\"" << std::endl;
|
|
|
|
out << "5,6,\"just\\\n\\\n\n\nstrings" << std::endl;
|
2021-02-23 01:02:15 +01:00
|
|
|
#endif
|
2021-02-21 02:49:23 +01:00
|
|
|
out << "7,8,\"just strings\"" << std::endl;
|
|
|
|
out << "9,10,just strings" << std::endl;
|
2021-02-13 01:14:25 +01:00
|
|
|
}
|
2023-08-05 18:11:13 +02:00
|
|
|
size_t bad_lines = 1;
|
|
|
|
auto num_errors = 0;
|
2021-02-20 15:53:18 +01:00
|
|
|
|
2023-08-05 18:11:13 +02:00
|
|
|
ss::parser<ss::multiline, ss::escape<'\\'>, ss::quote<'"'>, Ts...> p{
|
|
|
|
f.name};
|
2021-02-20 15:53:18 +01:00
|
|
|
std::vector<X> i;
|
|
|
|
|
|
|
|
while (!p.eof()) {
|
2023-08-05 18:11:13 +02:00
|
|
|
try {
|
|
|
|
auto a = p.template get_next<int, double, std::string>();
|
|
|
|
if (p.valid()) {
|
|
|
|
i.emplace_back(ss::to_object<X>(a));
|
|
|
|
} else {
|
|
|
|
++num_errors;
|
|
|
|
}
|
|
|
|
} catch (const std::exception& e) {
|
|
|
|
++num_errors;
|
2021-02-20 15:53:18 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-08-05 18:11:13 +02:00
|
|
|
CHECK(bad_lines == num_errors);
|
|
|
|
|
2021-02-20 15:53:18 +01:00
|
|
|
std::vector<X> data = {{1, 2, "just\n\nstrings"},
|
2021-02-23 01:02:15 +01:00
|
|
|
#ifndef _WIN32
|
|
|
|
{3, 4, "just\r\nsome\r\n\n\nstrings"},
|
|
|
|
#else
|
2021-02-20 15:53:18 +01:00
|
|
|
{3, 4, "just\nsome\n\n\nstrings"},
|
2021-02-23 01:02:15 +01:00
|
|
|
#endif
|
2021-02-20 15:53:18 +01:00
|
|
|
{9, 10, "just strings"}};
|
|
|
|
|
2021-02-23 01:02:15 +01:00
|
|
|
for (auto& [_, __, s] : i) {
|
|
|
|
update_if_crlf(s);
|
|
|
|
}
|
2021-02-20 15:53:18 +01:00
|
|
|
CHECK_EQ(i, data);
|
|
|
|
}
|
|
|
|
|
2023-08-05 18:11:13 +02:00
|
|
|
// Runs test_quote_escape_multiline with the default setup, with
// ss::string_error and with ss::throw_on_error.
TEST_CASE("parser test csv on multiple lines with quotes and escapes") {
    test_quote_escape_multiline();                      // default error handling
    test_quote_escape_multiline<ss::string_error>();    // error message mode
    test_quote_escape_multiline<ss::throw_on_error>();  // exception mode
}
|
|
|
|
|
|
|
|
template <typename... Ts>
|
|
|
|
void test_multiline_restricted() {
|
2023-07-29 20:41:31 +02:00
|
|
|
unique_file_name f{"test_parser"};
|
2021-02-20 15:53:18 +01:00
|
|
|
{
|
|
|
|
std::ofstream out{f.name};
|
2021-02-21 02:49:23 +01:00
|
|
|
out << "1,2,\"just\n\nstrings\"" << std::endl;
|
2021-02-23 01:02:15 +01:00
|
|
|
#ifndef _WIN32
|
|
|
|
out << "3,4,\"ju\n\r\n\nnk\"" << std::endl;
|
|
|
|
out << "5,6,just\\\n\\\r\nstrings" << std::endl;
|
|
|
|
#else
|
2021-02-21 02:49:23 +01:00
|
|
|
out << "3,4,\"ju\n\n\nnk\"" << std::endl;
|
|
|
|
out << "5,6,just\\\n\\\nstrings" << std::endl;
|
2021-02-23 01:02:15 +01:00
|
|
|
#endif
|
2021-02-21 02:49:23 +01:00
|
|
|
out << "7,8,ju\\\n\\\n\\\nnk" << std::endl;
|
|
|
|
out << "9,10,\"just\\\n\nstrings\"" << std::endl;
|
2021-02-20 15:53:18 +01:00
|
|
|
out << "11,12,\"ju\\\n|\n\n\n\n\nk\"" << std::endl;
|
2021-02-21 02:49:23 +01:00
|
|
|
out << "13,14,\"ju\\\n\\\n15,16\"\\\n\\\\\n\nnk\"" << std::endl;
|
|
|
|
out << "17,18,\"ju\\\n\\\n\\\n\\\\\n\nnk\"" << std::endl;
|
2021-02-20 15:53:18 +01:00
|
|
|
out << "19,20,just strings" << std::endl;
|
|
|
|
}
|
2023-08-05 18:11:13 +02:00
|
|
|
auto bad_lines = 15;
|
|
|
|
auto num_errors = 0;
|
2021-02-20 15:53:18 +01:00
|
|
|
|
2023-08-05 18:11:13 +02:00
|
|
|
ss::parser<ss::multiline_restricted<2>, ss::quote<'"'>, ss::escape<'\\'>,
|
|
|
|
Ts...>
|
2021-02-20 15:53:18 +01:00
|
|
|
p{f.name, ","};
|
|
|
|
std::vector<X> i;
|
|
|
|
|
|
|
|
while (!p.eof()) {
|
2023-08-05 18:11:13 +02:00
|
|
|
try {
|
|
|
|
auto a = p.template get_next<int, double, std::string>();
|
|
|
|
if (p.valid()) {
|
|
|
|
i.emplace_back(ss::to_object<X>(a));
|
|
|
|
} else {
|
|
|
|
++num_errors;
|
|
|
|
}
|
|
|
|
} catch (const std::exception& e) {
|
|
|
|
++num_errors;
|
2021-02-20 15:53:18 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-08-05 18:11:13 +02:00
|
|
|
CHECK(bad_lines == num_errors);
|
|
|
|
|
2021-02-20 15:53:18 +01:00
|
|
|
std::vector<X> data = {{1, 2, "just\n\nstrings"},
|
2021-02-23 01:02:15 +01:00
|
|
|
#ifndef _WIN32
|
|
|
|
{5, 6, "just\n\r\nstrings"},
|
|
|
|
#else
|
2021-02-20 15:53:18 +01:00
|
|
|
{5, 6, "just\n\nstrings"},
|
2021-02-23 01:02:15 +01:00
|
|
|
#endif
|
2021-02-20 15:53:18 +01:00
|
|
|
{9, 10, "just\n\nstrings"},
|
|
|
|
{19, 20, "just strings"}};
|
2021-02-23 01:02:15 +01:00
|
|
|
|
|
|
|
for (auto& [_, __, s] : i) {
|
|
|
|
update_if_crlf(s);
|
|
|
|
}
|
2023-07-10 02:39:24 +02:00
|
|
|
|
2023-08-05 18:11:13 +02:00
|
|
|
if (i.size() != data.size()) {
|
|
|
|
CHECK_EQ(i.size(), data.size());
|
|
|
|
}
|
|
|
|
|
2021-02-21 02:49:23 +01:00
|
|
|
CHECK_EQ(i, data);
|
2021-01-31 23:08:46 +01:00
|
|
|
}
|
2022-03-27 21:04:02 +02:00
|
|
|
|
2023-08-05 18:11:13 +02:00
|
|
|
// Runs test_multiline_restricted with the default setup, with
// ss::string_error and with ss::throw_on_error.
TEST_CASE("parser test multiline restricted") {
    test_multiline_restricted();                      // default error handling
    test_multiline_restricted<ss::string_error>();    // error message mode
    test_multiline_restricted<ss::throw_on_error>();  // exception mode
}
|
|
|
|
|
2023-08-04 16:48:07 +02:00
|
|
|
template <typename... Ts>
|
|
|
|
void test_unterminated_line_impl(const std::vector<std::string>& lines,
|
|
|
|
size_t bad_line) {
|
|
|
|
unique_file_name f{"test_parser"};
|
|
|
|
std::ofstream out{f.name};
|
|
|
|
for (const auto& line : lines) {
|
|
|
|
out << line << std::endl;
|
|
|
|
}
|
|
|
|
out.close();
|
|
|
|
|
|
|
|
ss::parser<Ts...> p{f.name};
|
|
|
|
size_t line = 0;
|
|
|
|
while (!p.eof()) {
|
|
|
|
auto command = [&] { p.template get_next<int, double, std::string>(); };
|
|
|
|
|
|
|
|
if (line == bad_line) {
|
|
|
|
expect_error_on_command(p, command);
|
|
|
|
break;
|
|
|
|
} else {
|
2023-08-06 17:39:09 +02:00
|
|
|
command();
|
2023-08-04 16:48:07 +02:00
|
|
|
CHECK(p.valid());
|
|
|
|
++line;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
template <typename... Ts>
|
|
|
|
void test_unterminated_line(const std::vector<std::string>& lines,
|
|
|
|
size_t bad_line) {
|
|
|
|
test_unterminated_line_impl<Ts...>(lines, bad_line);
|
|
|
|
test_unterminated_line_impl<Ts..., ss::string_error>(lines, bad_line);
|
|
|
|
test_unterminated_line_impl<Ts..., ss::throw_on_error>(lines, bad_line);
|
|
|
|
}
|
|
|
|
|
2023-08-06 17:39:09 +02:00
|
|
|
// Feeds files containing an unterminated escape, an unterminated quote, or a
// record longer than the multiline limit to test_unterminated_line, together
// with the zero-based index of the record that is expected to fail.
//
// Every input is checked with the setups listed in the local helpers below.
// Each element of a `lines` argument is written to the file followed by a
// line break, so an element containing '\n' occupies several physical lines.
TEST_CASE("parser test csv on multiline with errors") {
    using multiline = ss::multiline_restricted<3>;
    using escape = ss::escape<'\\'>;
    using quote = ss::quote<'"'>;

    // Escape-only inputs: checked without and with quote support.
    const auto check_escape = [](const std::vector<std::string>& lines,
                                 size_t bad_line) {
        test_unterminated_line<multiline, escape>(lines, bad_line);
        test_unterminated_line<multiline, escape, quote>(lines, bad_line);
    };

    // Quote-only inputs: checked with and without escape support.
    const auto check_quote = [](const std::vector<std::string>& lines,
                                size_t bad_line) {
        test_unterminated_line<multiline, escape, quote>(lines, bad_line);
        test_unterminated_line<multiline, quote>(lines, bad_line);
    };

    // Inputs that need both quote and escape support.
    const auto check_quote_escape =
        [](const std::vector<std::string>& lines, size_t bad_line) {
            test_unterminated_line<multiline, escape, quote>(lines, bad_line);
        };

    // unterminated escape
    check_escape({"1,2,just\\"}, 0);
    check_escape({"1,2,just\\", "9,8,second"}, 0);
    check_escape({"9,8,first", "1,2,just\\"}, 1);
    check_escape({"9,8,first", "1,2,just\\", "3,4,third"}, 1);
    check_escape({"9,8,first", "1,2,just\\\nstrings\\", "3,4,th\\\nird"}, 1);
    check_escape({"9,8,first", "3,4,second", "1,2,just\\"}, 2);
    check_escape({"9,8,\\first", "3,4,second", "1,2,jus\\t\\"}, 2);

    // unterminated quote
    check_quote({"1,2,\"just"}, 0);
    check_quote({"1,2,\"just", "9,8,second"}, 0);
    check_quote({"9,8,first", "1,2,\"just"}, 1);
    check_quote({"9,8,first", "1,2,\"just", "3,4,th\\,ird"}, 1);
    check_quote({"9,8,first", "3,4,second", "1,2,\"just"}, 2);
    check_quote({"9,8,\"first\"", "\"3\",4,\"sec,ond\"", "1,2,\"ju\"\"st"},
                2);

    // unterminated quote and escape
    // (the first input used to be checked twice with the identical setup;
    // one run is enough)
    check_quote_escape({"1,2,\"just\\"}, 0);
    check_quote_escape({"1,2,\"just\\\n\\"}, 0);
    check_quote_escape({"1,2,\"just\n\\"}, 0);
    check_quote_escape({"9,8,first", "1,2,\"just\n\\"}, 1);
    check_quote_escape({"9,8,first", "1,2,\"just\n\\", "4,3,thrid"}, 1);
    check_quote_escape({"9,8,f\\\nirst", "1,2,\"just\n\\", "4,3,thrid"}, 1);
    check_quote_escape(
        {"9,8,\"f\ni\nrst\"", "1,2,\"just\n\\", "4,3,thrid"}, 1);

    // multiline limit reached escape
    check_escape({"1,2,\\\n\\\n\\\n\\\njust"}, 0);
    check_escape({"9,8,first", "1,2,\\\n\\\n\\\n\\\njust"}, 1);
    check_escape({"9,8,fi\\\nrs\\\nt", "1,2,\\\n\\\n\\\n\\\njust"}, 1);
    check_escape({"9,8,first", "1,2,\\\n\\\n\\\n\\\njust", "4,3,third"}, 1);

    // multiline limit reached quote
    check_quote({"1,2,\"\n\n\n\n\njust\""}, 0);
    check_quote({"9,8,first", "1,2,\"\n\n\n\n\njust\""}, 1);
    check_quote({"9,8,\"fir\nst\"", "1,2,\"\n\n\n\n\njust\""}, 1);

    // multiline limit reached quote and escape
    check_quote_escape({"1,2,\"\\\n\n\\\n\\\n\\\njust"}, 0);
    check_quote_escape({"9,8,first", "1,2,\"\\\n\n\\\n\\\n\\\njust"}, 1);
    check_quote_escape({"9,8,fi\\\nrst", "1,2,\"\\\n\n\\\n\\\n\\\njust"}, 1);
    check_quote_escape(
        {"9,8,\"fi\nrst\"", "1,2,\"\\\n\n\\\n\\\n\\\njust"}, 1);
    check_quote_escape(
        {"9,8,\"fi\nr\\\nst\"", "1,2,\"\\\n\n\\\n\\\n\\\njust"}, 1);
}
|
|
|
|
|
2022-03-27 21:04:02 +02:00
|
|
|
// Compile-time membership test: has_type<T, std::tuple<Us...>>::value is true
// exactly when T is the same type as at least one of Us... (and false for an
// empty tuple). Only the std::tuple form is defined.
template <typename T, typename Tuple>
struct has_type;

template <typename T, typename... Us>
struct has_type<T, std::tuple<Us...>>
    : std::bool_constant<(std::is_same_v<T, Us> || ...)> {};
|
|
|
|
|
2023-07-29 20:41:31 +02:00
|
|
|
static inline void check_size(size_t size1, size_t size2) {
|
2022-03-27 21:04:02 +02:00
|
|
|
CHECK_EQ(size1, size2);
|
|
|
|
}
|
|
|
|
|
2023-08-05 19:58:00 +02:00
|
|
|
template <typename Setup, typename... Ts>
|
|
|
|
static void test_fields_impl(const std::string file_name,
|
|
|
|
const std::vector<X>& data,
|
|
|
|
const std::vector<std::string>& fields) {
|
2022-03-27 21:04:02 +02:00
|
|
|
using CaseType = std::tuple<Ts...>;
|
|
|
|
|
2023-08-05 19:58:00 +02:00
|
|
|
ss::parser<Setup> p{file_name, ","};
|
2022-03-28 19:30:39 +02:00
|
|
|
CHECK_FALSE(p.field_exists("Unknown"));
|
2022-03-27 21:04:02 +02:00
|
|
|
p.use_fields(fields);
|
|
|
|
std::vector<CaseType> i;
|
|
|
|
|
2023-08-05 19:58:00 +02:00
|
|
|
for (const auto& a : p.template iterate<CaseType>()) {
|
2022-03-27 21:04:02 +02:00
|
|
|
i.push_back(a);
|
|
|
|
}
|
|
|
|
|
2023-07-25 00:56:38 +02:00
|
|
|
check_size(i.size(), data.size());
|
2022-03-27 21:04:02 +02:00
|
|
|
for (size_t j = 0; j < i.size(); ++j) {
|
|
|
|
if constexpr (has_type<int, CaseType>::value) {
|
|
|
|
CHECK_EQ(std::get<int>(i[j]), data[j].i);
|
|
|
|
}
|
|
|
|
if constexpr (has_type<double, CaseType>::value) {
|
|
|
|
CHECK_EQ(std::get<double>(i[j]), data[j].d);
|
|
|
|
}
|
|
|
|
if constexpr (has_type<std::string, CaseType>::value) {
|
|
|
|
CHECK_EQ(std::get<std::string>(i[j]), data[j].s);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-08-05 19:58:00 +02:00
|
|
|
template <typename... Ts>
|
|
|
|
static void test_fields(const std::string file_name, const std::vector<X>& data,
|
|
|
|
const std::vector<std::string>& fields) {
|
|
|
|
test_fields_impl<ss::setup<>, Ts...>(file_name, data, fields);
|
|
|
|
test_fields_impl<ss::setup<ss::string_error>, Ts...>(file_name, data,
|
|
|
|
fields);
|
|
|
|
test_fields_impl<ss::setup<ss::throw_on_error>, Ts...>(file_name, data,
|
|
|
|
fields);
|
|
|
|
}
|
|
|
|
|
2022-03-27 21:04:02 +02:00
|
|
|
// Exercises header handling on a file written with the header
// Int,Double,String followed by six data rows:
//  - reading with and without skipping the header row,
//  - use_fields on a parser configured with ss::ignore_header, with an
//    unknown field and with a repeated field (all must leave the parser
//    invalid),
//  - re-selecting fields between consecutive get_next calls,
//  - every permutation of one, two and three columns via test_fields.
TEST_CASE("parser test various cases with header") {
    unique_file_name f{"test_parser"};
    constexpr static auto Int = "Int";
    constexpr static auto Dbl = "Double";
    constexpr static auto Str = "String";
    using str = std::string;

    std::vector<std::string> header{Int, Dbl, Str};

    std::vector<X> data = {{1, 2, "x"}, {3, 4, "y"}, {5, 6, "z"},
                           {7, 8, "u"}, {9, 10, "v"}, {11, 12, "w"}};

    make_and_write(f.name, data, header);
    const auto& o = f.name;
    const auto& d = data;

    {
        // Header row not skipped: the collected rows must differ from `data`.
        ss::parser<ss::string_error> p{f.name, ","};
        std::vector<X> rows;

        for (const auto& a : p.iterate<int, double, std::string>()) {
            rows.emplace_back(ss::to_object<X>(a));
        }

        CHECK_NE(rows, data);
    }

    {
        // Header row skipped by hand through ignore_next.
        ss::parser<ss::string_error> p{f.name, ","};
        std::vector<X> rows;

        p.ignore_next();
        for (const auto& a : p.iterate<int, double, std::string>()) {
            rows.emplace_back(ss::to_object<X>(a));
        }

        CHECK_EQ(rows, data);
    }

    {
        // Parser configured with ss::ignore_header.
        ss::parser<ss::ignore_header> p{f.name, ","};
        std::vector<X> rows;

        for (const auto& a : p.iterate<int, double, std::string>()) {
            rows.emplace_back(ss::to_object<X>(a));
        }

        CHECK_EQ(rows, data);
    }

    {
        // use_fields together with ss::ignore_header must invalidate.
        ss::parser<ss::ignore_header, ss::string_error> p{f.name, ","};
        p.use_fields(Int, Dbl, Str);
        CHECK_FALSE(p.valid());
    }

    {
        // Unknown field name.
        ss::parser<ss::ignore_header, ss::string_error> p{f.name, ","};
        CHECK_FALSE(p.field_exists("Unknown"));

        p.use_fields(Int, "Unknown");
        CHECK_FALSE(p.valid());
    }

    {
        // Same field named twice.
        ss::parser<ss::ignore_header, ss::string_error> p{f.name, ","};
        p.use_fields(Int, Int);
        CHECK_FALSE(p.valid());
    }

    {
        // The field selection may change between rows.
        ss::parser<ss::string_error> p{f.name, ","};
        p.use_fields(Int, Dbl);

        {
            auto [int_, double_] = p.get_next<int, double>();
            CHECK_EQ(int_, data[0].i);
            CHECK_EQ(double_, data[0].d);
        }

        p.use_fields(Dbl, Int);

        {
            auto [double_, int_] = p.get_next<double, int>();
            CHECK_EQ(int_, data[1].i);
            CHECK_EQ(double_, data[1].d);
        }

        p.use_fields(Str);

        {
            auto string_ = p.get_next<std::string>();
            CHECK_EQ(string_, data[2].s);
        }

        p.use_fields(Str, Int, Dbl);

        {
            auto [string_, int_, double_] =
                p.get_next<std::string, int, double>();
            CHECK_EQ(double_, data[3].d);
            CHECK_EQ(int_, data[3].i);
            CHECK_EQ(string_, data[3].s);
        }
    }

    /* python used to generate permutations
    import itertools

    header = {'str': 'Str',
              'double': 'Dbl',
              'int': 'Int'}

    keys = ['str', 'int', 'double']

    for r in range(1, 4):
        combinations = list(itertools.permutations(keys, r = r))

        for combination in combinations:
            template_params = []
            arg_params = []
            for type in combination:
                template_params.append(type)
                arg_params.append(header[type])
            call = 'test_fields<' + ', '.join(template_params) + \
                '>(o, d, {' + ', '.join(arg_params) + '});'
            print(call)
    */

    // one column
    test_fields<str>(o, d, {Str});
    test_fields<int>(o, d, {Int});
    test_fields<double>(o, d, {Dbl});

    // two columns
    test_fields<str, int>(o, d, {Str, Int});
    test_fields<str, double>(o, d, {Str, Dbl});
    test_fields<int, str>(o, d, {Int, Str});
    test_fields<int, double>(o, d, {Int, Dbl});
    test_fields<double, str>(o, d, {Dbl, Str});
    test_fields<double, int>(o, d, {Dbl, Int});

    // three columns
    test_fields<str, int, double>(o, d, {Str, Int, Dbl});
    test_fields<str, double, int>(o, d, {Str, Dbl, Int});
    test_fields<int, str, double>(o, d, {Int, Str, Dbl});
    test_fields<int, double, str>(o, d, {Int, Dbl, Str});
    test_fields<double, str, int>(o, d, {Dbl, Str, Int});
    test_fields<double, int, str>(o, d, {Dbl, Int, Str});
}
|
2022-03-28 19:11:41 +02:00
|
|
|
|
2023-08-04 16:48:07 +02:00
|
|
|
template <typename... Ts>
|
|
|
|
void test_invalid_fields_impl(const std::vector<std::string>& lines,
|
|
|
|
const std::vector<std::string>& fields) {
|
|
|
|
unique_file_name f{"test_parser"};
|
|
|
|
std::ofstream out{f.name};
|
|
|
|
for (const auto& line : lines) {
|
|
|
|
out << line << std::endl;
|
|
|
|
}
|
|
|
|
out.close();
|
|
|
|
|
|
|
|
{
|
|
|
|
// No fields specified
|
|
|
|
ss::parser<Ts...> p{f.name, ","};
|
2023-08-04 21:22:23 +02:00
|
|
|
auto command = [&] { p.use_fields(); };
|
|
|
|
expect_error_on_command(p, command);
|
2023-08-04 16:48:07 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
{
|
|
|
|
// Unknown field
|
|
|
|
ss::parser<Ts...> p{f.name, ","};
|
|
|
|
auto command = [&] { p.use_fields("Unknown"); };
|
|
|
|
expect_error_on_command(p, command);
|
|
|
|
}
|
|
|
|
|
|
|
|
{
|
|
|
|
// Field used multiple times
|
|
|
|
ss::parser<Ts...> p{f.name, ","};
|
2023-08-06 16:55:52 +02:00
|
|
|
auto command = [&] { p.use_fields(fields.at(0), fields.at(0)); };
|
|
|
|
if (!fields.empty()) {
|
|
|
|
expect_error_on_command(p, command);
|
|
|
|
}
|
2023-08-04 16:48:07 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
{
|
|
|
|
// Mapping out of range
|
|
|
|
ss::parser<Ts...> p{f.name, ","};
|
|
|
|
auto command = [&] {
|
2023-08-06 16:55:52 +02:00
|
|
|
p.use_fields(fields.at(0));
|
2023-08-04 16:48:07 +02:00
|
|
|
p.template get_next<std::string, std::string>();
|
|
|
|
};
|
2023-08-06 16:55:52 +02:00
|
|
|
if (!fields.empty()) {
|
|
|
|
expect_error_on_command(p, command);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
{
|
|
|
|
// Invalid header
|
|
|
|
ss::parser<Ts...> p{f.name, ","};
|
|
|
|
auto command = [&] { p.use_fields(fields); };
|
|
|
|
|
|
|
|
if (!fields.empty()) {
|
|
|
|
// Pass if there are no duplicates, fail otherwise
|
|
|
|
if (std::unordered_set<std::string>{fields.begin(), fields.end()}
|
|
|
|
.size() != fields.size()) {
|
|
|
|
expect_error_on_command(p, command);
|
|
|
|
} else {
|
|
|
|
command();
|
|
|
|
CHECK(p.valid());
|
|
|
|
if (!p.valid()) {
|
|
|
|
if constexpr (ss::setup<Ts...>::string_error) {
|
|
|
|
std::cout << p.error_msg() << std::endl;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2023-08-04 16:48:07 +02:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
template <typename... Ts>
|
|
|
|
void test_invalid_fields(const std::vector<std::string>& lines,
|
|
|
|
const std::vector<std::string>& fields) {
|
|
|
|
test_invalid_fields_impl(lines, fields);
|
|
|
|
test_invalid_fields_impl<ss::string_error>(lines, fields);
|
|
|
|
test_invalid_fields_impl<ss::throw_on_error>(lines, fields);
|
|
|
|
}
|
|
|
|
|
|
|
|
// Calls test_invalid_fields with files of growing size. In every call the
// first argument is the file content (header line first) and the second is
// the list of field names handed to use_fields.
TEST_CASE("parser test invalid header fields usage") {
    // Empty file, no fields.
    test_invalid_fields({}, {});

    // Single column.
    test_invalid_fields({"Int"}, {"Int"});
    test_invalid_fields({"Int", "1"}, {"Int"});
    test_invalid_fields({"Int", "1", "2"}, {"Int"});

    // Two columns.
    // NOTE(review): unlike the other groups, the last call here has a single
    // data row ("2,hello") rather than two - confirm whether "1,hi" was meant
    // to be included as well.
    test_invalid_fields({"Int,String"}, {"Int", "String"});
    test_invalid_fields({"Int,String", "1,hi"}, {"Int", "String"});
    test_invalid_fields({"Int,String", "2,hello"}, {"Int", "String"});

    // Three columns.
    test_invalid_fields({"Int,String,Double"}, {"Int", "String", "Double"});
    test_invalid_fields({"Int,String,Double", "1,hi,2.34"},
                        {"Int", "String", "Double"});
    test_invalid_fields({"Int,String,Double", "1,hi,2.34", "2,hello,3.45"},
                        {"Int", "String", "Double"});

    // Header in which every column has the same name.
    test_invalid_fields({"Int,Int,Int"}, {"Int", "Int", "Int"});
    test_invalid_fields({"Int,Int,Int", "1,2,3"}, {"Int", "Int", "Int"});

    // Header in which one name appears twice.
    test_invalid_fields({"Int,String,Int"}, {"Int", "String", "Int"});
    test_invalid_fields({"Int,String,Int", "1,hi,3"}, {"Int", "String", "Int"});
}
|
|
|
|
|
2023-08-08 11:07:26 +02:00
|
|
|
template <typename... Ts>
|
|
|
|
void test_invalid_rows_with_header() {
|
|
|
|
unique_file_name f{"test_parser"};
|
|
|
|
{
|
|
|
|
std::ofstream out{f.name};
|
|
|
|
out << "Int,String,Double" << std::endl;
|
|
|
|
out << "1,line1,2.34" << std::endl;
|
|
|
|
out << "2,line2" << std::endl;
|
|
|
|
out << "3,line3,67.8" << std::endl;
|
|
|
|
out << "4,line4,67.8,9" << std::endl;
|
|
|
|
out << "5,line5,9.10" << std::endl;
|
|
|
|
out << "six,line6,10.11" << std::endl;
|
|
|
|
}
|
|
|
|
|
|
|
|
{
|
|
|
|
ss::parser<Ts...> p{f.name};
|
|
|
|
|
|
|
|
p.use_fields("Int", "String", "Double");
|
|
|
|
using data = std::tuple<int, std::string, double>;
|
|
|
|
std::vector<data> i;
|
|
|
|
|
|
|
|
CHECK(p.valid());
|
|
|
|
|
|
|
|
while (!p.eof()) {
|
|
|
|
try {
|
|
|
|
const auto& t = p.template get_next<data>();
|
|
|
|
if (p.valid()) {
|
|
|
|
i.push_back(t);
|
|
|
|
}
|
|
|
|
} catch (const ss::exception&) {
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
std::vector<data> expected = {{1, "line1", 2.34},
|
|
|
|
{3, "line3", 67.8},
|
|
|
|
{5, "line5", 9.10}};
|
|
|
|
CHECK_EQ(i, expected);
|
|
|
|
}
|
|
|
|
|
|
|
|
{
|
|
|
|
ss::parser<Ts...> p{f.name};
|
|
|
|
|
|
|
|
p.use_fields("Double", "Int");
|
|
|
|
using data = std::tuple<double, int>;
|
|
|
|
std::vector<data> i;
|
|
|
|
|
|
|
|
CHECK(p.valid());
|
|
|
|
|
|
|
|
while (!p.eof()) {
|
|
|
|
try {
|
|
|
|
const auto& t = p.template get_next<data>();
|
|
|
|
if (p.valid()) {
|
|
|
|
i.push_back(t);
|
|
|
|
}
|
|
|
|
} catch (const ss::exception&) {
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
std::vector<data> expected = {{2.34, 1}, {67.8, 3}, {9.10, 5}};
|
|
|
|
CHECK_EQ(i, expected);
|
|
|
|
}
|
|
|
|
|
|
|
|
{
|
|
|
|
ss::parser<Ts...> p{f.name};
|
|
|
|
|
|
|
|
p.use_fields("String", "Double");
|
|
|
|
using data = std::tuple<std::string, double>;
|
|
|
|
std::vector<data> i;
|
|
|
|
|
|
|
|
CHECK(p.valid());
|
|
|
|
|
|
|
|
while (!p.eof()) {
|
|
|
|
try {
|
|
|
|
const auto& t = p.template get_next<data>();
|
|
|
|
if (p.valid()) {
|
|
|
|
i.push_back(t);
|
|
|
|
}
|
|
|
|
} catch (const ss::exception&) {
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
std::vector<data> expected = {{"line1", 2.34},
|
|
|
|
{"line3", 67.8},
|
|
|
|
{"line5", 9.10},
|
|
|
|
{"line6", 10.11}};
|
|
|
|
CHECK_EQ(i, expected);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// Runs the invalid-rows-with-header scenario once per parser setup:
// no options, `ss::string_error`, and `ss::throw_on_error`.
TEST_CASE("parser test invalid rows with header") {
    test_invalid_rows_with_header<>();
    test_invalid_rows_with_header<ss::string_error>();
    test_invalid_rows_with_header<ss::throw_on_error>();
}
|
|
|
|
|
2023-08-05 19:58:00 +02:00
|
|
|
template <typename... Ts>
|
|
|
|
void test_ignore_empty_impl(const std::vector<X>& data) {
|
2023-07-29 20:41:31 +02:00
|
|
|
unique_file_name f{"test_parser"};
|
2022-03-28 19:11:41 +02:00
|
|
|
make_and_write(f.name, data);
|
|
|
|
|
|
|
|
std::vector<X> expected;
|
|
|
|
for (const auto& d : data) {
|
2023-08-05 19:58:00 +02:00
|
|
|
if (d.s != X::empty) {
|
2022-03-28 19:11:41 +02:00
|
|
|
expected.push_back(d);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
{
|
2023-08-05 19:58:00 +02:00
|
|
|
ss::parser<ss::ignore_empty, Ts...> p{f.name, ","};
|
2022-03-28 19:11:41 +02:00
|
|
|
|
|
|
|
std::vector<X> i;
|
2023-08-05 19:58:00 +02:00
|
|
|
for (const auto& a : p.template iterate<X>()) {
|
2022-03-28 19:11:41 +02:00
|
|
|
i.push_back(a);
|
|
|
|
}
|
|
|
|
|
|
|
|
CHECK_EQ(i, expected);
|
|
|
|
}
|
|
|
|
|
|
|
|
{
|
2023-08-05 19:58:00 +02:00
|
|
|
ss::parser<Ts...> p{f.name, ","};
|
2022-03-28 19:11:41 +02:00
|
|
|
std::vector<X> i;
|
|
|
|
size_t n = 0;
|
2023-08-05 19:58:00 +02:00
|
|
|
while (!p.eof()) {
|
|
|
|
try {
|
|
|
|
++n;
|
|
|
|
const auto& a = p.template get_next<X>();
|
|
|
|
if (data.at(n - 1).s == X::empty) {
|
|
|
|
CHECK_FALSE(p.valid());
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
i.push_back(a);
|
|
|
|
} catch (...) {
|
|
|
|
CHECK_EQ(data.at(n - 1).s, X::empty);
|
2022-03-28 19:11:41 +02:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-08-05 19:58:00 +02:00
|
|
|
CHECK_EQ(i, expected);
|
2022-03-28 19:11:41 +02:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-08-05 19:58:00 +02:00
|
|
|
template <typename... Ts>
|
|
|
|
void test_ignore_empty(const std::vector<X>& data) {
|
|
|
|
test_ignore_empty_impl(data);
|
|
|
|
test_ignore_empty_impl<ss::string_error>(data);
|
|
|
|
test_ignore_empty_impl<ss::throw_on_error>(data);
|
|
|
|
}
|
|
|
|
|
2022-03-28 19:11:41 +02:00
|
|
|
// Feeds test_ignore_empty a series of inputs in which rows marked with
// `X::empty` appear at the start, in the middle, at the end, in runs, as the
// only row, and not at all (including a completely empty input).
TEST_CASE("parser test various cases with empty lines") {
    const std::vector<std::vector<X>> inputs = {
        // no empty rows
        {{1, 2, "x"}, {3, 4, "y"}, {9, 10, "v"}, {11, 12, "w"}},

        // a single empty row: first, last, middle
        {{1, 2, X::empty}, {3, 4, "y"}, {9, 10, "v"}, {11, 12, "w"}},
        {{1, 2, "x"}, {3, 4, "y"}, {9, 10, "v"}, {11, 12, X::empty}},
        {{1, 2, "x"}, {5, 6, X::empty}, {9, 10, "v"}, {11, 12, "w"}},

        // two empty rows
        {{1, 2, X::empty}, {5, 6, X::empty}, {9, 10, "v"}, {11, 12, "w"}},
        {{1, 2, X::empty}, {3, 4, "y"}, {9, 10, "v"}, {11, 12, X::empty}},
        {{1, 2, "x"}, {3, 4, "y"}, {9, 10, X::empty}, {11, 12, X::empty}},

        // three or more empty rows
        {{1, 2, X::empty}, {3, 4, "y"}, {9, 10, X::empty}, {11, 12, X::empty}},
        {{1, 2, X::empty},
         {3, 4, X::empty},
         {9, 10, X::empty},
         {11, 12, X::empty}},
        {{1, 2, "x"}, {3, 4, X::empty}, {9, 10, X::empty}, {11, 12, X::empty}},
        {{1, 2, X::empty}, {3, 4, X::empty}, {9, 10, X::empty}, {11, 12, "w"}},

        // a lone empty row
        {{11, 12, X::empty}},

        // no rows at all
        {},
    };

    for (const auto& rows : inputs) {
        test_ignore_empty(rows);
    }
}
|