mirror of
https://github.com/RGBCube/serenity
synced 2025-05-31 13:48:12 +00:00

The actual data file for this benchmark was never actually committed to the repository, so let's generate 100k identical lines in memory to be the fairly large data for this test instead.
100 lines
3.2 KiB
C++
100 lines
3.2 KiB
C++
/*
|
|
* Copyright (c) 2020, the SerenityOS developers.
|
|
*
|
|
* SPDX-License-Identifier: BSD-2-Clause
|
|
*/
|
|
|
|
#include <LibTest/TestCase.h>
|
|
|
|
#include "../CSV.h"
|
|
#include "../XSV.h"
|
|
#include <AK/ByteBuffer.h>
|
|
#include <LibCore/File.h>
|
|
|
|
TEST_CASE(should_parse_valid_data)
|
|
{
|
|
{
|
|
auto data = R"~~~(Foo, Bar, Baz
|
|
1, 2, 3
|
|
4, 5, 6
|
|
"""x", y"z, 9)~~~";
|
|
auto csv = Reader::CSV { data, Reader::default_behaviours() | Reader::ParserBehaviour::ReadHeaders | Reader::ParserBehaviour::TrimLeadingFieldSpaces };
|
|
csv.parse();
|
|
EXPECT(!csv.has_error());
|
|
|
|
EXPECT_EQ(csv[0]["Foo"], "1");
|
|
EXPECT_EQ(csv[2]["Foo"], "\"x");
|
|
EXPECT_EQ(csv[2]["Bar"], "y\"z");
|
|
}
|
|
|
|
{
|
|
auto data = R"~~~(Foo, Bar, Baz
|
|
1 , 2, 3
|
|
4, "5 " , 6
|
|
"""x", y"z, 9 )~~~";
|
|
auto csv = Reader::CSV { data, Reader::default_behaviours() | Reader::ParserBehaviour::ReadHeaders | Reader::ParserBehaviour::TrimLeadingFieldSpaces | Reader::ParserBehaviour::TrimTrailingFieldSpaces };
|
|
csv.parse();
|
|
EXPECT(!csv.has_error());
|
|
|
|
EXPECT_EQ(csv[0]["Foo"], "1");
|
|
EXPECT_EQ(csv[1]["Bar"], "5 ");
|
|
EXPECT_EQ(csv[2]["Foo"], "\"x");
|
|
EXPECT_EQ(csv[2]["Baz"], "9");
|
|
}
|
|
}
|
|
|
|
TEST_CASE(should_fail_nicely)
|
|
{
|
|
{
|
|
auto data = R"~~~(Foo, Bar, Baz
|
|
x, y)~~~";
|
|
auto csv = Reader::CSV { data, Reader::default_behaviours() | Reader::ParserBehaviour::ReadHeaders | Reader::ParserBehaviour::TrimLeadingFieldSpaces };
|
|
csv.parse();
|
|
EXPECT(csv.has_error());
|
|
EXPECT_EQ(csv.error(), Reader::ReadError::NonConformingColumnCount);
|
|
}
|
|
|
|
{
|
|
auto data = R"~~~(Foo, Bar, Baz
|
|
x, y, "z)~~~";
|
|
auto csv = Reader::CSV { data, Reader::default_behaviours() | Reader::ParserBehaviour::ReadHeaders | Reader::ParserBehaviour::TrimLeadingFieldSpaces };
|
|
csv.parse();
|
|
EXPECT(csv.has_error());
|
|
EXPECT_EQ(csv.error(), Reader::ReadError::QuoteFailure);
|
|
}
|
|
}
|
|
|
|
TEST_CASE(should_iterate_rows)
|
|
{
|
|
auto data = R"~~~(Foo, Bar, Baz
|
|
1, 2, 3
|
|
4, 5, 6
|
|
"""x", y"z, 9)~~~";
|
|
auto csv = Reader::CSV { data, Reader::default_behaviours() | Reader::ParserBehaviour::ReadHeaders | Reader::ParserBehaviour::TrimLeadingFieldSpaces };
|
|
csv.parse();
|
|
EXPECT(!csv.has_error());
|
|
|
|
bool ran = false;
|
|
for (auto row : csv)
|
|
ran = !row[0].is_empty();
|
|
|
|
EXPECT(ran);
|
|
}
|
|
|
|
BENCHMARK_CASE(fairly_big_data)
|
|
{
|
|
constexpr auto num_rows = 100000u;
|
|
constexpr auto line = "well,hello,friends,1,2,3,4,5,6,7,8,pizza,guacamole\n"sv;
|
|
auto buf = ByteBuffer::create_uninitialized((line.length() * num_rows) + 1);
|
|
buf[buf.size() - 1] = '\0';
|
|
|
|
for (size_t row = 0; row <= num_rows; ++row) {
|
|
memcpy(buf.offset_pointer(row * line.length()), line.characters_without_null_termination(), line.length());
|
|
}
|
|
|
|
auto csv = Reader::CSV { (char const*)buf.data(), Reader::default_behaviours() | Reader::ParserBehaviour::ReadHeaders };
|
|
csv.parse();
|
|
|
|
EXPECT(!csv.has_error());
|
|
EXPECT_EQ(csv.size(), num_rows);
|
|
}
|