Skip to content

Commit

Permalink
🐛 skipping BOM for iterators #602
Browse files Browse the repository at this point in the history
I totally forgot about byte order marks in this scenario.
  • Loading branch information
nlohmann committed Jun 2, 2017
1 parent c043ba6 commit d19c5ce
Show file tree
Hide file tree
Showing 3 changed files with 27 additions and 6 deletions.
10 changes: 8 additions & 2 deletions src/json.hpp
Original file line number Diff line number Diff line change
Expand Up @@ -8814,7 +8814,7 @@ class basic_json
// store number of bytes in the buffer
fill_size = static_cast<size_t>(is.gcount());

// skip byte-order mark
// skip byte order mark
if (fill_size >= 3 and buffer[0] == '\xEF' and buffer[1] == '\xBB' and buffer[2] == '\xBF')
{
buffer_pos += 3;
Expand Down Expand Up @@ -8911,7 +8911,13 @@ class basic_json
public:
// Construct an adapter over the character range that starts at b and is
// l bytes long: cursor and start are both initialised to b, and limit to
// b + l.
input_buffer_adapter(const char* b, size_t l)
: input_adapter(), cursor(b), limit(b + l), start(b)
{}
// NOTE(review): the empty body above and the braced body below look like the
// before/after sides of the same change shown together - confirm against the
// actual header.
{
// skip byte order mark
// (the UTF-8 BOM is the byte sequence EF BB BF; the l >= 3 test runs first so
// b[0]..b[2] are only read when the range holds at least three bytes)
if (l >= 3 and b[0] == '\xEF' and b[1] == '\xBB' and b[2] == '\xBF')
{
// move the cursor past the three BOM bytes
cursor += 3;
}
}

// delete because of pointer members
input_buffer_adapter(const input_buffer_adapter&) = delete;
Expand Down
6 changes: 6 additions & 0 deletions test/src/unit-regression.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -1169,4 +1169,10 @@ TEST_CASE("regression tests")
std::vector<uint8_t> vec = {'"', '\\', '"', 'X', '"', '"'};
CHECK_THROWS_AS(json::parse(vec), json::parse_error);
}

SECTION("issue #602 - BOM not skipped when using json:parse(iterator)")
{
// the input starts with the UTF-8 byte order mark (EF BB BF), followed by
// a small JSON object
std::string bom_prefixed_json = "\xef\xbb\xbf{\n \"foo\": true\n}";

// parsing through the iterator-pair overload must not throw
CHECK_NOTHROW(json::parse(bom_prefixed_json.begin(), bom_prefixed_json.end()));
}
}
17 changes: 13 additions & 4 deletions test/src/unit-unicode.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -1012,10 +1012,19 @@ TEST_CASE("Unicode", "[hide]")

// A leading UTF-8 byte order mark must not make parsing throw, whether the
// input is read from a stream or passed as an iterator pair.
SECTION("ignore byte-order-mark")
{
// read a file with a UTF-8 BOM
std::ifstream f("test/data/json_nlohmann_tests/bom.json");
json j;
CHECK_NOTHROW(f >> j);
SECTION("in a stream")
{
// read a file with a UTF-8 BOM
std::ifstream f("test/data/json_nlohmann_tests/bom.json");
json j;
// extracting from the stream into j must not throw
CHECK_NOTHROW(f >> j);
}

SECTION("with an iterator")
{
// the string begins with the bytes EF BB BF (UTF-8 BOM), followed by a
// small JSON object
std::string i = "\xef\xbb\xbf{\n \"foo\": true\n}";
// parsing the [begin, end) range must not throw
CHECK_NOTHROW(json::parse(i.begin(), i.end()));
}
}

SECTION("error for incomplete/wrong BOM")
Expand Down

0 comments on commit d19c5ce

Please sign in to comment.