1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
|
#include "charencoding.h"
#include <map>
#include "3rd-party/catch.hpp"
using namespace newsboat;
TEST_CASE("charset_from_bom", "[charencoding]")
{
const std::map<std::string, nonstd::optional<std::string>> test_cases {
{ "", nonstd::nullopt },
{ "text without BOM", nonstd::nullopt },
{ "\xEF\xBB\xBFtext with BOM", "UTF-8" },
{ "\xFE\xFFtext with BOM", "UTF-16BE" },
{ "\xFF\xFEtext with BOM", "UTF-16LE" },
};
for (const auto& test_case : test_cases) {
std::vector<std::uint8_t> input(test_case.first.begin(), test_case.first.end());
const auto actual = charencoding::charset_from_bom(input);
const auto expected = test_case.second;
INFO("actual: " << (actual.has_value() ? actual.value().c_str() : ""));
INFO("expected: " << (expected.has_value() ? expected.value().c_str() : ""));
REQUIRE(actual == expected);
}
}
TEST_CASE("charset_from_xml_declaration", "[charencoding]")
{
const std::map<std::string, nonstd::optional<std::string>> test_cases {
{ "", nonstd::nullopt },
{ "not a declaration", nonstd::nullopt },
{ R"(<?xml version="1.0"?>No encoding specified)", nonstd::nullopt },
{ R"(<?xml version="1.0" encoding="UTF-8"?>Encoding specified)", "UTF-8" },
{ R"(<?xml version="1.0" encoding="utf-8"?>Encoding specified)", "utf-8" },
{ R"(<?xml version="1.0" encoding="fake.encoding"?>Encoding specified)", "fake.encoding" },
};
for (const auto& test_case : test_cases) {
std::vector<std::uint8_t> input(test_case.first.begin(), test_case.first.end());
const auto actual = charencoding::charset_from_xml_declaration(input);
const auto expected = test_case.second;
INFO("actual: " << (actual.has_value() ? actual.value().c_str() : ""));
INFO("expected: " << (expected.has_value() ? expected.value().c_str() : ""));
REQUIRE(actual == expected);
}
}
|