1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94
|
#include "simdutf.h"

#include <array>
#include <cstring>
#include <memory>
#include <vector>

#include <tests/helpers/transcode_test_base.h>
#include <tests/helpers/random_int.h>
#include <tests/helpers/test.h>
namespace {
// Short alias-by-using for the UTF-8 -> UTF-16 test base the tests below
// instantiate.
using simdutf::tests::helpers::transcode_utf8_to_utf16_test_base;

// Endianness argument passed to the test base by the looped tests.
constexpr auto BE = simdutf::endianness::BIG;

// Sizes that each looped test iterates over, in this order.
constexpr std::array<size_t, 7> input_size = {7, 16, 12, 64, 67, 128, 256};
} // namespace
// Runs convert_valid_utf8_to_utf16be through the test base for every size in
// input_size, using a generator that only ever yields 7-bit values.
TEST_LOOP(convert_pure_ASCII) {
  // Shared by reference with the generator below, so the sequence keeps
  // advancing across sizes instead of restarting for each one.
  size_t next_value = 0;
  auto ascii_source = [&next_value]() -> uint32_t {
    const size_t current = next_value++;
    // Mask to the low 7 bits: 0x00..0x7f, wrapping around.
    return static_cast<uint32_t>(current & 0x7f);
  };

  // Thin adapter that forwards to the implementation under test.
  auto procedure = [&implementation](const char *input, size_t byte_count,
                                     char16_t *output) -> size_t {
    return implementation.convert_valid_utf8_to_utf16be(input, byte_count,
                                                        output);
  };

  for (const size_t length : input_size) {
    transcode_utf8_to_utf16_test_base test(BE, ascii_source, length);
    ASSERT_TRUE(test(procedure));
  }
}
// Runs convert_valid_utf8_to_utf16be through the test base for every size in
// input_size, with values drawn from the 1- or 2-byte UTF-8 range.
TEST_LOOP(convert_1_or_2_UTF8_bytes) {
  // 0x0000..0x07ff: range for 1 or 2 UTF-8 bytes.
  simdutf::tests::helpers::RandomInt value_source(0x0000, 0x07ff, seed);

  // Thin adapter that forwards to the implementation under test.
  auto procedure = [&implementation](const char *input, size_t byte_count,
                                     char16_t *output) -> size_t {
    return implementation.convert_valid_utf8_to_utf16be(input, byte_count,
                                                        output);
  };

  for (const size_t length : input_size) {
    transcode_utf8_to_utf16_test_base test(BE, value_source, length);
    ASSERT_TRUE(test(procedure));
  }
}
// Runs convert_valid_utf8_to_utf16be through the test base for every size in
// input_size, with values drawn from the 1-, 2- or 3-byte UTF-8 range.
TEST_LOOP(convert_1_or_2_or_3_UTF8_bytes) {
  // Two ranges for 1, 2 or 3 UTF-8 bytes; the gap 0xd800..0xdfff between
  // them is deliberately left out.
  simdutf::tests::helpers::RandomIntRanges value_source(
      {{0x0000, 0xd7ff}, {0xe000, 0xffff}}, seed);

  // Thin adapter that forwards to the implementation under test.
  auto procedure = [&implementation](const char *input, size_t byte_count,
                                     char16_t *output) -> size_t {
    return implementation.convert_valid_utf8_to_utf16be(input, byte_count,
                                                        output);
  };

  for (const size_t length : input_size) {
    transcode_utf8_to_utf16_test_base test(BE, value_source, length);
    ASSERT_TRUE(test(procedure));
  }
}
// Runs convert_valid_utf8_to_utf16be through the test base for every size in
// input_size, with values drawn from the 3- or 4-byte UTF-8 range.
TEST_LOOP(convert_3_or_4_UTF8_bytes) {
  // Two ranges for 3 or 4 UTF-8 bytes; the gap 0xd800..0xdfff between them
  // is deliberately left out.
  simdutf::tests::helpers::RandomIntRanges value_source(
      {{0x0800, 0xd7ff}, {0xe000, 0x10ffff}}, seed);

  // Thin adapter that forwards to the implementation under test.
  auto procedure = [&implementation](const char *input, size_t byte_count,
                                     char16_t *output) -> size_t {
    return implementation.convert_valid_utf8_to_utf16be(input, byte_count,
                                                        output);
  };

  for (const size_t length : input_size) {
    transcode_utf8_to_utf16_test_base test(BE, value_source, length);
    ASSERT_TRUE(test(procedure));
  }
}
// Checks one fixed input: the two UTF-8 bytes C2 A9 (copyright sign) must be
// reported as one UTF-16 code unit and converted to the bytes 00 A9.
TEST(special_cases) {
  const uint8_t utf8[] = {0xC2, 0xA9};     // copyright sign
  const uint8_t expected[] = {0x00, 0xA9}; // expected UTF-16BE

  // The simdutf entry points take `const char *`; do the byte reinterpretation
  // once, with a named cast, instead of repeating a C-style cast per call.
  const char *input = reinterpret_cast<const char *>(utf8);

  // Lengths are taken from the fixture arrays themselves so that editing a
  // fixture cannot leave a stale literal behind.
  const size_t utf16len =
      implementation.utf16_length_from_utf8(input, sizeof(utf8));
  ASSERT_EQUAL(utf16len, 1);

  std::unique_ptr<char16_t[]> utf16(new char16_t[utf16len]);
  const size_t utf16size = implementation.convert_valid_utf8_to_utf16be(
      input, sizeof(utf8), utf16.get());
  ASSERT_EQUAL(utf16size, utf16len);

  // Compare the output as raw bytes: `expected` is written out byte by byte,
  // so the check does not depend on how the host lays out a char16_t.
  ASSERT_EQUAL(std::memcmp(utf16.get(), expected, sizeof(expected)), 0);
}
// NOTE(review): TEST_MAIN is not defined in this file; it presumably comes
// from tests/helpers/test.h and expands to the program entry point that runs
// the tests declared above — confirm against that header.
TEST_MAIN
|