|
| 1 | +//===-- Unittests for wcsnrtombs ------------------------------------------===// |
| 2 | +// |
| 3 | +// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
| 4 | +// See https://llvm.org/LICENSE.txt for license information. |
| 5 | +// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
| 6 | +// |
| 7 | +//===----------------------------------------------------------------------===// |
| 8 | + |
| 9 | +#include "hdr/types/mbstate_t.h" |
| 10 | +#include "src/string/memset.h" |
| 11 | +#include "src/wchar/wcsnrtombs.h" |
| 12 | +#include "test/UnitTest/ErrnoCheckingTest.h" |
| 13 | +#include "test/UnitTest/Test.h" |
| 14 | + |
| 15 | +using LlvmLibcWcsnrtombs = LIBC_NAMESPACE::testing::ErrnoCheckingTest; |
| 16 | + |
// These tests are fairly simple because this function just calls into the
// internal wcsnrtombs, which is more thoroughly tested.
| 19 | + |
| 20 | +TEST_F(LlvmLibcWcsnrtombs, AllMultibyteLengths) { |
| 21 | + mbstate_t state; |
| 22 | + LIBC_NAMESPACE::memset(&state, 0, sizeof(mbstate_t)); |
| 23 | + |
| 24 | + /// clown emoji, sigma symbol, y with diaeresis, letter A |
| 25 | + const wchar_t src[] = {static_cast<wchar_t>(0x1f921), |
| 26 | + static_cast<wchar_t>(0x2211), |
| 27 | + static_cast<wchar_t>(0xff), static_cast<wchar_t>(0x41), |
| 28 | + static_cast<wchar_t>(0x0)}; |
| 29 | + const wchar_t *cur = src; |
| 30 | + char mbs[11]; |
| 31 | + |
| 32 | + ASSERT_EQ(LIBC_NAMESPACE::wcsnrtombs(mbs, &cur, 5, 11, &state), |
| 33 | + static_cast<size_t>(10)); |
| 34 | + ASSERT_ERRNO_SUCCESS(); |
| 35 | + ASSERT_EQ(cur, nullptr); |
| 36 | + ASSERT_EQ(mbs[0], '\xF0'); // clown begin |
| 37 | + ASSERT_EQ(mbs[1], '\x9F'); |
| 38 | + ASSERT_EQ(mbs[2], '\xA4'); |
| 39 | + ASSERT_EQ(mbs[3], '\xA1'); |
| 40 | + ASSERT_EQ(mbs[4], '\xE2'); // sigma begin |
| 41 | + ASSERT_EQ(mbs[5], '\x88'); |
| 42 | + ASSERT_EQ(mbs[6], '\x91'); |
| 43 | + ASSERT_EQ(mbs[7], '\xC3'); // y diaeresis begin |
| 44 | + ASSERT_EQ(mbs[8], '\xBF'); |
| 45 | + ASSERT_EQ(mbs[9], '\x41'); // A begin |
| 46 | + ASSERT_EQ(mbs[10], '\0'); // null terminator |
| 47 | +} |
| 48 | + |
| 49 | +TEST_F(LlvmLibcWcsnrtombs, DestLimit) { |
| 50 | + mbstate_t state; |
| 51 | + LIBC_NAMESPACE::memset(&state, 0, sizeof(mbstate_t)); |
| 52 | + |
| 53 | + /// clown emoji, sigma symbol, y with diaeresis, letter A |
| 54 | + const wchar_t src[] = {static_cast<wchar_t>(0x1f921), |
| 55 | + static_cast<wchar_t>(0x2211), |
| 56 | + static_cast<wchar_t>(0xff), static_cast<wchar_t>(0x41), |
| 57 | + static_cast<wchar_t>(0x0)}; |
| 58 | + const wchar_t *cur = src; |
| 59 | + |
| 60 | + char mbs[11]; |
| 61 | + for (int i = 0; i < 11; ++i) |
| 62 | + mbs[i] = '\x01'; // dummy initial values |
| 63 | + |
| 64 | + ASSERT_EQ(LIBC_NAMESPACE::wcsnrtombs(mbs, &cur, 5, 4, &state), |
| 65 | + static_cast<size_t>(4)); |
| 66 | + ASSERT_ERRNO_SUCCESS(); |
| 67 | + ASSERT_EQ(cur, src + 1); |
| 68 | + ASSERT_EQ(mbs[0], '\xF0'); |
| 69 | + ASSERT_EQ(mbs[1], '\x9F'); |
| 70 | + ASSERT_EQ(mbs[2], '\xA4'); |
| 71 | + ASSERT_EQ(mbs[3], '\xA1'); |
| 72 | + ASSERT_EQ(mbs[4], '\x01'); // didn't write more than 4 bytes |
| 73 | + |
| 74 | + for (int i = 0; i < 11; ++i) |
| 75 | + mbs[i] = '\x01'; // dummy initial values |
| 76 | + LIBC_NAMESPACE::memset(&state, 0, sizeof(mbstate_t)); |
| 77 | + cur = src; |
| 78 | + |
| 79 | + // not enough bytes to convert the second character, so only converts one |
| 80 | + ASSERT_EQ(LIBC_NAMESPACE::wcsnrtombs(mbs, &cur, 5, 6, &state), |
| 81 | + static_cast<size_t>(4)); |
| 82 | + ASSERT_ERRNO_SUCCESS(); |
| 83 | + ASSERT_EQ(cur, src + 1); |
| 84 | + ASSERT_EQ(mbs[0], '\xF0'); |
| 85 | + ASSERT_EQ(mbs[1], '\x9F'); |
| 86 | + ASSERT_EQ(mbs[2], '\xA4'); |
| 87 | + ASSERT_EQ(mbs[3], '\xA1'); |
| 88 | + ASSERT_EQ(mbs[4], '\x01'); |
| 89 | +} |
| 90 | + |
| 91 | +TEST(LlvmLibcWcsnrtombs, SrcLimit) { |
| 92 | + mbstate_t state; |
| 93 | + LIBC_NAMESPACE::memset(&state, 0, sizeof(mbstate_t)); |
| 94 | + |
| 95 | + /// clown emoji, sigma symbol, y with diaeresis, letter A |
| 96 | + const wchar_t src[] = {static_cast<wchar_t>(0x1f921), |
| 97 | + static_cast<wchar_t>(0x2211), |
| 98 | + static_cast<wchar_t>(0xff), static_cast<wchar_t>(0x41), |
| 99 | + static_cast<wchar_t>(0x0)}; |
| 100 | + const wchar_t *cur = src; |
| 101 | + |
| 102 | + char mbs[11]; |
| 103 | + for (int i = 0; i < 11; ++i) |
| 104 | + mbs[i] = '\x01'; // dummy initial values |
| 105 | + |
| 106 | + auto res = LIBC_NAMESPACE::wcsnrtombs(mbs, &cur, 2, 11, &state); |
| 107 | + ASSERT_ERRNO_SUCCESS(); |
| 108 | + ASSERT_EQ(res, static_cast<size_t>(7)); |
| 109 | + ASSERT_EQ(cur, src + 2); |
| 110 | + ASSERT_EQ(mbs[0], '\xF0'); // clown begin |
| 111 | + ASSERT_EQ(mbs[1], '\x9F'); |
| 112 | + ASSERT_EQ(mbs[2], '\xA4'); |
| 113 | + ASSERT_EQ(mbs[3], '\xA1'); |
| 114 | + ASSERT_EQ(mbs[4], '\xE2'); // sigma begin |
| 115 | + ASSERT_EQ(mbs[5], '\x88'); |
| 116 | + ASSERT_EQ(mbs[6], '\x91'); |
| 117 | + ASSERT_EQ(mbs[7], '\x01'); |
| 118 | + |
| 119 | + res = LIBC_NAMESPACE::wcsnrtombs(mbs + res, &cur, 100, 11, &state); |
| 120 | + ASSERT_ERRNO_SUCCESS(); |
| 121 | + ASSERT_EQ(res, static_cast<size_t>(3)); |
| 122 | + ASSERT_EQ(cur, nullptr); |
| 123 | + ASSERT_EQ(mbs[0], '\xF0'); // clown begin |
| 124 | + ASSERT_EQ(mbs[1], '\x9F'); |
| 125 | + ASSERT_EQ(mbs[2], '\xA4'); |
| 126 | + ASSERT_EQ(mbs[3], '\xA1'); |
| 127 | + ASSERT_EQ(mbs[4], '\xE2'); // sigma begin |
| 128 | + ASSERT_EQ(mbs[5], '\x88'); |
| 129 | + ASSERT_EQ(mbs[6], '\x91'); |
| 130 | + ASSERT_EQ(mbs[7], '\xC3'); // y diaeresis begin |
| 131 | + ASSERT_EQ(mbs[8], '\xBF'); |
| 132 | + ASSERT_EQ(mbs[9], '\x41'); // A begin |
| 133 | + ASSERT_EQ(mbs[10], '\0'); // null terminator |
| 134 | +} |
| 135 | + |
| 136 | +TEST_F(LlvmLibcWcsnrtombs, ErrnoTest) { |
| 137 | + mbstate_t state; |
| 138 | + LIBC_NAMESPACE::memset(&state, 0, sizeof(mbstate_t)); |
| 139 | + |
| 140 | + const wchar_t src[] = {static_cast<wchar_t>(0x1f921), |
| 141 | + static_cast<wchar_t>(0x2211), |
| 142 | + static_cast<wchar_t>(0x12ffff), // invalid widechar |
| 143 | + static_cast<wchar_t>(0x0)}; |
| 144 | + const wchar_t *cur = src; |
| 145 | + char mbs[11]; |
| 146 | + |
| 147 | + // n parameter ignored when dest is null |
| 148 | + ASSERT_EQ(LIBC_NAMESPACE::wcsnrtombs(mbs, &cur, 5, 7, &state), |
| 149 | + static_cast<size_t>(7)); |
| 150 | + ASSERT_ERRNO_SUCCESS(); |
| 151 | + |
| 152 | + LIBC_NAMESPACE::memset(&state, 0, sizeof(mbstate_t)); |
| 153 | + ASSERT_EQ(LIBC_NAMESPACE::wcsnrtombs(mbs, &cur, 5, 100, &state), |
| 154 | + static_cast<size_t>(-1)); |
| 155 | + ASSERT_ERRNO_EQ(EILSEQ); |
| 156 | +} |
0 commit comments