blob: 04cf426d31cc78275911d51b1fc0adff852c67da [file] [log] [blame] [edit]
//===-- Unittests for wcsnrtombs ------------------------------------------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
#include "hdr/types/mbstate_t.h"
#include "src/__support/macros/null_check.h"
#include "src/string/memset.h"
#include "src/wchar/wcsnrtombs.h"
#include "test/UnitTest/ErrnoCheckingTest.h"
#include "test/UnitTest/Test.h"
using LlvmLibcWcsnrtombs = LIBC_NAMESPACE::testing::ErrnoCheckingTest;
// These tests are fairly simple because this function just calls into the
// internal wcsnrtombs, which is more thoroughly tested.
// Converts a string containing wide characters whose multibyte encodings are
// 4, 3, 2 and 1 bytes long into a buffer that holds the result exactly,
// including the null terminator.
TEST_F(LlvmLibcWcsnrtombs, AllMultibyteLengths) {
  // Wide input: clown emoji, sigma symbol, y with diaeresis, letter A, and the
  // terminating null wide character.
  const wchar_t src[] = {
      static_cast<wchar_t>(0x1f921), static_cast<wchar_t>(0x2211),
      static_cast<wchar_t>(0xff), static_cast<wchar_t>(0x41),
      static_cast<wchar_t>(0x0)};

  // Bytes expected in the destination once the whole string is converted.
  const char expected[] = {
      '\xF0', '\x9F', '\xA4', '\xA1', // clown
      '\xE2', '\x88', '\x91',         // sigma
      '\xC3', '\xBF',                 // y diaeresis
      '\x41',                         // A
      '\0',                           // null terminator
  };

  char mbs[11];
  const wchar_t *cur = src;
  mbstate_t state;
  LIBC_NAMESPACE::memset(&state, 0, sizeof(state));

  // The source limit covers all five wide characters and the destination
  // limit covers the whole buffer, so nothing should be truncated.
  const size_t written = LIBC_NAMESPACE::wcsnrtombs(
      mbs, &cur, sizeof(src) / sizeof(src[0]), sizeof(mbs), &state);
  ASSERT_EQ(written, static_cast<size_t>(10)); // terminator is not counted
  ASSERT_ERRNO_SUCCESS();
  // The test expects the source pointer to be nulled once the terminator has
  // been converted.
  ASSERT_EQ(cur, nullptr);

  for (size_t i = 0; i < sizeof(expected); ++i) {
    ASSERT_EQ(mbs[i], expected[i]);
  }
}
// Checks that the destination length limit stops the conversion on a whole
// character: bytes past the last complete character must stay untouched.
TEST_F(LlvmLibcWcsnrtombs, DestLimit) {
  // Wide input: clown emoji, sigma symbol, y with diaeresis, letter A, and the
  // terminating null wide character.
  const wchar_t src[] = {
      static_cast<wchar_t>(0x1f921), static_cast<wchar_t>(0x2211),
      static_cast<wchar_t>(0xff), static_cast<wchar_t>(0x41),
      static_cast<wchar_t>(0x0)};

  // Expected encoding of the first wide character (the clown emoji).
  const char clown[] = {'\xF0', '\x9F', '\xA4', '\xA1'};

  char mbs[11];
  mbstate_t state;
  const wchar_t *cur = src;

  // Case 1: the limit is exactly the size of the first character.
  LIBC_NAMESPACE::memset(&state, 0, sizeof(state));
  LIBC_NAMESPACE::memset(mbs, '\x01', sizeof(mbs)); // sentinel fill
  ASSERT_EQ(LIBC_NAMESPACE::wcsnrtombs(mbs, &cur, 5, 4, &state),
            static_cast<size_t>(4));
  ASSERT_ERRNO_SUCCESS();
  ASSERT_EQ(cur, src + 1); // stopped right after the first wide character
  for (size_t i = 0; i < sizeof(clown); ++i) {
    ASSERT_EQ(mbs[i], clown[i]);
  }
  ASSERT_EQ(mbs[4], '\x01'); // sentinel intact: no more than 4 bytes written

  // Case 2: start over with a limit of 6. That is not enough room for the
  // second character as well, so again only the first one is converted.
  LIBC_NAMESPACE::memset(mbs, '\x01', sizeof(mbs));
  LIBC_NAMESPACE::memset(&state, 0, sizeof(state));
  cur = src;
  ASSERT_EQ(LIBC_NAMESPACE::wcsnrtombs(mbs, &cur, 5, 6, &state),
            static_cast<size_t>(4));
  ASSERT_ERRNO_SUCCESS();
  ASSERT_EQ(cur, src + 1);
  for (size_t i = 0; i < sizeof(clown); ++i) {
    ASSERT_EQ(mbs[i], clown[i]);
  }
  ASSERT_EQ(mbs[4], '\x01'); // no partial second character was written
}
// Checks that the source limit (number of wide characters) bounds a
// conversion, and that a follow-up call resumes from where the first stopped.
//
// Declared with TEST_F so that it runs under the same errno-checking fixture
// as the other tests in this file; it relies on ASSERT_ERRNO_SUCCESS().
TEST_F(LlvmLibcWcsnrtombs, SrcLimit) {
  mbstate_t state;
  LIBC_NAMESPACE::memset(&state, 0, sizeof(mbstate_t));
  /// clown emoji, sigma symbol, y with diaeresis, letter A
  const wchar_t src[] = {static_cast<wchar_t>(0x1f921),
                         static_cast<wchar_t>(0x2211),
                         static_cast<wchar_t>(0xff), static_cast<wchar_t>(0x41),
                         static_cast<wchar_t>(0x0)};
  const wchar_t *cur = src;
  char mbs[11];
  LIBC_NAMESPACE::memset(mbs, '\x01', sizeof(mbs)); // dummy initial values

  // First call: only two wide characters may be consumed, although the
  // destination could hold the whole string.
  auto res = LIBC_NAMESPACE::wcsnrtombs(mbs, &cur, 2, sizeof(mbs), &state);
  ASSERT_ERRNO_SUCCESS();
  ASSERT_EQ(res, static_cast<size_t>(7));
  ASSERT_EQ(cur, src + 2);
  ASSERT_EQ(mbs[0], '\xF0'); // clown begin
  ASSERT_EQ(mbs[1], '\x9F');
  ASSERT_EQ(mbs[2], '\xA4');
  ASSERT_EQ(mbs[3], '\xA1');
  ASSERT_EQ(mbs[4], '\xE2'); // sigma begin
  ASSERT_EQ(mbs[5], '\x88');
  ASSERT_EQ(mbs[6], '\x91');
  ASSERT_EQ(mbs[7], '\x01'); // nothing written past the second character

  // Second call: continue right after the bytes already written. The
  // destination length is the space that is actually left in mbs, so the
  // limit never claims more room than the buffer has. The source limit (100)
  // is deliberately larger than the remaining input; the conversion is
  // expected to end at the null wide character instead.
  res = LIBC_NAMESPACE::wcsnrtombs(mbs + res, &cur, 100, sizeof(mbs) - res,
                                   &state);
  ASSERT_ERRNO_SUCCESS();
  ASSERT_EQ(res, static_cast<size_t>(3));
  ASSERT_EQ(cur, nullptr);
  ASSERT_EQ(mbs[0], '\xF0'); // clown begin
  ASSERT_EQ(mbs[1], '\x9F');
  ASSERT_EQ(mbs[2], '\xA4');
  ASSERT_EQ(mbs[3], '\xA1');
  ASSERT_EQ(mbs[4], '\xE2'); // sigma begin
  ASSERT_EQ(mbs[5], '\x88');
  ASSERT_EQ(mbs[6], '\x91');
  ASSERT_EQ(mbs[7], '\xC3'); // y diaeresis begin
  ASSERT_EQ(mbs[8], '\xBF');
  ASSERT_EQ(mbs[9], '\x41');  // A begin
  ASSERT_EQ(mbs[10], '\0');   // null terminator
}
// Checks that hitting an invalid wide character makes the call return
// (size_t)-1 and set errno to EILSEQ.
TEST_F(LlvmLibcWcsnrtombs, ErrnoTest) {
  mbstate_t state;
  LIBC_NAMESPACE::memset(&state, 0, sizeof(mbstate_t));
  /// clown emoji, sigma symbol, an invalid wide character, null terminator
  const wchar_t src[] = {static_cast<wchar_t>(0x1f921),
                         static_cast<wchar_t>(0x2211),
                         static_cast<wchar_t>(0x12ffff), // invalid widechar
                         static_cast<wchar_t>(0x0)};
  const wchar_t *cur = src;
  char mbs[11];

  // A destination limit of 7 bytes holds exactly the two valid characters
  // (4 + 3 bytes), so this call succeeds without reaching the invalid one.
  ASSERT_EQ(LIBC_NAMESPACE::wcsnrtombs(mbs, &cur, 5, 7, &state),
            static_cast<size_t>(7));
  ASSERT_ERRNO_SUCCESS();
  // The next call must start at the invalid wide character; otherwise the
  // EILSEQ expectation below would not be testing what it claims to.
  ASSERT_EQ(cur, src + 2);

  // Resume from the invalid wide character with a fresh conversion state and
  // a generous destination limit: the only reason to stop is the bad input.
  LIBC_NAMESPACE::memset(&state, 0, sizeof(mbstate_t));
  ASSERT_EQ(LIBC_NAMESPACE::wcsnrtombs(mbs, &cur, 5, 100, &state),
            static_cast<size_t>(-1));
  ASSERT_ERRNO_EQ(EILSEQ);
}
// Same scenario as DestLimit, except that a null mbstate_t pointer is passed
// as the conversion state.
TEST_F(LlvmLibcWcsnrtombs, NullState) {
  // Wide input: clown emoji, sigma symbol, y with diaeresis, letter A, and the
  // terminating null wide character.
  const wchar_t src[] = {
      static_cast<wchar_t>(0x1f921), static_cast<wchar_t>(0x2211),
      static_cast<wchar_t>(0xff), static_cast<wchar_t>(0x41),
      static_cast<wchar_t>(0x0)};

  // Expected encoding of the first wide character (the clown emoji).
  const char clown[] = {'\xF0', '\x9F', '\xA4', '\xA1'};

  char mbs[11];
  const wchar_t *cur = src;

  // Case 1: the limit is exactly the size of the first character.
  LIBC_NAMESPACE::memset(mbs, '\x01', sizeof(mbs)); // sentinel fill
  ASSERT_EQ(LIBC_NAMESPACE::wcsnrtombs(mbs, &cur, 5, 4, nullptr),
            static_cast<size_t>(4));
  ASSERT_ERRNO_SUCCESS();
  ASSERT_EQ(cur, src + 1); // stopped right after the first wide character
  for (size_t i = 0; i < sizeof(clown); ++i) {
    ASSERT_EQ(mbs[i], clown[i]);
  }
  ASSERT_EQ(mbs[4], '\x01'); // sentinel intact: no more than 4 bytes written

  // Case 2: start over with a limit of 6. That is not enough room for the
  // second character as well, so again only the first one is converted.
  LIBC_NAMESPACE::memset(mbs, '\x01', sizeof(mbs));
  cur = src;
  ASSERT_EQ(LIBC_NAMESPACE::wcsnrtombs(mbs, &cur, 5, 6, nullptr),
            static_cast<size_t>(4));
  ASSERT_ERRNO_SUCCESS();
  ASSERT_EQ(cur, src + 1);
  for (size_t i = 0; i < sizeof(clown); ++i) {
    ASSERT_EQ(mbs[i], clown[i]);
  }
  ASSERT_EQ(mbs[4], '\x01'); // no partial second character was written
}