llvm-project/libcxx/test/std/localization/locale.stdcvt/codecvt_utf8_in.pass.cpp

361 lines
11 KiB
C++

//===----------------------------------------------------------------------===//
//
// The LLVM Compiler Infrastructure
//
// This file is dual licensed under the MIT and the University of Illinois Open
// Source Licenses. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
// <codecvt>
// template <class Elem, unsigned long Maxcode = 0x10ffff,
// codecvt_mode Mode = (codecvt_mode)0>
// class codecvt_utf8
// : public codecvt<Elem, char, mbstate_t>
// {
// // unspecified
// };
// result
// in(stateT& state,
// const externT* from, const externT* from_end, const externT*& from_next,
// internT* to, internT* to_end, internT*& to_next) const;
#include <codecvt>
#include <cassert>
int main()
{
{
typedef std::codecvt_utf8<wchar_t> C;
C c;
wchar_t w = 0;
char n[4] = {char(0xF1), char(0x80), char(0x80), char(0x83)};
wchar_t* wp = nullptr;
std::mbstate_t m;
const char* np = nullptr;
std::codecvt_base::result r = c.in(m, n, n+4, np, &w, &w+1, wp);
assert(r == std::codecvt_base::ok);
assert(wp == &w+1);
assert(np == n+4);
assert(w == 0x40003);
n[0] = char(0xE1);
n[1] = char(0x80);
n[2] = char(0x85);
r = c.in(m, n, n+3, np, &w, &w+1, wp);
assert(r == std::codecvt_base::ok);
assert(wp == &w+1);
assert(np == n+3);
assert(w == 0x1005);
n[0] = char(0xD1);
n[1] = char(0x93);
r = c.in(m, n, n+2, np, &w, &w+1, wp);
assert(r == std::codecvt_base::ok);
assert(wp == &w+1);
assert(np == n+2);
assert(w == 0x453);
w = 0x56;
n[0] = char(0x56);
r = c.in(m, n, n+1, np, &w, &w+1, wp);
assert(r == std::codecvt_base::ok);
assert(wp == &w+1);
assert(np == n+1);
assert(w == 0x56);
}
{
typedef std::codecvt_utf8<wchar_t, 0x1000> C;
C c;
wchar_t w = 0;
char n[4] = {char(0xF1), char(0x80), char(0x80), char(0x83)};
wchar_t* wp = nullptr;
std::mbstate_t m;
const char* np = nullptr;
std::codecvt_base::result r = c.in(m, n, n+4, np, &w, &w+1, wp);
assert(r == std::codecvt_base::error);
assert(wp == &w);
assert(np == n);
assert(w == 0);
n[0] = char(0xE1);
n[1] = char(0x80);
n[2] = char(0x85);
r = c.in(m, n, n+3, np, &w, &w+1, wp);
assert(r == std::codecvt_base::error);
assert(wp == &w);
assert(np == n);
assert(w == 0);
n[0] = char(0xD1);
n[1] = char(0x93);
r = c.in(m, n, n+2, np, &w, &w+1, wp);
assert(r == std::codecvt_base::ok);
assert(wp == &w+1);
assert(np == n+2);
assert(w == 0x453);
w = 0x56;
n[0] = char(0x56);
r = c.in(m, n, n+1, np, &w, &w+1, wp);
assert(r == std::codecvt_base::ok);
assert(wp == &w+1);
assert(np == n+1);
assert(w == 0x56);
}
{
typedef std::codecvt_utf8<wchar_t, 0xFFFFFFFF, std::consume_header> C;
C c;
wchar_t w = 0;
char n[7] = {char(0xEF), char(0xBB), char(0xBF), char(0xF1), char(0x80), char(0x80), char(0x83)};
wchar_t* wp = nullptr;
std::mbstate_t m;
const char* np = nullptr;
std::codecvt_base::result r = c.in(m, n, n+7, np, &w, &w+1, wp);
assert(r == std::codecvt_base::ok);
assert(wp == &w+1);
assert(np == n+7);
assert(w == 0x40003);
n[0] = char(0xE1);
n[1] = char(0x80);
n[2] = char(0x85);
r = c.in(m, n, n+3, np, &w, &w+1, wp);
assert(r == std::codecvt_base::ok);
assert(wp == &w+1);
assert(np == n+3);
assert(w == 0x1005);
n[0] = char(0xEF);
n[1] = char(0xBB);
n[2] = char(0xBF);
n[3] = char(0xD1);
n[4] = char(0x93);
r = c.in(m, n, n+5, np, &w, &w+1, wp);
assert(r == std::codecvt_base::ok);
assert(wp == &w+1);
assert(np == n+5);
assert(w == 0x453);
w = 0x56;
n[0] = char(0x56);
r = c.in(m, n, n+1, np, &w, &w+1, wp);
assert(r == std::codecvt_base::ok);
assert(wp == &w+1);
assert(np == n+1);
assert(w == 0x56);
}
{
typedef std::codecvt_utf8<char32_t> C;
C c;
char32_t w = 0;
char n[4] = {char(0xF1), char(0x80), char(0x80), char(0x83)};
char32_t* wp = nullptr;
std::mbstate_t m;
const char* np = nullptr;
std::codecvt_base::result r = c.in(m, n, n+4, np, &w, &w+1, wp);
assert(r == std::codecvt_base::ok);
assert(wp == &w+1);
assert(np == n+4);
assert(w == 0x40003);
n[0] = char(0xE1);
n[1] = char(0x80);
n[2] = char(0x85);
r = c.in(m, n, n+3, np, &w, &w+1, wp);
assert(r == std::codecvt_base::ok);
assert(wp == &w+1);
assert(np == n+3);
assert(w == 0x1005);
n[0] = char(0xD1);
n[1] = char(0x93);
r = c.in(m, n, n+2, np, &w, &w+1, wp);
assert(r == std::codecvt_base::ok);
assert(wp == &w+1);
assert(np == n+2);
assert(w == 0x453);
w = 0x56;
n[0] = char(0x56);
r = c.in(m, n, n+1, np, &w, &w+1, wp);
assert(r == std::codecvt_base::ok);
assert(wp == &w+1);
assert(np == n+1);
assert(w == 0x56);
}
{
typedef std::codecvt_utf8<char32_t, 0x1000> C;
C c;
char32_t w = 0;
char n[4] = {char(0xF1), char(0x80), char(0x80), char(0x83)};
char32_t* wp = nullptr;
std::mbstate_t m;
const char* np = nullptr;
std::codecvt_base::result r = c.in(m, n, n+4, np, &w, &w+1, wp);
assert(r == std::codecvt_base::error);
assert(wp == &w);
assert(np == n);
assert(w == 0);
n[0] = char(0xE1);
n[1] = char(0x80);
n[2] = char(0x85);
r = c.in(m, n, n+3, np, &w, &w+1, wp);
assert(r == std::codecvt_base::error);
assert(wp == &w);
assert(np == n);
assert(w == 0);
n[0] = char(0xD1);
n[1] = char(0x93);
r = c.in(m, n, n+2, np, &w, &w+1, wp);
assert(r == std::codecvt_base::ok);
assert(wp == &w+1);
assert(np == n+2);
assert(w == 0x453);
w = 0x56;
n[0] = char(0x56);
r = c.in(m, n, n+1, np, &w, &w+1, wp);
assert(r == std::codecvt_base::ok);
assert(wp == &w+1);
assert(np == n+1);
assert(w == 0x56);
}
{
typedef std::codecvt_utf8<char32_t, 0xFFFFFFFF, std::consume_header> C;
C c;
char32_t w = 0;
char n[7] = {char(0xEF), char(0xBB), char(0xBF), char(0xF1), char(0x80), char(0x80), char(0x83)};
char32_t* wp = nullptr;
std::mbstate_t m;
const char* np = nullptr;
std::codecvt_base::result r = c.in(m, n, n+7, np, &w, &w+1, wp);
assert(r == std::codecvt_base::ok);
assert(wp == &w+1);
assert(np == n+7);
assert(w == 0x40003);
n[0] = char(0xE1);
n[1] = char(0x80);
n[2] = char(0x85);
r = c.in(m, n, n+3, np, &w, &w+1, wp);
assert(r == std::codecvt_base::ok);
assert(wp == &w+1);
assert(np == n+3);
assert(w == 0x1005);
n[0] = char(0xEF);
n[1] = char(0xBB);
n[2] = char(0xBF);
n[3] = char(0xD1);
n[4] = char(0x93);
r = c.in(m, n, n+5, np, &w, &w+1, wp);
assert(r == std::codecvt_base::ok);
assert(wp == &w+1);
assert(np == n+5);
assert(w == 0x453);
w = 0x56;
n[0] = char(0x56);
r = c.in(m, n, n+1, np, &w, &w+1, wp);
assert(r == std::codecvt_base::ok);
assert(wp == &w+1);
assert(np == n+1);
assert(w == 0x56);
}
{
typedef std::codecvt_utf8<char16_t> C;
C c;
char16_t w = 0;
char n[3] = {char(0xE1), char(0x80), char(0x85)};
char16_t* wp = nullptr;
std::mbstate_t m;
const char* np = nullptr;
std::codecvt_base::result r = c.in(m, n, n+3, np, &w, &w+1, wp);
assert(r == std::codecvt_base::ok);
assert(wp == &w+1);
assert(np == n+3);
assert(w == 0x1005);
n[0] = char(0xD1);
n[1] = char(0x93);
r = c.in(m, n, n+2, np, &w, &w+1, wp);
assert(r == std::codecvt_base::ok);
assert(wp == &w+1);
assert(np == n+2);
assert(w == 0x453);
w = 0x56;
n[0] = char(0x56);
r = c.in(m, n, n+1, np, &w, &w+1, wp);
assert(r == std::codecvt_base::ok);
assert(wp == &w+1);
assert(np == n+1);
assert(w == 0x56);
}
{
typedef std::codecvt_utf8<char16_t, 0x1000> C;
C c;
char16_t w = 0;
char n[3] = {char(0xE1), char(0x80), char(0x85)};
char16_t* wp = nullptr;
std::mbstate_t m;
const char* np = nullptr;
std::codecvt_base::result r = c.in(m, n, n+3, np, &w, &w+1, wp);
assert(r == std::codecvt_base::error);
assert(wp == &w);
assert(np == n);
assert(w == 0);
n[0] = char(0xD1);
n[1] = char(0x93);
r = c.in(m, n, n+2, np, &w, &w+1, wp);
assert(r == std::codecvt_base::ok);
assert(wp == &w+1);
assert(np == n+2);
assert(w == 0x453);
w = 0x56;
n[0] = char(0x56);
r = c.in(m, n, n+1, np, &w, &w+1, wp);
assert(r == std::codecvt_base::ok);
assert(wp == &w+1);
assert(np == n+1);
assert(w == 0x56);
}
{
typedef std::codecvt_utf8<char16_t, 0xFFFFFFFF, std::consume_header> C;
C c;
char16_t w = 0;
char n[6] = {char(0xEF), char(0xBB), char(0xBF), char(0xE1), char(0x80), char(0x85)};
char16_t* wp = nullptr;
std::mbstate_t m;
const char* np = nullptr;
std::codecvt_base::result r = c.in(m, n, n+6, np, &w, &w+1, wp);
assert(r == std::codecvt_base::ok);
assert(wp == &w+1);
assert(np == n+6);
assert(w == 0x1005);
n[0] = char(0xD1);
n[1] = char(0x93);
r = c.in(m, n, n+2, np, &w, &w+1, wp);
assert(r == std::codecvt_base::ok);
assert(wp == &w+1);
assert(np == n+2);
assert(w == 0x453);
w = 0x56;
n[0] = char(0x56);
r = c.in(m, n, n+1, np, &w, &w+1, wp);
assert(r == std::codecvt_base::ok);
assert(wp == &w+1);
assert(np == n+1);
assert(w == 0x56);
}
}