//===----------------------------------------------------------------------===// // // The LLVM Compiler Infrastructure // // This file is dual licensed under the MIT and the University of Illinois Open // Source Licenses. See LICENSE.TXT for details. // //===----------------------------------------------------------------------===// // <codecvt> // template <class Elem, unsigned long Maxcode = 0x10ffff, // codecvt_mode Mode = (codecvt_mode)0> // class codecvt_utf8 // : public codecvt<Elem, char, mbstate_t> // { // // unspecified // }; // result // in(stateT& state, // const externT* from, const externT* from_end, const externT*& from_next, // internT* to, internT* to_end, internT*& to_next) const; #include <codecvt> #include <cassert> int main() { { typedef std::codecvt_utf8<char32_t> C; C c; char32_t w = 0; char n[4] = {char(0xF1), char(0x80), char(0x80), char(0x83)}; char32_t* wp = nullptr; std::mbstate_t m; const char* np = nullptr; std::codecvt_base::result r = c.in(m, n, n+4, np, &w, &w+1, wp); assert(r == std::codecvt_base::ok); assert(wp == &w+1); assert(np == n+4); assert(w == 0x40003); n[0] = char(0xE1); n[1] = char(0x80); n[2] = char(0x85); r = c.in(m, n, n+3, np, &w, &w+1, wp); assert(r == std::codecvt_base::ok); assert(wp == &w+1); assert(np == n+3); assert(w == 0x1005); n[0] = char(0xD1); n[1] = char(0x93); r = c.in(m, n, n+2, np, &w, &w+1, wp); assert(r == std::codecvt_base::ok); assert(wp == &w+1); assert(np == n+2); assert(w == 0x453); w = 0x56; n[0] = char(0x56); r = c.in(m, n, n+1, np, &w, &w+1, wp); assert(r == std::codecvt_base::ok); assert(wp == &w+1); assert(np == n+1); assert(w == 0x56); } { typedef std::codecvt_utf8<char32_t, 0x1000> C; C c; char32_t w = 0; char n[4] = {char(0xF1), char(0x80), char(0x80), char(0x83)}; char32_t* wp = nullptr; std::mbstate_t m; const char* np = nullptr; std::codecvt_base::result r = c.in(m, n, n+4, np, &w, &w+1, wp); assert(r == std::codecvt_base::error); assert(wp == &w); assert(np == n); assert(w == 0); n[0] = char(0xE1); n[1] = char(0x80); n[2] = char(0x85); r = c.in(m, n, n+3, np, &w, &w+1, wp); assert(r == std::codecvt_base::error); assert(wp == &w); assert(np == n); assert(w == 0); n[0] = char(0xD1); n[1] = char(0x93); r = c.in(m, n, n+2, np, &w, &w+1, wp); assert(r == std::codecvt_base::ok); assert(wp == &w+1); assert(np == n+2); assert(w == 0x453); w = 0x56; n[0] = char(0x56); r = c.in(m, n, n+1, np, &w, &w+1, wp); assert(r == std::codecvt_base::ok); assert(wp == &w+1); assert(np == n+1); assert(w == 0x56); } { typedef std::codecvt_utf8<char32_t, 0xFFFFFFFF, std::consume_header> C; C c; char32_t w = 0; char n[7] = {char(0xEF), char(0xBB), char(0xBF), char(0xF1), char(0x80), char(0x80), char(0x83)}; char32_t* wp = nullptr; std::mbstate_t m; const char* np = nullptr; std::codecvt_base::result r = c.in(m, n, n+7, np, &w, &w+1, wp); assert(r == std::codecvt_base::ok); assert(wp == &w+1); assert(np == n+7); assert(w == 0x40003); n[0] = char(0xE1); n[1] = char(0x80); n[2] = char(0x85); r = c.in(m, n, n+3, np, &w, &w+1, wp); assert(r == std::codecvt_base::ok); assert(wp == &w+1); assert(np == n+3); assert(w == 0x1005); n[0] = char(0xEF); n[1] = char(0xBB); n[2] = char(0xBF); n[3] = char(0xD1); n[4] = char(0x93); r = c.in(m, n, n+5, np, &w, &w+1, wp); assert(r == std::codecvt_base::ok); assert(wp == &w+1); assert(np == n+5); assert(w == 0x453); w = 0x56; n[0] = char(0x56); r = c.in(m, n, n+1, np, &w, &w+1, wp); assert(r == std::codecvt_base::ok); assert(wp == &w+1); assert(np == n+1); assert(w == 0x56); } { typedef std::codecvt_utf8<char32_t> C; C c; char32_t w = 0; char n[4] = {char(0xF1), char(0x80), char(0x80), char(0x83)}; char32_t* wp = nullptr; std::mbstate_t m; const char* np = nullptr; std::codecvt_base::result r = c.in(m, n, n+4, np, &w, &w+1, wp); assert(r == std::codecvt_base::ok); assert(wp == &w+1); assert(np == n+4); assert(w == 0x40003); n[0] = char(0xE1); n[1] = char(0x80); n[2] = char(0x85); r = c.in(m, n, n+3, np, &w, &w+1, wp); assert(r == std::codecvt_base::ok); assert(wp == &w+1); assert(np == n+3); assert(w == 0x1005); n[0] = char(0xD1); n[1] = char(0x93); r = c.in(m, n, n+2, np, &w, &w+1, wp); assert(r == std::codecvt_base::ok); assert(wp == &w+1); assert(np == n+2); assert(w == 0x453); w = 0x56; n[0] = char(0x56); r = c.in(m, n, n+1, np, &w, &w+1, wp); assert(r == std::codecvt_base::ok); assert(wp == &w+1); assert(np == n+1); assert(w == 0x56); } { typedef std::codecvt_utf8<char32_t, 0x1000> C; C c; char32_t w = 0; char n[4] = {char(0xF1), char(0x80), char(0x80), char(0x83)}; char32_t* wp = nullptr; std::mbstate_t m; const char* np = nullptr; std::codecvt_base::result r = c.in(m, n, n+4, np, &w, &w+1, wp); assert(r == std::codecvt_base::error); assert(wp == &w); assert(np == n); assert(w == 0); n[0] = char(0xE1); n[1] = char(0x80); n[2] = char(0x85); r = c.in(m, n, n+3, np, &w, &w+1, wp); assert(r == std::codecvt_base::error); assert(wp == &w); assert(np == n); assert(w == 0); n[0] = char(0xD1); n[1] = char(0x93); r = c.in(m, n, n+2, np, &w, &w+1, wp); assert(r == std::codecvt_base::ok); assert(wp == &w+1); assert(np == n+2); assert(w == 0x453); w = 0x56; n[0] = char(0x56); r = c.in(m, n, n+1, np, &w, &w+1, wp); assert(r == std::codecvt_base::ok); assert(wp == &w+1); assert(np == n+1); assert(w == 0x56); } { typedef std::codecvt_utf8<char32_t, 0xFFFFFFFF, std::consume_header> C; C c; char32_t w = 0; char n[7] = {char(0xEF), char(0xBB), char(0xBF), char(0xF1), char(0x80), char(0x80), char(0x83)}; char32_t* wp = nullptr; std::mbstate_t m; const char* np = nullptr; std::codecvt_base::result r = c.in(m, n, n+7, np, &w, &w+1, wp); assert(r == std::codecvt_base::ok); assert(wp == &w+1); assert(np == n+7); assert(w == 0x40003); n[0] = char(0xE1); n[1] = char(0x80); n[2] = char(0x85); r = c.in(m, n, n+3, np, &w, &w+1, wp); assert(r == std::codecvt_base::ok); assert(wp == &w+1); assert(np == n+3); assert(w == 0x1005); n[0] = char(0xEF); n[1] = char(0xBB); n[2] = char(0xBF); n[3] = char(0xD1); n[4] = char(0x93); r = c.in(m, n, n+5, np, &w, &w+1, wp); assert(r == std::codecvt_base::ok); assert(wp == &w+1); assert(np == n+5); assert(w == 0x453); w = 0x56; n[0] = char(0x56); r = c.in(m, n, n+1, np, &w, &w+1, wp); assert(r == std::codecvt_base::ok); assert(wp == &w+1); assert(np == n+1); assert(w == 0x56); } { typedef std::codecvt_utf8<char16_t> C; C c; char16_t w = 0; char n[3] = {char(0xE1), char(0x80), char(0x85)}; char16_t* wp = nullptr; std::mbstate_t m; const char* np = nullptr; std::codecvt_base::result r = c.in(m, n, n+3, np, &w, &w+1, wp); assert(r == std::codecvt_base::ok); assert(wp == &w+1); assert(np == n+3); assert(w == 0x1005); n[0] = char(0xD1); n[1] = char(0x93); r = c.in(m, n, n+2, np, &w, &w+1, wp); assert(r == std::codecvt_base::ok); assert(wp == &w+1); assert(np == n+2); assert(w == 0x453); w = 0x56; n[0] = char(0x56); r = c.in(m, n, n+1, np, &w, &w+1, wp); assert(r == std::codecvt_base::ok); assert(wp == &w+1); assert(np == n+1); assert(w == 0x56); } { typedef std::codecvt_utf8<char16_t, 0x1000> C; C c; char16_t w = 0; char n[3] = {char(0xE1), char(0x80), char(0x85)}; char16_t* wp = nullptr; std::mbstate_t m; const char* np = nullptr; std::codecvt_base::result r = c.in(m, n, n+3, np, &w, &w+1, wp); assert(r == std::codecvt_base::error); assert(wp == &w); assert(np == n); assert(w == 0); n[0] = char(0xD1); n[1] = char(0x93); r = c.in(m, n, n+2, np, &w, &w+1, wp); assert(r == std::codecvt_base::ok); assert(wp == &w+1); assert(np == n+2); assert(w == 0x453); w = 0x56; n[0] = char(0x56); r = c.in(m, n, n+1, np, &w, &w+1, wp); assert(r == std::codecvt_base::ok); assert(wp == &w+1); assert(np == n+1); assert(w == 0x56); } { typedef std::codecvt_utf8<char16_t, 0xFFFFFFFF, std::consume_header> C; C c; char16_t w = 0; char n[6] = {char(0xEF), char(0xBB), char(0xBF), char(0xE1), char(0x80), char(0x85)}; char16_t* wp = nullptr; std::mbstate_t m; const char* np = nullptr; std::codecvt_base::result r = c.in(m, n, n+6, np, &w, &w+1, wp); assert(r == std::codecvt_base::ok); assert(wp == &w+1); assert(np == n+6); assert(w == 0x1005); n[0] = char(0xD1); n[1] = char(0x93); r = c.in(m, n, n+2, np, &w, &w+1, wp); assert(r == std::codecvt_base::ok); assert(wp == &w+1); assert(np == n+2); assert(w == 0x453); w = 0x56; n[0] = char(0x56); r = c.in(m, n, n+1, np, &w, &w+1, wp); assert(r == std::codecvt_base::ok); assert(wp == &w+1); assert(np == n+1); assert(w == 0x56); } }