forked from OSchip/llvm-project
				
			
		
			
				
	
	
		
			361 lines
		
	
	
		
			11 KiB
		
	
	
	
		
			C++
		
	
	
	
			
		
		
	
	
			361 lines
		
	
	
		
			11 KiB
		
	
	
	
		
			C++
		
	
	
	
| //===----------------------------------------------------------------------===//
 | |
| //
 | |
| //                     The LLVM Compiler Infrastructure
 | |
| //
 | |
| // This file is dual licensed under the MIT and the University of Illinois Open
 | |
| // Source Licenses. See LICENSE.TXT for details.
 | |
| //
 | |
| //===----------------------------------------------------------------------===//
 | |
| 
 | |
| // <codecvt>
 | |
| 
 | |
| // template <class Elem, unsigned long Maxcode = 0x10ffff,
 | |
| //           codecvt_mode Mode = (codecvt_mode)0>
 | |
| // class codecvt_utf8
 | |
| //     : public codecvt<Elem, char, mbstate_t>
 | |
| // {
 | |
| //     // unspecified
 | |
| // };
 | |
| 
 | |
| // result
 | |
| //     in(stateT& state,
 | |
| //        const externT* from, const externT* from_end, const externT*& from_next,
 | |
| //        internT* to, internT* to_end, internT*& to_next) const;
 | |
| 
 | |
#include <codecvt>
#include <cassert>
#include <cstddef>
#include <cwchar>

namespace {

// UTF-8 inputs shared by the facet configurations exercised in main().
// The code point noted beside each one is the value main() expects in() to
// produce for it.
const char utf8_4byte[] = {char(0xF1), char(0x80), char(0x80), char(0x83)};  // 0x40003
const char utf8_3byte[] = {char(0xE1), char(0x80), char(0x85)};              // 0x1005
const char utf8_2byte[] = {char(0xD1), char(0x93)};                          // 0x453
const char utf8_1byte[] = {char(0x56)};                                      // 0x56

// The same sequences preceded by the bytes EF BB BF, which the
// std::consume_header facets below are expected to skip.
const char bom_utf8_4byte[] = {char(0xEF), char(0xBB), char(0xBF),
                               char(0xF1), char(0x80), char(0x80), char(0x83)};
const char bom_utf8_3byte[] = {char(0xEF), char(0xBB), char(0xBF),
                               char(0xE1), char(0x80), char(0x85)};
const char bom_utf8_2byte[] = {char(0xEF), char(0xBB), char(0xBF),
                               char(0xD1), char(0x93)};

// Converts all N bytes of `bytes` with cvt.in() into a one-element output
// buffer and asserts that the conversion succeeded, consumed the whole input,
// produced exactly one element, and that the element equals `expected`.
//
// Each call uses a value-initialized mbstate_t (codecvt::in requires an
// initialized state at the start of a sequence) and a zeroed output element,
// so the final value check can only pass if in() actually wrote the result.
template <class Facet, std::size_t N>
void expect_decoded(const Facet& cvt, const char (&bytes)[N], unsigned long expected)
{
    typedef typename Facet::intern_type Elem;

    std::mbstate_t state = std::mbstate_t();
    Elem out = Elem();
    const char* bytes_next = nullptr;
    Elem* out_next = nullptr;

    const std::codecvt_base::result status =
        cvt.in(state, bytes, bytes + N, bytes_next, &out, &out + 1, out_next);

    assert(status == std::codecvt_base::ok);
    assert(out_next == &out + 1);
    assert(bytes_next == bytes + N);
    assert(static_cast<unsigned long>(out) == expected);
}

// Converts all N bytes of `bytes` with cvt.in() and asserts that the
// conversion reported an error without consuming any input, without advancing
// the output pointer, and without modifying the (zeroed) output element.
template <class Facet, std::size_t N>
void expect_rejected(const Facet& cvt, const char (&bytes)[N])
{
    typedef typename Facet::intern_type Elem;

    std::mbstate_t state = std::mbstate_t();
    Elem out = Elem();
    const char* bytes_next = nullptr;
    Elem* out_next = nullptr;

    const std::codecvt_base::result status =
        cvt.in(state, bytes, bytes + N, bytes_next, &out, &out + 1, out_next);

    assert(status == std::codecvt_base::error);
    assert(out_next == &out);
    assert(bytes_next == bytes);
    assert(out == Elem());
}

}  // namespace

// Exercises codecvt_utf8<Elem, Maxcode, Mode>::in() for wchar_t, char32_t and
// char16_t, each with the default Maxcode, with Maxcode = 0x1000, and with
// std::consume_header.
int main()
{
    // wchar_t, default Maxcode.
    // NOTE(review): the 0x40003 expectation assumes wchar_t can represent that
    // value; confirm for targets with a 16-bit wchar_t.
    {
        typedef std::codecvt_utf8<wchar_t> C;
        C c;
        expect_decoded(c, utf8_4byte, 0x40003);
        expect_decoded(c, utf8_3byte, 0x1005);
        expect_decoded(c, utf8_2byte, 0x453);
        expect_decoded(c, utf8_1byte, 0x56);
    }
    // wchar_t, Maxcode = 0x1000: anything decoding above 0x1000 is an error.
    {
        typedef std::codecvt_utf8<wchar_t, 0x1000> C;
        C c;
        expect_rejected(c, utf8_4byte);
        expect_rejected(c, utf8_3byte);
        expect_decoded(c, utf8_2byte, 0x453);
        expect_decoded(c, utf8_1byte, 0x56);
    }
    // wchar_t, consume_header: input is accepted with or without the header.
    {
        typedef std::codecvt_utf8<wchar_t, 0xFFFFFFFF, std::consume_header> C;
        C c;
        expect_decoded(c, bom_utf8_4byte, 0x40003);
        expect_decoded(c, utf8_3byte, 0x1005);
        expect_decoded(c, bom_utf8_2byte, 0x453);
        expect_decoded(c, utf8_1byte, 0x56);
    }
    // char32_t, default Maxcode.
    {
        typedef std::codecvt_utf8<char32_t> C;
        C c;
        expect_decoded(c, utf8_4byte, 0x40003);
        expect_decoded(c, utf8_3byte, 0x1005);
        expect_decoded(c, utf8_2byte, 0x453);
        expect_decoded(c, utf8_1byte, 0x56);
    }
    // char32_t, Maxcode = 0x1000.
    {
        typedef std::codecvt_utf8<char32_t, 0x1000> C;
        C c;
        expect_rejected(c, utf8_4byte);
        expect_rejected(c, utf8_3byte);
        expect_decoded(c, utf8_2byte, 0x453);
        expect_decoded(c, utf8_1byte, 0x56);
    }
    // char32_t, consume_header.
    {
        typedef std::codecvt_utf8<char32_t, 0xFFFFFFFF, std::consume_header> C;
        C c;
        expect_decoded(c, bom_utf8_4byte, 0x40003);
        expect_decoded(c, utf8_3byte, 0x1005);
        expect_decoded(c, bom_utf8_2byte, 0x453);
        expect_decoded(c, utf8_1byte, 0x56);
    }
    // char16_t, default Maxcode (no four-byte input is tested for char16_t).
    {
        typedef std::codecvt_utf8<char16_t> C;
        C c;
        expect_decoded(c, utf8_3byte, 0x1005);
        expect_decoded(c, utf8_2byte, 0x453);
        expect_decoded(c, utf8_1byte, 0x56);
    }
    // char16_t, Maxcode = 0x1000.
    {
        typedef std::codecvt_utf8<char16_t, 0x1000> C;
        C c;
        expect_rejected(c, utf8_3byte);
        expect_decoded(c, utf8_2byte, 0x453);
        expect_decoded(c, utf8_1byte, 0x56);
    }
    // char16_t, consume_header.
    {
        typedef std::codecvt_utf8<char16_t, 0xFFFFFFFF, std::consume_header> C;
        C c;
        expect_decoded(c, bom_utf8_3byte, 0x1005);
        expect_decoded(c, utf8_2byte, 0x453);
        expect_decoded(c, utf8_1byte, 0x56);
    }
}