1 //===------------------------- locale.cpp ---------------------------------===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is dual licensed under the MIT and the University of Illinois Open
6 // Source Licenses. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 
10 // On Solaris, we need to define something to make the C99 parts of localeconv
11 // visible.
12 #ifdef __sun__
13 #define _LCONV_C99
14 #endif
15 
16 #include "string"
17 #include "locale"
18 #include "codecvt"
19 #include "vector"
20 #include "algorithm"
21 #include "typeinfo"
22 #ifndef _LIBCPP_NO_EXCEPTIONS
23 #  include "type_traits"
24 #endif
25 #include "clocale"
26 #include "cstring"
27 #if defined(_LIBCPP_MSVCRT)
28 #define _CTYPE_DISABLE_MACROS
29 #endif
30 #include "cwctype"
31 #include "__sso_allocator"
32 #if defined(_LIBCPP_MSVCRT) || defined(__MINGW32__)
33 #include "support/win32/locale_win32.h"
34 #elif !defined(__BIONIC__)
35 #include <langinfo.h>
36 #endif
37 #include <stdlib.h>
38 #include <stdio.h>
39 #include "include/atomic_support.h"
40 #include "__undef_macros"
41 
42 // On Linux, wint_t and wchar_t have different signed-ness, and this causes
43 // lots of noise in the build log, but no bugs that I know of.
44 #if defined(__clang__)
45 #pragma clang diagnostic ignored "-Wsign-conversion"
46 #endif
47 
48 _LIBCPP_BEGIN_NAMESPACE_STD
49 
50 struct __libcpp_unique_locale {
__libcpp_unique_locale__libcpp_unique_locale51   __libcpp_unique_locale(const char* nm) : __loc_(newlocale(LC_ALL_MASK, nm, 0)) {}
52 
~__libcpp_unique_locale__libcpp_unique_locale53   ~__libcpp_unique_locale() {
54     if (__loc_)
55       freelocale(__loc_);
56   }
57 
operator bool__libcpp_unique_locale58   explicit operator bool() const { return __loc_; }
59 
get__libcpp_unique_locale60   locale_t& get() { return __loc_; }
61 
62   locale_t __loc_;
63 private:
64   __libcpp_unique_locale(__libcpp_unique_locale const&);
65   __libcpp_unique_locale& operator=(__libcpp_unique_locale const&);
66 };
67 
68 #ifdef __cloc_defined
__cloc()69 locale_t __cloc() {
70   // In theory this could create a race condition. In practice
71   // the race condition is non-fatal since it will just create
72   // a little resource leak. Better approach would be appreciated.
73   static locale_t result = newlocale(LC_ALL_MASK, "C", 0);
74   return result;
75 }
76 #endif // __cloc_defined
77 
78 namespace {
79 
80 struct release
81 {
operator ()__anonbaef69a20111::release82     void operator()(locale::facet* p) {p->__release_shared();}
83 };
84 
85 template <class T, class A0>
86 inline
87 T&
make(A0 a0)88 make(A0 a0)
89 {
90     static typename aligned_storage<sizeof(T)>::type buf;
91     auto *obj = ::new (&buf) T(a0);
92     return *obj;
93 }
94 
95 template <class T, class A0, class A1>
96 inline
97 T&
make(A0 a0,A1 a1)98 make(A0 a0, A1 a1)
99 {
100     static typename aligned_storage<sizeof(T)>::type buf;
101     ::new (&buf) T(a0, a1);
102     return *reinterpret_cast<T*>(&buf);
103 }
104 
105 template <class T, class A0, class A1, class A2>
106 inline
107 T&
make(A0 a0,A1 a1,A2 a2)108 make(A0 a0, A1 a1, A2 a2)
109 {
110     static typename aligned_storage<sizeof(T)>::type buf;
111     auto *obj = ::new (&buf) T(a0, a1, a2);
112     return *obj;
113 }
114 
115 template <typename T, size_t N>
116 inline
117 _LIBCPP_CONSTEXPR
118 size_t
countof(const T (&)[N])119 countof(const T (&)[N])
120 {
121     return N;
122 }
123 
124 template <typename T>
125 inline
126 _LIBCPP_CONSTEXPR
127 size_t
countof(const T * const begin,const T * const end)128 countof(const T * const begin, const T * const end)
129 {
130     return static_cast<size_t>(end - begin);
131 }
132 
__throw_runtime_error(const string & msg)133 _LIBCPP_NORETURN static void __throw_runtime_error(const string &msg)
134 {
135 #ifndef _LIBCPP_NO_EXCEPTIONS
136     throw runtime_error(msg);
137 #else
138     (void)msg;
139     _VSTD::abort();
140 #endif
141 }
142 
143 }
144 
145 #if defined(_AIX)
146 // Set priority to INT_MIN + 256 + 150
147 # pragma priority ( -2147483242 )
148 #endif
149 
150 const locale::category locale::none;
151 const locale::category locale::collate;
152 const locale::category locale::ctype;
153 const locale::category locale::monetary;
154 const locale::category locale::numeric;
155 const locale::category locale::time;
156 const locale::category locale::messages;
157 const locale::category locale::all;
158 
159 class _LIBCPP_HIDDEN locale::__imp
160     : public facet
161 {
162     enum {N = 28};
163 #if defined(_LIBCPP_COMPILER_MSVC)
164 // FIXME: MSVC doesn't support aligned parameters by value.
165 // I can't get the __sso_allocator to work here
166 // for MSVC I think for this reason.
167     vector<facet*> facets_;
168 #else
169     vector<facet*, __sso_allocator<facet*, N> > facets_;
170 #endif
171     string         name_;
172 public:
173     explicit __imp(size_t refs = 0);
174     explicit __imp(const string& name, size_t refs = 0);
175     __imp(const __imp&);
176     __imp(const __imp&, const string&, locale::category c);
177     __imp(const __imp& other, const __imp& one, locale::category c);
178     __imp(const __imp&, facet* f, long id);
179     ~__imp();
180 
name() const181     const string& name() const {return name_;}
has_facet(long id) const182     bool has_facet(long id) const
183         {return static_cast<size_t>(id) < facets_.size() && facets_[static_cast<size_t>(id)];}
184     const locale::facet* use_facet(long id) const;
185 
186     static const locale& make_classic();
187     static       locale& make_global();
188 private:
189     void install(facet* f, long id);
install(F * f)190     template <class F> void install(F* f) {install(f, f->id.__get());}
191     template <class F> void install_from(const __imp& other);
192 };
193 
__imp(size_t refs)194 locale::__imp::__imp(size_t refs)
195     : facet(refs),
196       facets_(N),
197       name_("C")
198 {
199     facets_.clear();
200     install(&make<_VSTD::collate<char> >(1u));
201     install(&make<_VSTD::collate<wchar_t> >(1u));
202     install(&make<_VSTD::ctype<char> >(nullptr, false, 1u));
203     install(&make<_VSTD::ctype<wchar_t> >(1u));
204     install(&make<codecvt<char, char, mbstate_t> >(1u));
205     install(&make<codecvt<wchar_t, char, mbstate_t> >(1u));
206     install(&make<codecvt<char16_t, char, mbstate_t> >(1u));
207     install(&make<codecvt<char32_t, char, mbstate_t> >(1u));
208     install(&make<numpunct<char> >(1u));
209     install(&make<numpunct<wchar_t> >(1u));
210     install(&make<num_get<char> >(1u));
211     install(&make<num_get<wchar_t> >(1u));
212     install(&make<num_put<char> >(1u));
213     install(&make<num_put<wchar_t> >(1u));
214     install(&make<moneypunct<char, false> >(1u));
215     install(&make<moneypunct<char, true> >(1u));
216     install(&make<moneypunct<wchar_t, false> >(1u));
217     install(&make<moneypunct<wchar_t, true> >(1u));
218     install(&make<money_get<char> >(1u));
219     install(&make<money_get<wchar_t> >(1u));
220     install(&make<money_put<char> >(1u));
221     install(&make<money_put<wchar_t> >(1u));
222     install(&make<time_get<char> >(1u));
223     install(&make<time_get<wchar_t> >(1u));
224     install(&make<time_put<char> >(1u));
225     install(&make<time_put<wchar_t> >(1u));
226     install(&make<_VSTD::messages<char> >(1u));
227     install(&make<_VSTD::messages<wchar_t> >(1u));
228 }
229 
__imp(const string & name,size_t refs)230 locale::__imp::__imp(const string& name, size_t refs)
231     : facet(refs),
232       facets_(N),
233       name_(name)
234 {
235 #ifndef _LIBCPP_NO_EXCEPTIONS
236     try
237     {
238 #endif  // _LIBCPP_NO_EXCEPTIONS
239         facets_ = locale::classic().__locale_->facets_;
240         for (unsigned i = 0; i < facets_.size(); ++i)
241             if (facets_[i])
242                 facets_[i]->__add_shared();
243         install(new collate_byname<char>(name_));
244         install(new collate_byname<wchar_t>(name_));
245         install(new ctype_byname<char>(name_));
246         install(new ctype_byname<wchar_t>(name_));
247         install(new codecvt_byname<char, char, mbstate_t>(name_));
248         install(new codecvt_byname<wchar_t, char, mbstate_t>(name_));
249         install(new codecvt_byname<char16_t, char, mbstate_t>(name_));
250         install(new codecvt_byname<char32_t, char, mbstate_t>(name_));
251         install(new numpunct_byname<char>(name_));
252         install(new numpunct_byname<wchar_t>(name_));
253         install(new moneypunct_byname<char, false>(name_));
254         install(new moneypunct_byname<char, true>(name_));
255         install(new moneypunct_byname<wchar_t, false>(name_));
256         install(new moneypunct_byname<wchar_t, true>(name_));
257         install(new time_get_byname<char>(name_));
258         install(new time_get_byname<wchar_t>(name_));
259         install(new time_put_byname<char>(name_));
260         install(new time_put_byname<wchar_t>(name_));
261         install(new messages_byname<char>(name_));
262         install(new messages_byname<wchar_t>(name_));
263 #ifndef _LIBCPP_NO_EXCEPTIONS
264     }
265     catch (...)
266     {
267         for (unsigned i = 0; i < facets_.size(); ++i)
268             if (facets_[i])
269                 facets_[i]->__release_shared();
270         throw;
271     }
272 #endif  // _LIBCPP_NO_EXCEPTIONS
273 }
274 
275 // NOTE avoid the `base class should be explicitly initialized in the
276 // copy constructor` warning emitted by GCC
277 #if defined(__clang__) || _GNUC_VER >= 406
278 #pragma GCC diagnostic push
279 #pragma GCC diagnostic ignored "-Wextra"
280 #endif
281 
__imp(const __imp & other)282 locale::__imp::__imp(const __imp& other)
283     : facets_(max<size_t>(N, other.facets_.size())),
284       name_(other.name_)
285 {
286     facets_ = other.facets_;
287     for (unsigned i = 0; i < facets_.size(); ++i)
288         if (facets_[i])
289             facets_[i]->__add_shared();
290 }
291 
292 #if defined(__clang__) || _GNUC_VER >= 406
293 #pragma GCC diagnostic pop
294 #endif
295 
__imp(const __imp & other,const string & name,locale::category c)296 locale::__imp::__imp(const __imp& other, const string& name, locale::category c)
297     : facets_(N),
298       name_("*")
299 {
300     facets_ = other.facets_;
301     for (unsigned i = 0; i < facets_.size(); ++i)
302         if (facets_[i])
303             facets_[i]->__add_shared();
304 #ifndef _LIBCPP_NO_EXCEPTIONS
305     try
306     {
307 #endif  // _LIBCPP_NO_EXCEPTIONS
308         if (c & locale::collate)
309         {
310             install(new collate_byname<char>(name));
311             install(new collate_byname<wchar_t>(name));
312         }
313         if (c & locale::ctype)
314         {
315             install(new ctype_byname<char>(name));
316             install(new ctype_byname<wchar_t>(name));
317             install(new codecvt_byname<char, char, mbstate_t>(name));
318             install(new codecvt_byname<wchar_t, char, mbstate_t>(name));
319             install(new codecvt_byname<char16_t, char, mbstate_t>(name));
320             install(new codecvt_byname<char32_t, char, mbstate_t>(name));
321         }
322         if (c & locale::monetary)
323         {
324             install(new moneypunct_byname<char, false>(name));
325             install(new moneypunct_byname<char, true>(name));
326             install(new moneypunct_byname<wchar_t, false>(name));
327             install(new moneypunct_byname<wchar_t, true>(name));
328         }
329         if (c & locale::numeric)
330         {
331             install(new numpunct_byname<char>(name));
332             install(new numpunct_byname<wchar_t>(name));
333         }
334         if (c & locale::time)
335         {
336             install(new time_get_byname<char>(name));
337             install(new time_get_byname<wchar_t>(name));
338             install(new time_put_byname<char>(name));
339             install(new time_put_byname<wchar_t>(name));
340         }
341         if (c & locale::messages)
342         {
343             install(new messages_byname<char>(name));
344             install(new messages_byname<wchar_t>(name));
345         }
346 #ifndef _LIBCPP_NO_EXCEPTIONS
347     }
348     catch (...)
349     {
350         for (unsigned i = 0; i < facets_.size(); ++i)
351             if (facets_[i])
352                 facets_[i]->__release_shared();
353         throw;
354     }
355 #endif  // _LIBCPP_NO_EXCEPTIONS
356 }
357 
358 template<class F>
359 inline
360 void
install_from(const locale::__imp & one)361 locale::__imp::install_from(const locale::__imp& one)
362 {
363     long id = F::id.__get();
364     install(const_cast<F*>(static_cast<const F*>(one.use_facet(id))), id);
365 }
366 
__imp(const __imp & other,const __imp & one,locale::category c)367 locale::__imp::__imp(const __imp& other, const __imp& one, locale::category c)
368     : facets_(N),
369       name_("*")
370 {
371     facets_ = other.facets_;
372     for (unsigned i = 0; i < facets_.size(); ++i)
373         if (facets_[i])
374             facets_[i]->__add_shared();
375 #ifndef _LIBCPP_NO_EXCEPTIONS
376     try
377     {
378 #endif  // _LIBCPP_NO_EXCEPTIONS
379         if (c & locale::collate)
380         {
381             install_from<_VSTD::collate<char> >(one);
382             install_from<_VSTD::collate<wchar_t> >(one);
383         }
384         if (c & locale::ctype)
385         {
386             install_from<_VSTD::ctype<char> >(one);
387             install_from<_VSTD::ctype<wchar_t> >(one);
388             install_from<_VSTD::codecvt<char, char, mbstate_t> >(one);
389             install_from<_VSTD::codecvt<char16_t, char, mbstate_t> >(one);
390             install_from<_VSTD::codecvt<char32_t, char, mbstate_t> >(one);
391             install_from<_VSTD::codecvt<wchar_t, char, mbstate_t> >(one);
392         }
393         if (c & locale::monetary)
394         {
395             install_from<moneypunct<char, false> >(one);
396             install_from<moneypunct<char, true> >(one);
397             install_from<moneypunct<wchar_t, false> >(one);
398             install_from<moneypunct<wchar_t, true> >(one);
399             install_from<money_get<char> >(one);
400             install_from<money_get<wchar_t> >(one);
401             install_from<money_put<char> >(one);
402             install_from<money_put<wchar_t> >(one);
403         }
404         if (c & locale::numeric)
405         {
406             install_from<numpunct<char> >(one);
407             install_from<numpunct<wchar_t> >(one);
408             install_from<num_get<char> >(one);
409             install_from<num_get<wchar_t> >(one);
410             install_from<num_put<char> >(one);
411             install_from<num_put<wchar_t> >(one);
412         }
413         if (c & locale::time)
414         {
415             install_from<time_get<char> >(one);
416             install_from<time_get<wchar_t> >(one);
417             install_from<time_put<char> >(one);
418             install_from<time_put<wchar_t> >(one);
419         }
420         if (c & locale::messages)
421         {
422             install_from<_VSTD::messages<char> >(one);
423             install_from<_VSTD::messages<wchar_t> >(one);
424         }
425 #ifndef _LIBCPP_NO_EXCEPTIONS
426     }
427     catch (...)
428     {
429         for (unsigned i = 0; i < facets_.size(); ++i)
430             if (facets_[i])
431                 facets_[i]->__release_shared();
432         throw;
433     }
434 #endif  // _LIBCPP_NO_EXCEPTIONS
435 }
436 
__imp(const __imp & other,facet * f,long id)437 locale::__imp::__imp(const __imp& other, facet* f, long id)
438     : facets_(max<size_t>(N, other.facets_.size()+1)),
439       name_("*")
440 {
441     f->__add_shared();
442     unique_ptr<facet, release> hold(f);
443     facets_ = other.facets_;
444     for (unsigned i = 0; i < other.facets_.size(); ++i)
445         if (facets_[i])
446             facets_[i]->__add_shared();
447     install(hold.get(), id);
448 }
449 
~__imp()450 locale::__imp::~__imp()
451 {
452     for (unsigned i = 0; i < facets_.size(); ++i)
453         if (facets_[i])
454             facets_[i]->__release_shared();
455 }
456 
457 void
install(facet * f,long id)458 locale::__imp::install(facet* f, long id)
459 {
460     f->__add_shared();
461     unique_ptr<facet, release> hold(f);
462     if (static_cast<size_t>(id) >= facets_.size())
463         facets_.resize(static_cast<size_t>(id+1));
464     if (facets_[static_cast<size_t>(id)])
465         facets_[static_cast<size_t>(id)]->__release_shared();
466     facets_[static_cast<size_t>(id)] = hold.release();
467 }
468 
469 const locale::facet*
use_facet(long id) const470 locale::__imp::use_facet(long id) const
471 {
472 #ifndef _LIBCPP_NO_EXCEPTIONS
473     if (!has_facet(id))
474         throw bad_cast();
475 #endif  // _LIBCPP_NO_EXCEPTIONS
476     return facets_[static_cast<size_t>(id)];
477 }
478 
479 // locale
480 
481 const locale&
make_classic()482 locale::__imp::make_classic()
483 {
484     // only one thread can get in here and it only gets in once
485     static aligned_storage<sizeof(locale)>::type buf;
486     locale* c = reinterpret_cast<locale*>(&buf);
487     c->__locale_ = &make<__imp>(1u);
488     return *c;
489 }
490 
491 const locale&
classic()492 locale::classic()
493 {
494     static const locale& c = __imp::make_classic();
495     return c;
496 }
497 
498 locale&
make_global()499 locale::__imp::make_global()
500 {
501     // only one thread can get in here and it only gets in once
502     static aligned_storage<sizeof(locale)>::type buf;
503     auto *obj = ::new (&buf) locale(locale::classic());
504     return *obj;
505 }
506 
507 locale&
__global()508 locale::__global()
509 {
510     static locale& g = __imp::make_global();
511     return g;
512 }
513 
locale()514 locale::locale()  _NOEXCEPT
515     : __locale_(__global().__locale_)
516 {
517     __locale_->__add_shared();
518 }
519 
locale(const locale & l)520 locale::locale(const locale& l)  _NOEXCEPT
521     : __locale_(l.__locale_)
522 {
523     __locale_->__add_shared();
524 }
525 
~locale()526 locale::~locale()
527 {
528     __locale_->__release_shared();
529 }
530 
531 const locale&
operator =(const locale & other)532 locale::operator=(const locale& other)  _NOEXCEPT
533 {
534     other.__locale_->__add_shared();
535     __locale_->__release_shared();
536     __locale_ = other.__locale_;
537     return *this;
538 }
539 
locale(const char * name)540 locale::locale(const char* name)
541 #ifndef _LIBCPP_NO_EXCEPTIONS
542     : __locale_(name ? new __imp(name)
543                      : throw runtime_error("locale constructed with null"))
544 #else  // _LIBCPP_NO_EXCEPTIONS
545     : __locale_(new __imp(name))
546 #endif
547 {
548     __locale_->__add_shared();
549 }
550 
locale(const string & name)551 locale::locale(const string& name)
552     : __locale_(new __imp(name))
553 {
554     __locale_->__add_shared();
555 }
556 
locale(const locale & other,const char * name,category c)557 locale::locale(const locale& other, const char* name, category c)
558 #ifndef _LIBCPP_NO_EXCEPTIONS
559     : __locale_(name ? new __imp(*other.__locale_, name, c)
560                      : throw runtime_error("locale constructed with null"))
561 #else  // _LIBCPP_NO_EXCEPTIONS
562     : __locale_(new __imp(*other.__locale_, name, c))
563 #endif
564 {
565     __locale_->__add_shared();
566 }
567 
locale(const locale & other,const string & name,category c)568 locale::locale(const locale& other, const string& name, category c)
569     : __locale_(new __imp(*other.__locale_, name, c))
570 {
571     __locale_->__add_shared();
572 }
573 
locale(const locale & other,const locale & one,category c)574 locale::locale(const locale& other, const locale& one, category c)
575     : __locale_(new __imp(*other.__locale_, *one.__locale_, c))
576 {
577     __locale_->__add_shared();
578 }
579 
580 string
name() const581 locale::name() const
582 {
583     return __locale_->name();
584 }
585 
586 void
__install_ctor(const locale & other,facet * f,long id)587 locale::__install_ctor(const locale& other, facet* f, long id)
588 {
589     if (f)
590         __locale_ = new __imp(*other.__locale_, f, id);
591     else
592         __locale_ = other.__locale_;
593     __locale_->__add_shared();
594 }
595 
596 locale
global(const locale & loc)597 locale::global(const locale& loc)
598 {
599     locale& g = __global();
600     locale r = g;
601     g = loc;
602     if (g.name() != "*")
603         setlocale(LC_ALL, g.name().c_str());
604     return r;
605 }
606 
607 bool
has_facet(id & x) const608 locale::has_facet(id& x) const
609 {
610     return __locale_->has_facet(x.__get());
611 }
612 
613 const locale::facet*
use_facet(id & x) const614 locale::use_facet(id& x) const
615 {
616     return __locale_->use_facet(x.__get());
617 }
618 
619 bool
operator ==(const locale & y) const620 locale::operator==(const locale& y) const
621 {
622     return (__locale_ == y.__locale_)
623         || (__locale_->name() != "*" && __locale_->name() == y.__locale_->name());
624 }
625 
626 // locale::facet
627 
~facet()628 locale::facet::~facet()
629 {
630 }
631 
632 void
__on_zero_shared()633 locale::facet::__on_zero_shared() _NOEXCEPT
634 {
635     delete this;
636 }
637 
638 // locale::id
639 
640 int32_t locale::id::__next_id = 0;
641 
642 namespace
643 {
644 
645 class __fake_bind
646 {
647     locale::id* id_;
648     void (locale::id::* pmf_)();
649 public:
__fake_bind(void (locale::id::* pmf)(),locale::id * id)650     __fake_bind(void (locale::id::* pmf)(), locale::id* id)
651         : id_(id), pmf_(pmf) {}
652 
operator ()() const653     void operator()() const
654     {
655         (id_->*pmf_)();
656     }
657 };
658 
659 }
660 
661 long
__get()662 locale::id::__get()
663 {
664     call_once(__flag_, __fake_bind(&locale::id::__init, this));
665     return __id_ - 1;
666 }
667 
668 void
__init()669 locale::id::__init()
670 {
671     __id_ = __libcpp_atomic_add(&__next_id, 1);
672 }
673 
674 // template <> class collate_byname<char>
675 
collate_byname(const char * n,size_t refs)676 collate_byname<char>::collate_byname(const char* n, size_t refs)
677     : collate<char>(refs),
678       __l(newlocale(LC_ALL_MASK, n, 0))
679 {
680     if (__l == 0)
681         __throw_runtime_error("collate_byname<char>::collate_byname"
682                             " failed to construct for " + string(n));
683 }
684 
collate_byname(const string & name,size_t refs)685 collate_byname<char>::collate_byname(const string& name, size_t refs)
686     : collate<char>(refs),
687       __l(newlocale(LC_ALL_MASK, name.c_str(), 0))
688 {
689     if (__l == 0)
690         __throw_runtime_error("collate_byname<char>::collate_byname"
691                             " failed to construct for " + name);
692 }
693 
~collate_byname()694 collate_byname<char>::~collate_byname()
695 {
696     freelocale(__l);
697 }
698 
699 int
do_compare(const char_type * __lo1,const char_type * __hi1,const char_type * __lo2,const char_type * __hi2) const700 collate_byname<char>::do_compare(const char_type* __lo1, const char_type* __hi1,
701                                  const char_type* __lo2, const char_type* __hi2) const
702 {
703     string_type lhs(__lo1, __hi1);
704     string_type rhs(__lo2, __hi2);
705     int r = strcoll_l(lhs.c_str(), rhs.c_str(), __l);
706     if (r < 0)
707         return -1;
708     if (r > 0)
709         return 1;
710     return r;
711 }
712 
713 collate_byname<char>::string_type
do_transform(const char_type * lo,const char_type * hi) const714 collate_byname<char>::do_transform(const char_type* lo, const char_type* hi) const
715 {
716     const string_type in(lo, hi);
717     string_type out(strxfrm_l(0, in.c_str(), 0, __l), char());
718     strxfrm_l(const_cast<char*>(out.c_str()), in.c_str(), out.size()+1, __l);
719     return out;
720 }
721 
722 // template <> class collate_byname<wchar_t>
723 
collate_byname(const char * n,size_t refs)724 collate_byname<wchar_t>::collate_byname(const char* n, size_t refs)
725     : collate<wchar_t>(refs),
726       __l(newlocale(LC_ALL_MASK, n, 0))
727 {
728     if (__l == 0)
729         __throw_runtime_error("collate_byname<wchar_t>::collate_byname(size_t refs)"
730                             " failed to construct for " + string(n));
731 }
732 
collate_byname(const string & name,size_t refs)733 collate_byname<wchar_t>::collate_byname(const string& name, size_t refs)
734     : collate<wchar_t>(refs),
735       __l(newlocale(LC_ALL_MASK, name.c_str(), 0))
736 {
737     if (__l == 0)
738         __throw_runtime_error("collate_byname<wchar_t>::collate_byname(size_t refs)"
739                             " failed to construct for " + name);
740 }
741 
~collate_byname()742 collate_byname<wchar_t>::~collate_byname()
743 {
744     freelocale(__l);
745 }
746 
747 int
do_compare(const char_type * __lo1,const char_type * __hi1,const char_type * __lo2,const char_type * __hi2) const748 collate_byname<wchar_t>::do_compare(const char_type* __lo1, const char_type* __hi1,
749                                  const char_type* __lo2, const char_type* __hi2) const
750 {
751     string_type lhs(__lo1, __hi1);
752     string_type rhs(__lo2, __hi2);
753     int r = wcscoll_l(lhs.c_str(), rhs.c_str(), __l);
754     if (r < 0)
755         return -1;
756     if (r > 0)
757         return 1;
758     return r;
759 }
760 
761 collate_byname<wchar_t>::string_type
do_transform(const char_type * lo,const char_type * hi) const762 collate_byname<wchar_t>::do_transform(const char_type* lo, const char_type* hi) const
763 {
764     const string_type in(lo, hi);
765     string_type out(wcsxfrm_l(0, in.c_str(), 0, __l), wchar_t());
766     wcsxfrm_l(const_cast<wchar_t*>(out.c_str()), in.c_str(), out.size()+1, __l);
767     return out;
768 }
769 
770 // template <> class ctype<wchar_t>;
771 
772 const ctype_base::mask ctype_base::space;
773 const ctype_base::mask ctype_base::print;
774 const ctype_base::mask ctype_base::cntrl;
775 const ctype_base::mask ctype_base::upper;
776 const ctype_base::mask ctype_base::lower;
777 const ctype_base::mask ctype_base::alpha;
778 const ctype_base::mask ctype_base::digit;
779 const ctype_base::mask ctype_base::punct;
780 const ctype_base::mask ctype_base::xdigit;
781 const ctype_base::mask ctype_base::blank;
782 const ctype_base::mask ctype_base::alnum;
783 const ctype_base::mask ctype_base::graph;
784 
785 locale::id ctype<wchar_t>::id;
786 
~ctype()787 ctype<wchar_t>::~ctype()
788 {
789 }
790 
791 bool
do_is(mask m,char_type c) const792 ctype<wchar_t>::do_is(mask m, char_type c) const
793 {
794     return isascii(c) ? (ctype<char>::classic_table()[c] & m) != 0 : false;
795 }
796 
797 const wchar_t*
do_is(const char_type * low,const char_type * high,mask * vec) const798 ctype<wchar_t>::do_is(const char_type* low, const char_type* high, mask* vec) const
799 {
800     for (; low != high; ++low, ++vec)
801         *vec = static_cast<mask>(isascii(*low) ?
802                                    ctype<char>::classic_table()[*low] : 0);
803     return low;
804 }
805 
806 const wchar_t*
do_scan_is(mask m,const char_type * low,const char_type * high) const807 ctype<wchar_t>::do_scan_is(mask m, const char_type* low, const char_type* high) const
808 {
809     for (; low != high; ++low)
810         if (isascii(*low) && (ctype<char>::classic_table()[*low] & m))
811             break;
812     return low;
813 }
814 
815 const wchar_t*
do_scan_not(mask m,const char_type * low,const char_type * high) const816 ctype<wchar_t>::do_scan_not(mask m, const char_type* low, const char_type* high) const
817 {
818     for (; low != high; ++low)
819         if (!(isascii(*low) && (ctype<char>::classic_table()[*low] & m)))
820             break;
821     return low;
822 }
823 
824 wchar_t
do_toupper(char_type c) const825 ctype<wchar_t>::do_toupper(char_type c) const
826 {
827 #ifdef _LIBCPP_HAS_DEFAULTRUNELOCALE
828     return isascii(c) ? _DefaultRuneLocale.__mapupper[c] : c;
829 #elif defined(__GLIBC__) || defined(__EMSCRIPTEN__) || \
830       defined(__NetBSD__)
831     return isascii(c) ? ctype<char>::__classic_upper_table()[c] : c;
832 #else
833     return (isascii(c) && iswlower_l(c, _LIBCPP_GET_C_LOCALE)) ? c-L'a'+L'A' : c;
834 #endif
835 }
836 
837 const wchar_t*
do_toupper(char_type * low,const char_type * high) const838 ctype<wchar_t>::do_toupper(char_type* low, const char_type* high) const
839 {
840     for (; low != high; ++low)
841 #ifdef _LIBCPP_HAS_DEFAULTRUNELOCALE
842         *low = isascii(*low) ? _DefaultRuneLocale.__mapupper[*low] : *low;
843 #elif defined(__GLIBC__) || defined(__EMSCRIPTEN__) || \
844       defined(__NetBSD__)
845         *low = isascii(*low) ? ctype<char>::__classic_upper_table()[*low]
846                              : *low;
847 #else
848         *low = (isascii(*low) && islower_l(*low, _LIBCPP_GET_C_LOCALE)) ? (*low-L'a'+L'A') : *low;
849 #endif
850     return low;
851 }
852 
853 wchar_t
do_tolower(char_type c) const854 ctype<wchar_t>::do_tolower(char_type c) const
855 {
856 #ifdef _LIBCPP_HAS_DEFAULTRUNELOCALE
857     return isascii(c) ? _DefaultRuneLocale.__maplower[c] : c;
858 #elif defined(__GLIBC__) || defined(__EMSCRIPTEN__) || \
859       defined(__NetBSD__)
860     return isascii(c) ? ctype<char>::__classic_lower_table()[c] : c;
861 #else
862     return (isascii(c) && isupper_l(c, _LIBCPP_GET_C_LOCALE)) ? c-L'A'+'a' : c;
863 #endif
864 }
865 
866 const wchar_t*
do_tolower(char_type * low,const char_type * high) const867 ctype<wchar_t>::do_tolower(char_type* low, const char_type* high) const
868 {
869     for (; low != high; ++low)
870 #ifdef _LIBCPP_HAS_DEFAULTRUNELOCALE
871         *low = isascii(*low) ? _DefaultRuneLocale.__maplower[*low] : *low;
872 #elif defined(__GLIBC__) || defined(__EMSCRIPTEN__) || \
873       defined(__NetBSD__)
874         *low = isascii(*low) ? ctype<char>::__classic_lower_table()[*low]
875                              : *low;
876 #else
877         *low = (isascii(*low) && isupper_l(*low, _LIBCPP_GET_C_LOCALE)) ? *low-L'A'+L'a' : *low;
878 #endif
879     return low;
880 }
881 
882 wchar_t
do_widen(char c) const883 ctype<wchar_t>::do_widen(char c) const
884 {
885     return c;
886 }
887 
888 const char*
do_widen(const char * low,const char * high,char_type * dest) const889 ctype<wchar_t>::do_widen(const char* low, const char* high, char_type* dest) const
890 {
891     for (; low != high; ++low, ++dest)
892         *dest = *low;
893     return low;
894 }
895 
896 char
do_narrow(char_type c,char dfault) const897 ctype<wchar_t>::do_narrow(char_type c, char dfault) const
898 {
899     if (isascii(c))
900         return static_cast<char>(c);
901     return dfault;
902 }
903 
904 const wchar_t*
do_narrow(const char_type * low,const char_type * high,char dfault,char * dest) const905 ctype<wchar_t>::do_narrow(const char_type* low, const char_type* high, char dfault, char* dest) const
906 {
907     for (; low != high; ++low, ++dest)
908         if (isascii(*low))
909             *dest = static_cast<char>(*low);
910         else
911             *dest = dfault;
912     return low;
913 }
914 
915 // template <> class ctype<char>;
916 
917 locale::id ctype<char>::id;
918 
ctype(const mask * tab,bool del,size_t refs)919 ctype<char>::ctype(const mask* tab, bool del, size_t refs)
920     : locale::facet(refs),
921       __tab_(tab),
922       __del_(del)
923 {
924   if (__tab_ == 0)
925       __tab_ = classic_table();
926 }
927 
~ctype()928 ctype<char>::~ctype()
929 {
930     if (__tab_ && __del_)
931         delete [] __tab_;
932 }
933 
934 char
do_toupper(char_type c) const935 ctype<char>::do_toupper(char_type c) const
936 {
937 #ifdef _LIBCPP_HAS_DEFAULTRUNELOCALE
938     return isascii(c) ?
939       static_cast<char>(_DefaultRuneLocale.__mapupper[static_cast<ptrdiff_t>(c)]) : c;
940 #elif defined(__NetBSD__)
941     return static_cast<char>(__classic_upper_table()[static_cast<unsigned char>(c)]);
942 #elif defined(__GLIBC__) || defined(__EMSCRIPTEN__)
943     return isascii(c) ?
944       static_cast<char>(__classic_upper_table()[static_cast<unsigned char>(c)]) : c;
945 #else
946     return (isascii(c) && islower_l(c, _LIBCPP_GET_C_LOCALE)) ? c-'a'+'A' : c;
947 #endif
948 }
949 
950 const char*
do_toupper(char_type * low,const char_type * high) const951 ctype<char>::do_toupper(char_type* low, const char_type* high) const
952 {
953     for (; low != high; ++low)
954 #ifdef _LIBCPP_HAS_DEFAULTRUNELOCALE
955         *low = isascii(*low) ?
956           static_cast<char>(_DefaultRuneLocale.__mapupper[static_cast<ptrdiff_t>(*low)]) : *low;
957 #elif defined(__NetBSD__)
958         *low = static_cast<char>(__classic_upper_table()[static_cast<unsigned char>(*low)]);
959 #elif defined(__GLIBC__) || defined(__EMSCRIPTEN__)
960         *low = isascii(*low) ?
961           static_cast<char>(__classic_upper_table()[static_cast<size_t>(*low)]) : *low;
962 #else
963         *low = (isascii(*low) && islower_l(*low, _LIBCPP_GET_C_LOCALE)) ? *low-'a'+'A' : *low;
964 #endif
965     return low;
966 }
967 
968 char
do_tolower(char_type c) const969 ctype<char>::do_tolower(char_type c) const
970 {
971 #ifdef _LIBCPP_HAS_DEFAULTRUNELOCALE
972     return isascii(c) ?
973       static_cast<char>(_DefaultRuneLocale.__maplower[static_cast<ptrdiff_t>(c)]) : c;
974 #elif defined(__NetBSD__)
975     return static_cast<char>(__classic_lower_table()[static_cast<unsigned char>(c)]);
976 #elif defined(__GLIBC__) || defined(__EMSCRIPTEN__)
977     return isascii(c) ?
978       static_cast<char>(__classic_lower_table()[static_cast<size_t>(c)]) : c;
979 #else
980     return (isascii(c) && isupper_l(c, _LIBCPP_GET_C_LOCALE)) ? c-'A'+'a' : c;
981 #endif
982 }
983 
984 const char*
do_tolower(char_type * low,const char_type * high) const985 ctype<char>::do_tolower(char_type* low, const char_type* high) const
986 {
987     for (; low != high; ++low)
988 #ifdef _LIBCPP_HAS_DEFAULTRUNELOCALE
989         *low = isascii(*low) ? static_cast<char>(_DefaultRuneLocale.__maplower[static_cast<ptrdiff_t>(*low)]) : *low;
990 #elif defined(__NetBSD__)
991         *low = static_cast<char>(__classic_lower_table()[static_cast<unsigned char>(*low)]);
992 #elif defined(__GLIBC__) || defined(__EMSCRIPTEN__)
993         *low = isascii(*low) ? static_cast<char>(__classic_lower_table()[static_cast<size_t>(*low)]) : *low;
994 #else
995         *low = (isascii(*low) && isupper_l(*low, _LIBCPP_GET_C_LOCALE)) ? *low-'A'+'a' : *low;
996 #endif
997     return low;
998 }
999 
1000 char
do_widen(char c) const1001 ctype<char>::do_widen(char c) const
1002 {
1003     return c;
1004 }
1005 
1006 const char*
do_widen(const char * low,const char * high,char_type * dest) const1007 ctype<char>::do_widen(const char* low, const char* high, char_type* dest) const
1008 {
1009     for (; low != high; ++low, ++dest)
1010         *dest = *low;
1011     return low;
1012 }
1013 
1014 char
do_narrow(char_type c,char dfault) const1015 ctype<char>::do_narrow(char_type c, char dfault) const
1016 {
1017     if (isascii(c))
1018         return static_cast<char>(c);
1019     return dfault;
1020 }
1021 
1022 const char*
do_narrow(const char_type * low,const char_type * high,char dfault,char * dest) const1023 ctype<char>::do_narrow(const char_type* low, const char_type* high, char dfault, char* dest) const
1024 {
1025     for (; low != high; ++low, ++dest)
1026         if (isascii(*low))
1027             *dest = *low;
1028         else
1029             *dest = dfault;
1030     return low;
1031 }
1032 
1033 #if defined(__EMSCRIPTEN__)
1034 extern "C" const unsigned short ** __ctype_b_loc();
1035 extern "C" const int ** __ctype_tolower_loc();
1036 extern "C" const int ** __ctype_toupper_loc();
1037 #endif
1038 
1039 #ifdef _LIBCPP_PROVIDES_DEFAULT_RUNE_TABLE
1040 const ctype<char>::mask*
classic_table()1041 ctype<char>::classic_table()  _NOEXCEPT
1042 {
1043     static _LIBCPP_CONSTEXPR const ctype<char>::mask builtin_table[table_size] = {
1044         cntrl,                          cntrl,
1045         cntrl,                          cntrl,
1046         cntrl,                          cntrl,
1047         cntrl,                          cntrl,
1048         cntrl,                          cntrl | space | blank,
1049         cntrl | space,                  cntrl | space,
1050         cntrl | space,                  cntrl | space,
1051         cntrl,                          cntrl,
1052         cntrl,                          cntrl,
1053         cntrl,                          cntrl,
1054         cntrl,                          cntrl,
1055         cntrl,                          cntrl,
1056         cntrl,                          cntrl,
1057         cntrl,                          cntrl,
1058         cntrl,                          cntrl,
1059         cntrl,                          cntrl,
1060         space | blank | print,          punct | print,
1061         punct | print,                  punct | print,
1062         punct | print,                  punct | print,
1063         punct | print,                  punct | print,
1064         punct | print,                  punct | print,
1065         punct | print,                  punct | print,
1066         punct | print,                  punct | print,
1067         punct | print,                  punct | print,
1068         digit | print | xdigit,         digit | print | xdigit,
1069         digit | print | xdigit,         digit | print | xdigit,
1070         digit | print | xdigit,         digit | print | xdigit,
1071         digit | print | xdigit,         digit | print | xdigit,
1072         digit | print | xdigit,         digit | print | xdigit,
1073         punct | print,                  punct | print,
1074         punct | print,                  punct | print,
1075         punct | print,                  punct | print,
1076         punct | print,                  upper | xdigit | print | alpha,
1077         upper | xdigit | print | alpha, upper | xdigit | print | alpha,
1078         upper | xdigit | print | alpha, upper | xdigit | print | alpha,
1079         upper | xdigit | print | alpha, upper | print | alpha,
1080         upper | print | alpha,          upper | print | alpha,
1081         upper | print | alpha,          upper | print | alpha,
1082         upper | print | alpha,          upper | print | alpha,
1083         upper | print | alpha,          upper | print | alpha,
1084         upper | print | alpha,          upper | print | alpha,
1085         upper | print | alpha,          upper | print | alpha,
1086         upper | print | alpha,          upper | print | alpha,
1087         upper | print | alpha,          upper | print | alpha,
1088         upper | print | alpha,          upper | print | alpha,
1089         upper | print | alpha,          punct | print,
1090         punct | print,                  punct | print,
1091         punct | print,                  punct | print,
1092         punct | print,                  lower | xdigit | print | alpha,
1093         lower | xdigit | print | alpha, lower | xdigit | print | alpha,
1094         lower | xdigit | print | alpha, lower | xdigit | print | alpha,
1095         lower | xdigit | print | alpha, lower | print | alpha,
1096         lower | print | alpha,          lower | print | alpha,
1097         lower | print | alpha,          lower | print | alpha,
1098         lower | print | alpha,          lower | print | alpha,
1099         lower | print | alpha,          lower | print | alpha,
1100         lower | print | alpha,          lower | print | alpha,
1101         lower | print | alpha,          lower | print | alpha,
1102         lower | print | alpha,          lower | print | alpha,
1103         lower | print | alpha,          lower | print | alpha,
1104         lower | print | alpha,          lower | print | alpha,
1105         lower | print | alpha,          punct | print,
1106         punct | print,                  punct | print,
1107         punct | print,                  cntrl,
1108         0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
1109         0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
1110         0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
1111         0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
1112         0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
1113         0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
1114         0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
1115         0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0
1116     };
1117     return builtin_table;
1118 }
1119 #else
1120 const ctype<char>::mask*
classic_table()1121 ctype<char>::classic_table()  _NOEXCEPT
1122 {
1123 #if defined(__APPLE__) || defined(__FreeBSD__)
1124     return _DefaultRuneLocale.__runetype;
1125 #elif defined(__NetBSD__)
1126     return _C_ctype_tab_ + 1;
1127 #elif defined(__GLIBC__)
1128     return _LIBCPP_GET_C_LOCALE->__ctype_b;
1129 #elif __sun__
1130     return __ctype_mask;
1131 #elif defined(_LIBCPP_MSVCRT) || defined(__MINGW32__)
1132     return __pctype_func();
1133 #elif defined(__EMSCRIPTEN__)
1134     return *__ctype_b_loc();
1135 #elif defined(_NEWLIB_VERSION)
1136     // Newlib has a 257-entry table in ctype_.c, where (char)0 starts at [1].
1137     return _ctype_ + 1;
1138 #elif defined(_AIX)
1139     return (const unsigned int *)__lc_ctype_ptr->obj->mask;
1140 #else
1141     // Platform not supported: abort so the person doing the port knows what to
1142     // fix
1143 # warning  ctype<char>::classic_table() is not implemented
1144     printf("ctype<char>::classic_table() is not implemented\n");
1145     abort();
1146     return NULL;
1147 #endif
1148 }
1149 #endif
1150 
1151 #if defined(__GLIBC__)
1152 const int*
__classic_lower_table()1153 ctype<char>::__classic_lower_table() _NOEXCEPT
1154 {
1155     return _LIBCPP_GET_C_LOCALE->__ctype_tolower;
1156 }
1157 
1158 const int*
__classic_upper_table()1159 ctype<char>::__classic_upper_table() _NOEXCEPT
1160 {
1161     return _LIBCPP_GET_C_LOCALE->__ctype_toupper;
1162 }
1163 #elif __NetBSD__
1164 const short*
__classic_lower_table()1165 ctype<char>::__classic_lower_table() _NOEXCEPT
1166 {
1167     return _C_tolower_tab_ + 1;
1168 }
1169 
1170 const short*
__classic_upper_table()1171 ctype<char>::__classic_upper_table() _NOEXCEPT
1172 {
1173     return _C_toupper_tab_ + 1;
1174 }
1175 
1176 #elif defined(__EMSCRIPTEN__)
1177 const int*
__classic_lower_table()1178 ctype<char>::__classic_lower_table() _NOEXCEPT
1179 {
1180     return *__ctype_tolower_loc();
1181 }
1182 
1183 const int*
__classic_upper_table()1184 ctype<char>::__classic_upper_table() _NOEXCEPT
1185 {
1186     return *__ctype_toupper_loc();
1187 }
1188 #endif // __GLIBC__ || __NETBSD__ || __EMSCRIPTEN__
1189 
1190 // template <> class ctype_byname<char>
1191 
ctype_byname(const char * name,size_t refs)1192 ctype_byname<char>::ctype_byname(const char* name, size_t refs)
1193     : ctype<char>(0, false, refs),
1194       __l(newlocale(LC_ALL_MASK, name, 0))
1195 {
1196     if (__l == 0)
1197         __throw_runtime_error("ctype_byname<char>::ctype_byname"
1198                             " failed to construct for " + string(name));
1199 }
1200 
ctype_byname(const string & name,size_t refs)1201 ctype_byname<char>::ctype_byname(const string& name, size_t refs)
1202     : ctype<char>(0, false, refs),
1203       __l(newlocale(LC_ALL_MASK, name.c_str(), 0))
1204 {
1205     if (__l == 0)
1206         __throw_runtime_error("ctype_byname<char>::ctype_byname"
1207                             " failed to construct for " + name);
1208 }
1209 
~ctype_byname()1210 ctype_byname<char>::~ctype_byname()
1211 {
1212     freelocale(__l);
1213 }
1214 
1215 char
do_toupper(char_type c) const1216 ctype_byname<char>::do_toupper(char_type c) const
1217 {
1218     return static_cast<char>(toupper_l(static_cast<unsigned char>(c), __l));
1219 }
1220 
1221 const char*
do_toupper(char_type * low,const char_type * high) const1222 ctype_byname<char>::do_toupper(char_type* low, const char_type* high) const
1223 {
1224     for (; low != high; ++low)
1225         *low = static_cast<char>(toupper_l(static_cast<unsigned char>(*low), __l));
1226     return low;
1227 }
1228 
1229 char
do_tolower(char_type c) const1230 ctype_byname<char>::do_tolower(char_type c) const
1231 {
1232     return static_cast<char>(tolower_l(static_cast<unsigned char>(c), __l));
1233 }
1234 
1235 const char*
do_tolower(char_type * low,const char_type * high) const1236 ctype_byname<char>::do_tolower(char_type* low, const char_type* high) const
1237 {
1238     for (; low != high; ++low)
1239         *low = static_cast<char>(tolower_l(static_cast<unsigned char>(*low), __l));
1240     return low;
1241 }
1242 
1243 // template <> class ctype_byname<wchar_t>
1244 
ctype_byname(const char * name,size_t refs)1245 ctype_byname<wchar_t>::ctype_byname(const char* name, size_t refs)
1246     : ctype<wchar_t>(refs),
1247       __l(newlocale(LC_ALL_MASK, name, 0))
1248 {
1249     if (__l == 0)
1250         __throw_runtime_error("ctype_byname<wchar_t>::ctype_byname"
1251                             " failed to construct for " + string(name));
1252 }
1253 
ctype_byname(const string & name,size_t refs)1254 ctype_byname<wchar_t>::ctype_byname(const string& name, size_t refs)
1255     : ctype<wchar_t>(refs),
1256       __l(newlocale(LC_ALL_MASK, name.c_str(), 0))
1257 {
1258     if (__l == 0)
1259         __throw_runtime_error("ctype_byname<wchar_t>::ctype_byname"
1260                             " failed to construct for " + name);
1261 }
1262 
~ctype_byname()1263 ctype_byname<wchar_t>::~ctype_byname()
1264 {
1265     freelocale(__l);
1266 }
1267 
1268 bool
do_is(mask m,char_type c) const1269 ctype_byname<wchar_t>::do_is(mask m, char_type c) const
1270 {
1271 #ifdef _LIBCPP_WCTYPE_IS_MASK
1272     return static_cast<bool>(iswctype_l(c, m, __l));
1273 #else
1274     bool result = false;
1275     wint_t ch = static_cast<wint_t>(c);
1276     if ((m & space) == space) result |= (iswspace_l(ch, __l) != 0);
1277     if ((m & print) == print) result |= (iswprint_l(ch, __l) != 0);
1278     if ((m & cntrl) == cntrl) result |= (iswcntrl_l(ch, __l) != 0);
1279     if ((m & upper) == upper) result |= (iswupper_l(ch, __l) != 0);
1280     if ((m & lower) == lower) result |= (iswlower_l(ch, __l) != 0);
1281     if ((m & alpha) == alpha) result |= (iswalpha_l(ch, __l) != 0);
1282     if ((m & digit) == digit) result |= (iswdigit_l(ch, __l) != 0);
1283     if ((m & punct) == punct) result |= (iswpunct_l(ch, __l) != 0);
1284     if ((m & xdigit) == xdigit) result |= (iswxdigit_l(ch, __l) != 0);
1285     if ((m & blank) == blank) result |= (iswblank_l(ch, __l) != 0);
1286     return result;
1287 #endif
1288 }
1289 
1290 const wchar_t*
do_is(const char_type * low,const char_type * high,mask * vec) const1291 ctype_byname<wchar_t>::do_is(const char_type* low, const char_type* high, mask* vec) const
1292 {
1293     for (; low != high; ++low, ++vec)
1294     {
1295         if (isascii(*low))
1296             *vec = static_cast<mask>(ctype<char>::classic_table()[*low]);
1297         else
1298         {
1299             *vec = 0;
1300             wint_t ch = static_cast<wint_t>(*low);
1301             if (iswspace_l(ch, __l))
1302                 *vec |= space;
1303 #ifndef _LIBCPP_CTYPE_MASK_IS_COMPOSITE_PRINT
1304             if (iswprint_l(ch, __l))
1305                 *vec |= print;
1306 #endif
1307             if (iswcntrl_l(ch, __l))
1308                 *vec |= cntrl;
1309             if (iswupper_l(ch, __l))
1310                 *vec |= upper;
1311             if (iswlower_l(ch, __l))
1312                 *vec |= lower;
1313 #ifndef _LIBCPP_CTYPE_MASK_IS_COMPOSITE_ALPHA
1314             if (iswalpha_l(ch, __l))
1315                 *vec |= alpha;
1316 #endif
1317             if (iswdigit_l(ch, __l))
1318                 *vec |= digit;
1319             if (iswpunct_l(ch, __l))
1320                 *vec |= punct;
1321 #ifndef _LIBCPP_CTYPE_MASK_IS_COMPOSITE_XDIGIT
1322             if (iswxdigit_l(ch, __l))
1323                 *vec |= xdigit;
1324 #endif
1325 #if !defined(__sun__)
1326             if (iswblank_l(ch, __l))
1327                 *vec |= blank;
1328 #endif
1329         }
1330     }
1331     return low;
1332 }
1333 
1334 const wchar_t*
do_scan_is(mask m,const char_type * low,const char_type * high) const1335 ctype_byname<wchar_t>::do_scan_is(mask m, const char_type* low, const char_type* high) const
1336 {
1337     for (; low != high; ++low)
1338     {
1339 #ifdef _LIBCPP_WCTYPE_IS_MASK
1340         if (iswctype_l(*low, m, __l))
1341             break;
1342 #else
1343         wint_t ch = static_cast<wint_t>(*low);
1344         if ((m & space) == space && iswspace_l(ch, __l)) break;
1345         if ((m & print) == print && iswprint_l(ch, __l)) break;
1346         if ((m & cntrl) == cntrl && iswcntrl_l(ch, __l)) break;
1347         if ((m & upper) == upper && iswupper_l(ch, __l)) break;
1348         if ((m & lower) == lower && iswlower_l(ch, __l)) break;
1349         if ((m & alpha) == alpha && iswalpha_l(ch, __l)) break;
1350         if ((m & digit) == digit && iswdigit_l(ch, __l)) break;
1351         if ((m & punct) == punct && iswpunct_l(ch, __l)) break;
1352         if ((m & xdigit) == xdigit && iswxdigit_l(ch, __l)) break;
1353         if ((m & blank) == blank && iswblank_l(ch, __l)) break;
1354 #endif
1355     }
1356     return low;
1357 }
1358 
1359 const wchar_t*
do_scan_not(mask m,const char_type * low,const char_type * high) const1360 ctype_byname<wchar_t>::do_scan_not(mask m, const char_type* low, const char_type* high) const
1361 {
1362     for (; low != high; ++low)
1363     {
1364 #ifdef _LIBCPP_WCTYPE_IS_MASK
1365         if (!iswctype_l(*low, m, __l))
1366             break;
1367 #else
1368         wint_t ch = static_cast<wint_t>(*low);
1369         if ((m & space) == space && iswspace_l(ch, __l)) continue;
1370         if ((m & print) == print && iswprint_l(ch, __l)) continue;
1371         if ((m & cntrl) == cntrl && iswcntrl_l(ch, __l)) continue;
1372         if ((m & upper) == upper && iswupper_l(ch, __l)) continue;
1373         if ((m & lower) == lower && iswlower_l(ch, __l)) continue;
1374         if ((m & alpha) == alpha && iswalpha_l(ch, __l)) continue;
1375         if ((m & digit) == digit && iswdigit_l(ch, __l)) continue;
1376         if ((m & punct) == punct && iswpunct_l(ch, __l)) continue;
1377         if ((m & xdigit) == xdigit && iswxdigit_l(ch, __l)) continue;
1378         if ((m & blank) == blank && iswblank_l(ch, __l)) continue;
1379         break;
1380 #endif
1381     }
1382     return low;
1383 }
1384 
1385 wchar_t
do_toupper(char_type c) const1386 ctype_byname<wchar_t>::do_toupper(char_type c) const
1387 {
1388     return towupper_l(c, __l);
1389 }
1390 
1391 const wchar_t*
do_toupper(char_type * low,const char_type * high) const1392 ctype_byname<wchar_t>::do_toupper(char_type* low, const char_type* high) const
1393 {
1394     for (; low != high; ++low)
1395         *low = towupper_l(*low, __l);
1396     return low;
1397 }
1398 
1399 wchar_t
do_tolower(char_type c) const1400 ctype_byname<wchar_t>::do_tolower(char_type c) const
1401 {
1402     return towlower_l(c, __l);
1403 }
1404 
1405 const wchar_t*
do_tolower(char_type * low,const char_type * high) const1406 ctype_byname<wchar_t>::do_tolower(char_type* low, const char_type* high) const
1407 {
1408     for (; low != high; ++low)
1409         *low = towlower_l(*low, __l);
1410     return low;
1411 }
1412 
1413 wchar_t
do_widen(char c) const1414 ctype_byname<wchar_t>::do_widen(char c) const
1415 {
1416     return __libcpp_btowc_l(c, __l);
1417 }
1418 
1419 const char*
do_widen(const char * low,const char * high,char_type * dest) const1420 ctype_byname<wchar_t>::do_widen(const char* low, const char* high, char_type* dest) const
1421 {
1422     for (; low != high; ++low, ++dest)
1423         *dest = __libcpp_btowc_l(*low, __l);
1424     return low;
1425 }
1426 
1427 char
do_narrow(char_type c,char dfault) const1428 ctype_byname<wchar_t>::do_narrow(char_type c, char dfault) const
1429 {
1430     int r = __libcpp_wctob_l(c, __l);
1431     return r != static_cast<int>(WEOF) ? static_cast<char>(r) : dfault;
1432 }
1433 
1434 const wchar_t*
do_narrow(const char_type * low,const char_type * high,char dfault,char * dest) const1435 ctype_byname<wchar_t>::do_narrow(const char_type* low, const char_type* high, char dfault, char* dest) const
1436 {
1437     for (; low != high; ++low, ++dest)
1438     {
1439         int r = __libcpp_wctob_l(*low, __l);
1440         *dest = r != static_cast<int>(WEOF) ? static_cast<char>(r) : dfault;
1441     }
1442     return low;
1443 }
1444 
1445 // template <> class codecvt<char, char, mbstate_t>
1446 
1447 locale::id codecvt<char, char, mbstate_t>::id;
1448 
~codecvt()1449 codecvt<char, char, mbstate_t>::~codecvt()
1450 {
1451 }
1452 
1453 codecvt<char, char, mbstate_t>::result
do_out(state_type &,const intern_type * frm,const intern_type *,const intern_type * & frm_nxt,extern_type * to,extern_type *,extern_type * & to_nxt) const1454 codecvt<char, char, mbstate_t>::do_out(state_type&,
1455     const intern_type* frm, const intern_type*, const intern_type*& frm_nxt,
1456     extern_type* to, extern_type*, extern_type*& to_nxt) const
1457 {
1458     frm_nxt = frm;
1459     to_nxt = to;
1460     return noconv;
1461 }
1462 
1463 codecvt<char, char, mbstate_t>::result
do_in(state_type &,const extern_type * frm,const extern_type *,const extern_type * & frm_nxt,intern_type * to,intern_type *,intern_type * & to_nxt) const1464 codecvt<char, char, mbstate_t>::do_in(state_type&,
1465     const extern_type* frm, const extern_type*, const extern_type*& frm_nxt,
1466     intern_type* to, intern_type*, intern_type*& to_nxt) const
1467 {
1468     frm_nxt = frm;
1469     to_nxt = to;
1470     return noconv;
1471 }
1472 
1473 codecvt<char, char, mbstate_t>::result
do_unshift(state_type &,extern_type * to,extern_type *,extern_type * & to_nxt) const1474 codecvt<char, char, mbstate_t>::do_unshift(state_type&,
1475     extern_type* to, extern_type*, extern_type*& to_nxt) const
1476 {
1477     to_nxt = to;
1478     return noconv;
1479 }
1480 
1481 int
do_encoding() const1482 codecvt<char, char, mbstate_t>::do_encoding() const  _NOEXCEPT
1483 {
1484     return 1;
1485 }
1486 
1487 bool
do_always_noconv() const1488 codecvt<char, char, mbstate_t>::do_always_noconv() const  _NOEXCEPT
1489 {
1490     return true;
1491 }
1492 
1493 int
do_length(state_type &,const extern_type * frm,const extern_type * end,size_t mx) const1494 codecvt<char, char, mbstate_t>::do_length(state_type&,
1495     const extern_type* frm, const extern_type* end, size_t mx) const
1496 {
1497     return static_cast<int>(min<size_t>(mx, static_cast<size_t>(end-frm)));
1498 }
1499 
1500 int
do_max_length() const1501 codecvt<char, char, mbstate_t>::do_max_length() const  _NOEXCEPT
1502 {
1503     return 1;
1504 }
1505 
1506 // template <> class codecvt<wchar_t, char, mbstate_t>
1507 
1508 locale::id codecvt<wchar_t, char, mbstate_t>::id;
1509 
codecvt(size_t refs)1510 codecvt<wchar_t, char, mbstate_t>::codecvt(size_t refs)
1511     : locale::facet(refs),
1512       __l(_LIBCPP_GET_C_LOCALE)
1513 {
1514 }
1515 
codecvt(const char * nm,size_t refs)1516 codecvt<wchar_t, char, mbstate_t>::codecvt(const char* nm, size_t refs)
1517     : locale::facet(refs),
1518       __l(newlocale(LC_ALL_MASK, nm, 0))
1519 {
1520     if (__l == 0)
1521         __throw_runtime_error("codecvt_byname<wchar_t, char, mbstate_t>::codecvt_byname"
1522                             " failed to construct for " + string(nm));
1523 }
1524 
~codecvt()1525 codecvt<wchar_t, char, mbstate_t>::~codecvt()
1526 {
1527     if (__l != _LIBCPP_GET_C_LOCALE)
1528         freelocale(__l);
1529 }
1530 
1531 codecvt<wchar_t, char, mbstate_t>::result
do_out(state_type & st,const intern_type * frm,const intern_type * frm_end,const intern_type * & frm_nxt,extern_type * to,extern_type * to_end,extern_type * & to_nxt) const1532 codecvt<wchar_t, char, mbstate_t>::do_out(state_type& st,
1533     const intern_type* frm, const intern_type* frm_end, const intern_type*& frm_nxt,
1534     extern_type* to, extern_type* to_end, extern_type*& to_nxt) const
1535 {
1536     // look for first internal null in frm
1537     const intern_type* fend = frm;
1538     for (; fend != frm_end; ++fend)
1539         if (*fend == 0)
1540             break;
1541     // loop over all null-terminated sequences in frm
1542     to_nxt = to;
1543     for (frm_nxt = frm; frm != frm_end && to != to_end; frm = frm_nxt, to = to_nxt)
1544     {
1545         // save state in case it is needed to recover to_nxt on error
1546         mbstate_t save_state = st;
1547         size_t n = __libcpp_wcsnrtombs_l(to, &frm_nxt, static_cast<size_t>(fend-frm),
1548                                      static_cast<size_t>(to_end-to), &st, __l);
1549         if (n == size_t(-1))
1550         {
1551             // need to recover to_nxt
1552             for (to_nxt = to; frm != frm_nxt; ++frm)
1553             {
1554                 n = __libcpp_wcrtomb_l(to_nxt, *frm, &save_state, __l);
1555                 if (n == size_t(-1))
1556                     break;
1557                 to_nxt += n;
1558             }
1559             frm_nxt = frm;
1560             return error;
1561         }
1562         if (n == 0)
1563             return partial;
1564         to_nxt += n;
1565         if (to_nxt == to_end)
1566             break;
1567         if (fend != frm_end)  // set up next null terminated sequence
1568         {
1569             // Try to write the terminating null
1570             extern_type tmp[MB_LEN_MAX];
1571             n = __libcpp_wcrtomb_l(tmp, intern_type(), &st, __l);
1572             if (n == size_t(-1))  // on error
1573                 return error;
1574             if (n > static_cast<size_t>(to_end-to_nxt))  // is there room?
1575                 return partial;
1576             for (extern_type* p = tmp; n; --n)  // write it
1577                 *to_nxt++ = *p++;
1578             ++frm_nxt;
1579             // look for next null in frm
1580             for (fend = frm_nxt; fend != frm_end; ++fend)
1581                 if (*fend == 0)
1582                     break;
1583         }
1584     }
1585     return frm_nxt == frm_end ? ok : partial;
1586 }
1587 
1588 codecvt<wchar_t, char, mbstate_t>::result
do_in(state_type & st,const extern_type * frm,const extern_type * frm_end,const extern_type * & frm_nxt,intern_type * to,intern_type * to_end,intern_type * & to_nxt) const1589 codecvt<wchar_t, char, mbstate_t>::do_in(state_type& st,
1590     const extern_type* frm, const extern_type* frm_end, const extern_type*& frm_nxt,
1591     intern_type* to, intern_type* to_end, intern_type*& to_nxt) const
1592 {
1593     // look for first internal null in frm
1594     const extern_type* fend = frm;
1595     for (; fend != frm_end; ++fend)
1596         if (*fend == 0)
1597             break;
1598     // loop over all null-terminated sequences in frm
1599     to_nxt = to;
1600     for (frm_nxt = frm; frm != frm_end && to != to_end; frm = frm_nxt, to = to_nxt)
1601     {
1602         // save state in case it is needed to recover to_nxt on error
1603         mbstate_t save_state = st;
1604         size_t n = __libcpp_mbsnrtowcs_l(to, &frm_nxt, static_cast<size_t>(fend-frm),
1605                                      static_cast<size_t>(to_end-to), &st, __l);
1606         if (n == size_t(-1))
1607         {
1608             // need to recover to_nxt
1609             for (to_nxt = to; frm != frm_nxt; ++to_nxt)
1610             {
1611                 n = __libcpp_mbrtowc_l(to_nxt, frm, static_cast<size_t>(fend-frm),
1612                                    &save_state, __l);
1613                 switch (n)
1614                 {
1615                 case 0:
1616                     ++frm;
1617                     break;
1618                 case size_t(-1):
1619                     frm_nxt = frm;
1620                     return error;
1621                 case size_t(-2):
1622                     frm_nxt = frm;
1623                     return partial;
1624                 default:
1625                     frm += n;
1626                     break;
1627                 }
1628             }
1629             frm_nxt = frm;
1630             return frm_nxt == frm_end ? ok : partial;
1631         }
1632         if (n == size_t(-1))
1633             return error;
1634         to_nxt += n;
1635         if (to_nxt == to_end)
1636             break;
1637         if (fend != frm_end)  // set up next null terminated sequence
1638         {
1639             // Try to write the terminating null
1640             n = __libcpp_mbrtowc_l(to_nxt, frm_nxt, 1, &st, __l);
1641             if (n != 0)  // on error
1642                 return error;
1643             ++to_nxt;
1644             ++frm_nxt;
1645             // look for next null in frm
1646             for (fend = frm_nxt; fend != frm_end; ++fend)
1647                 if (*fend == 0)
1648                     break;
1649         }
1650     }
1651     return frm_nxt == frm_end ? ok : partial;
1652 }
1653 
1654 codecvt<wchar_t, char, mbstate_t>::result
do_unshift(state_type & st,extern_type * to,extern_type * to_end,extern_type * & to_nxt) const1655 codecvt<wchar_t, char, mbstate_t>::do_unshift(state_type& st,
1656     extern_type* to, extern_type* to_end, extern_type*& to_nxt) const
1657 {
1658     to_nxt = to;
1659     extern_type tmp[MB_LEN_MAX];
1660     size_t n = __libcpp_wcrtomb_l(tmp, intern_type(), &st, __l);
1661     if (n == size_t(-1) || n == 0)  // on error
1662         return error;
1663     --n;
1664     if (n > static_cast<size_t>(to_end-to_nxt))  // is there room?
1665         return partial;
1666     for (extern_type* p = tmp; n; --n)  // write it
1667         *to_nxt++ = *p++;
1668     return ok;
1669 }
1670 
1671 int
do_encoding() const1672 codecvt<wchar_t, char, mbstate_t>::do_encoding() const  _NOEXCEPT
1673 {
1674     if (__libcpp_mbtowc_l(nullptr, nullptr, MB_LEN_MAX, __l) != 0)
1675         return -1;
1676 
1677     // stateless encoding
1678     if (__l == 0 || __libcpp_mb_cur_max_l(__l) == 1)  // there are no known constant length encodings
1679         return 1;                // which take more than 1 char to form a wchar_t
1680     return 0;
1681 }
1682 
1683 bool
do_always_noconv() const1684 codecvt<wchar_t, char, mbstate_t>::do_always_noconv() const  _NOEXCEPT
1685 {
1686     return false;
1687 }
1688 
1689 int
do_length(state_type & st,const extern_type * frm,const extern_type * frm_end,size_t mx) const1690 codecvt<wchar_t, char, mbstate_t>::do_length(state_type& st,
1691     const extern_type* frm, const extern_type* frm_end, size_t mx) const
1692 {
1693     int nbytes = 0;
1694     for (size_t nwchar_t = 0; nwchar_t < mx && frm != frm_end; ++nwchar_t)
1695     {
1696         size_t n = __libcpp_mbrlen_l(frm, static_cast<size_t>(frm_end-frm), &st, __l);
1697         switch (n)
1698         {
1699         case 0:
1700             ++nbytes;
1701             ++frm;
1702             break;
1703         case size_t(-1):
1704         case size_t(-2):
1705             return nbytes;
1706         default:
1707             nbytes += n;
1708             frm += n;
1709             break;
1710         }
1711     }
1712     return nbytes;
1713 }
1714 
1715 int
do_max_length() const1716 codecvt<wchar_t, char, mbstate_t>::do_max_length() const  _NOEXCEPT
1717 {
1718     return __l == 0 ? 1 : static_cast<int>(__libcpp_mb_cur_max_l(__l));
1719 }
1720 
1721 //                                     Valid UTF ranges
1722 //     UTF-32               UTF-16                          UTF-8               # of code points
1723 //                     first      second       first   second    third   fourth
1724 // 000000 - 00007F  0000 - 007F               00 - 7F                                 127
1725 // 000080 - 0007FF  0080 - 07FF               C2 - DF, 80 - BF                       1920
1726 // 000800 - 000FFF  0800 - 0FFF               E0 - E0, A0 - BF, 80 - BF              2048
1727 // 001000 - 00CFFF  1000 - CFFF               E1 - EC, 80 - BF, 80 - BF             49152
1728 // 00D000 - 00D7FF  D000 - D7FF               ED - ED, 80 - 9F, 80 - BF              2048
1729 // 00D800 - 00DFFF                invalid
1730 // 00E000 - 00FFFF  E000 - FFFF               EE - EF, 80 - BF, 80 - BF              8192
1731 // 010000 - 03FFFF  D800 - D8BF, DC00 - DFFF  F0 - F0, 90 - BF, 80 - BF, 80 - BF   196608
1732 // 040000 - 0FFFFF  D8C0 - DBBF, DC00 - DFFF  F1 - F3, 80 - BF, 80 - BF, 80 - BF   786432
1733 // 100000 - 10FFFF  DBC0 - DBFF, DC00 - DFFF  F4 - F4, 80 - 8F, 80 - BF, 80 - BF    65536
1734 
1735 static
1736 codecvt_base::result
utf16_to_utf8(const uint16_t * frm,const uint16_t * frm_end,const uint16_t * & frm_nxt,uint8_t * to,uint8_t * to_end,uint8_t * & to_nxt,unsigned long Maxcode=0x10FFFF,codecvt_mode mode=codecvt_mode (0))1737 utf16_to_utf8(const uint16_t* frm, const uint16_t* frm_end, const uint16_t*& frm_nxt,
1738               uint8_t* to, uint8_t* to_end, uint8_t*& to_nxt,
1739               unsigned long Maxcode = 0x10FFFF, codecvt_mode mode = codecvt_mode(0))
1740 {
1741     frm_nxt = frm;
1742     to_nxt = to;
1743     if (mode & generate_header)
1744     {
1745         if (to_end-to_nxt < 3)
1746             return codecvt_base::partial;
1747         *to_nxt++ = static_cast<uint8_t>(0xEF);
1748         *to_nxt++ = static_cast<uint8_t>(0xBB);
1749         *to_nxt++ = static_cast<uint8_t>(0xBF);
1750     }
1751     for (; frm_nxt < frm_end; ++frm_nxt)
1752     {
1753         uint16_t wc1 = *frm_nxt;
1754         if (wc1 > Maxcode)
1755             return codecvt_base::error;
1756         if (wc1 < 0x0080)
1757         {
1758             if (to_end-to_nxt < 1)
1759                 return codecvt_base::partial;
1760             *to_nxt++ = static_cast<uint8_t>(wc1);
1761         }
1762         else if (wc1 < 0x0800)
1763         {
1764             if (to_end-to_nxt < 2)
1765                 return codecvt_base::partial;
1766             *to_nxt++ = static_cast<uint8_t>(0xC0 | (wc1 >> 6));
1767             *to_nxt++ = static_cast<uint8_t>(0x80 | (wc1 & 0x03F));
1768         }
1769         else if (wc1 < 0xD800)
1770         {
1771             if (to_end-to_nxt < 3)
1772                 return codecvt_base::partial;
1773             *to_nxt++ = static_cast<uint8_t>(0xE0 |  (wc1 >> 12));
1774             *to_nxt++ = static_cast<uint8_t>(0x80 | ((wc1 & 0x0FC0) >> 6));
1775             *to_nxt++ = static_cast<uint8_t>(0x80 |  (wc1 & 0x003F));
1776         }
1777         else if (wc1 < 0xDC00)
1778         {
1779             if (frm_end-frm_nxt < 2)
1780                 return codecvt_base::partial;
1781             uint16_t wc2 = frm_nxt[1];
1782             if ((wc2 & 0xFC00) != 0xDC00)
1783                 return codecvt_base::error;
1784             if (to_end-to_nxt < 4)
1785                 return codecvt_base::partial;
1786             if (((((wc1 & 0x03C0UL) >> 6) + 1) << 16) +
1787                 ((wc1 & 0x003FUL) << 10) + (wc2 & 0x03FF) > Maxcode)
1788                 return codecvt_base::error;
1789             ++frm_nxt;
1790             uint8_t z = ((wc1 & 0x03C0) >> 6) + 1;
1791             *to_nxt++ = static_cast<uint8_t>(0xF0 | (z >> 2));
1792             *to_nxt++ = static_cast<uint8_t>(0x80 | ((z & 0x03) << 4)     | ((wc1 & 0x003C) >> 2));
1793             *to_nxt++ = static_cast<uint8_t>(0x80 | ((wc1 & 0x0003) << 4) | ((wc2 & 0x03C0) >> 6));
1794             *to_nxt++ = static_cast<uint8_t>(0x80 |  (wc2 & 0x003F));
1795         }
1796         else if (wc1 < 0xE000)
1797         {
1798             return codecvt_base::error;
1799         }
1800         else
1801         {
1802             if (to_end-to_nxt < 3)
1803                 return codecvt_base::partial;
1804             *to_nxt++ = static_cast<uint8_t>(0xE0 |  (wc1 >> 12));
1805             *to_nxt++ = static_cast<uint8_t>(0x80 | ((wc1 & 0x0FC0) >> 6));
1806             *to_nxt++ = static_cast<uint8_t>(0x80 |  (wc1 & 0x003F));
1807         }
1808     }
1809     return codecvt_base::ok;
1810 }
1811 
1812 static
1813 codecvt_base::result
utf16_to_utf8(const uint32_t * frm,const uint32_t * frm_end,const uint32_t * & frm_nxt,uint8_t * to,uint8_t * to_end,uint8_t * & to_nxt,unsigned long Maxcode=0x10FFFF,codecvt_mode mode=codecvt_mode (0))1814 utf16_to_utf8(const uint32_t* frm, const uint32_t* frm_end, const uint32_t*& frm_nxt,
1815               uint8_t* to, uint8_t* to_end, uint8_t*& to_nxt,
1816               unsigned long Maxcode = 0x10FFFF, codecvt_mode mode = codecvt_mode(0))
1817 {
1818     frm_nxt = frm;
1819     to_nxt = to;
1820     if (mode & generate_header)
1821     {
1822         if (to_end-to_nxt < 3)
1823             return codecvt_base::partial;
1824         *to_nxt++ = static_cast<uint8_t>(0xEF);
1825         *to_nxt++ = static_cast<uint8_t>(0xBB);
1826         *to_nxt++ = static_cast<uint8_t>(0xBF);
1827     }
1828     for (; frm_nxt < frm_end; ++frm_nxt)
1829     {
1830         uint16_t wc1 = static_cast<uint16_t>(*frm_nxt);
1831         if (wc1 > Maxcode)
1832             return codecvt_base::error;
1833         if (wc1 < 0x0080)
1834         {
1835             if (to_end-to_nxt < 1)
1836                 return codecvt_base::partial;
1837             *to_nxt++ = static_cast<uint8_t>(wc1);
1838         }
1839         else if (wc1 < 0x0800)
1840         {
1841             if (to_end-to_nxt < 2)
1842                 return codecvt_base::partial;
1843             *to_nxt++ = static_cast<uint8_t>(0xC0 | (wc1 >> 6));
1844             *to_nxt++ = static_cast<uint8_t>(0x80 | (wc1 & 0x03F));
1845         }
1846         else if (wc1 < 0xD800)
1847         {
1848             if (to_end-to_nxt < 3)
1849                 return codecvt_base::partial;
1850             *to_nxt++ = static_cast<uint8_t>(0xE0 |  (wc1 >> 12));
1851             *to_nxt++ = static_cast<uint8_t>(0x80 | ((wc1 & 0x0FC0) >> 6));
1852             *to_nxt++ = static_cast<uint8_t>(0x80 |  (wc1 & 0x003F));
1853         }
1854         else if (wc1 < 0xDC00)
1855         {
1856             if (frm_end-frm_nxt < 2)
1857                 return codecvt_base::partial;
1858             uint16_t wc2 = static_cast<uint16_t>(frm_nxt[1]);
1859             if ((wc2 & 0xFC00) != 0xDC00)
1860                 return codecvt_base::error;
1861             if (to_end-to_nxt < 4)
1862                 return codecvt_base::partial;
1863             if (((((wc1 & 0x03C0UL) >> 6) + 1) << 16) +
1864                 ((wc1 & 0x003FUL) << 10) + (wc2 & 0x03FF) > Maxcode)
1865                 return codecvt_base::error;
1866             ++frm_nxt;
1867             uint8_t z = ((wc1 & 0x03C0) >> 6) + 1;
1868             *to_nxt++ = static_cast<uint8_t>(0xF0 | (z >> 2));
1869             *to_nxt++ = static_cast<uint8_t>(0x80 | ((z & 0x03) << 4)     | ((wc1 & 0x003C) >> 2));
1870             *to_nxt++ = static_cast<uint8_t>(0x80 | ((wc1 & 0x0003) << 4) | ((wc2 & 0x03C0) >> 6));
1871             *to_nxt++ = static_cast<uint8_t>(0x80 |  (wc2 & 0x003F));
1872         }
1873         else if (wc1 < 0xE000)
1874         {
1875             return codecvt_base::error;
1876         }
1877         else
1878         {
1879             if (to_end-to_nxt < 3)
1880                 return codecvt_base::partial;
1881             *to_nxt++ = static_cast<uint8_t>(0xE0 |  (wc1 >> 12));
1882             *to_nxt++ = static_cast<uint8_t>(0x80 | ((wc1 & 0x0FC0) >> 6));
1883             *to_nxt++ = static_cast<uint8_t>(0x80 |  (wc1 & 0x003F));
1884         }
1885     }
1886     return codecvt_base::ok;
1887 }
1888 
1889 static
1890 codecvt_base::result
utf8_to_utf16(const uint8_t * frm,const uint8_t * frm_end,const uint8_t * & frm_nxt,uint16_t * to,uint16_t * to_end,uint16_t * & to_nxt,unsigned long Maxcode=0x10FFFF,codecvt_mode mode=codecvt_mode (0))1891 utf8_to_utf16(const uint8_t* frm, const uint8_t* frm_end, const uint8_t*& frm_nxt,
1892               uint16_t* to, uint16_t* to_end, uint16_t*& to_nxt,
1893               unsigned long Maxcode = 0x10FFFF, codecvt_mode mode = codecvt_mode(0))
1894 {
1895     frm_nxt = frm;
1896     to_nxt = to;
1897     if (mode & consume_header)
1898     {
1899         if (frm_end-frm_nxt >= 3 && frm_nxt[0] == 0xEF && frm_nxt[1] == 0xBB &&
1900                                                           frm_nxt[2] == 0xBF)
1901             frm_nxt += 3;
1902     }
1903     for (; frm_nxt < frm_end && to_nxt < to_end; ++to_nxt)
1904     {
1905         uint8_t c1 = *frm_nxt;
1906         if (c1 > Maxcode)
1907             return codecvt_base::error;
1908         if (c1 < 0x80)
1909         {
1910             *to_nxt = static_cast<uint16_t>(c1);
1911             ++frm_nxt;
1912         }
1913         else if (c1 < 0xC2)
1914         {
1915             return codecvt_base::error;
1916         }
1917         else if (c1 < 0xE0)
1918         {
1919             if (frm_end-frm_nxt < 2)
1920                 return codecvt_base::partial;
1921             uint8_t c2 = frm_nxt[1];
1922             if ((c2 & 0xC0) != 0x80)
1923                 return codecvt_base::error;
1924             uint16_t t = static_cast<uint16_t>(((c1 & 0x1F) << 6) | (c2 & 0x3F));
1925             if (t > Maxcode)
1926                 return codecvt_base::error;
1927             *to_nxt = t;
1928             frm_nxt += 2;
1929         }
1930         else if (c1 < 0xF0)
1931         {
1932             if (frm_end-frm_nxt < 3)
1933                 return codecvt_base::partial;
1934             uint8_t c2 = frm_nxt[1];
1935             uint8_t c3 = frm_nxt[2];
1936             switch (c1)
1937             {
1938             case 0xE0:
1939                 if ((c2 & 0xE0) != 0xA0)
1940                     return codecvt_base::error;
1941                  break;
1942             case 0xED:
1943                 if ((c2 & 0xE0) != 0x80)
1944                     return codecvt_base::error;
1945                  break;
1946             default:
1947                 if ((c2 & 0xC0) != 0x80)
1948                     return codecvt_base::error;
1949                  break;
1950             }
1951             if ((c3 & 0xC0) != 0x80)
1952                 return codecvt_base::error;
1953             uint16_t t = static_cast<uint16_t>(((c1 & 0x0F) << 12)
1954                                              | ((c2 & 0x3F) << 6)
1955                                              |  (c3 & 0x3F));
1956             if (t > Maxcode)
1957                 return codecvt_base::error;
1958             *to_nxt = t;
1959             frm_nxt += 3;
1960         }
1961         else if (c1 < 0xF5)
1962         {
1963             if (frm_end-frm_nxt < 4)
1964                 return codecvt_base::partial;
1965             uint8_t c2 = frm_nxt[1];
1966             uint8_t c3 = frm_nxt[2];
1967             uint8_t c4 = frm_nxt[3];
1968             switch (c1)
1969             {
1970             case 0xF0:
1971                 if (!(0x90 <= c2 && c2 <= 0xBF))
1972                     return codecvt_base::error;
1973                  break;
1974             case 0xF4:
1975                 if ((c2 & 0xF0) != 0x80)
1976                     return codecvt_base::error;
1977                  break;
1978             default:
1979                 if ((c2 & 0xC0) != 0x80)
1980                     return codecvt_base::error;
1981                  break;
1982             }
1983             if ((c3 & 0xC0) != 0x80 || (c4 & 0xC0) != 0x80)
1984                 return codecvt_base::error;
1985             if (to_end-to_nxt < 2)
1986                 return codecvt_base::partial;
1987             if ((((c1 & 7UL) << 18) +
1988                 ((c2 & 0x3FUL) << 12) +
1989                 ((c3 & 0x3FUL) << 6) + (c4 & 0x3F)) > Maxcode)
1990                 return codecvt_base::error;
1991             *to_nxt = static_cast<uint16_t>(
1992                     0xD800
1993                   | (((((c1 & 0x07) << 2) | ((c2 & 0x30) >> 4)) - 1) << 6)
1994                   | ((c2 & 0x0F) << 2)
1995                   | ((c3 & 0x30) >> 4));
1996             *++to_nxt = static_cast<uint16_t>(
1997                     0xDC00
1998                   | ((c3 & 0x0F) << 6)
1999                   |  (c4 & 0x3F));
2000             frm_nxt += 4;
2001         }
2002         else
2003         {
2004             return codecvt_base::error;
2005         }
2006     }
2007     return frm_nxt < frm_end ? codecvt_base::partial : codecvt_base::ok;
2008 }
2009 
2010 static
2011 codecvt_base::result
utf8_to_utf16(const uint8_t * frm,const uint8_t * frm_end,const uint8_t * & frm_nxt,uint32_t * to,uint32_t * to_end,uint32_t * & to_nxt,unsigned long Maxcode=0x10FFFF,codecvt_mode mode=codecvt_mode (0))2012 utf8_to_utf16(const uint8_t* frm, const uint8_t* frm_end, const uint8_t*& frm_nxt,
2013               uint32_t* to, uint32_t* to_end, uint32_t*& to_nxt,
2014               unsigned long Maxcode = 0x10FFFF, codecvt_mode mode = codecvt_mode(0))
2015 {
2016     frm_nxt = frm;
2017     to_nxt = to;
2018     if (mode & consume_header)
2019     {
2020         if (frm_end-frm_nxt >= 3 && frm_nxt[0] == 0xEF && frm_nxt[1] == 0xBB &&
2021                                                           frm_nxt[2] == 0xBF)
2022             frm_nxt += 3;
2023     }
2024     for (; frm_nxt < frm_end && to_nxt < to_end; ++to_nxt)
2025     {
2026         uint8_t c1 = *frm_nxt;
2027         if (c1 > Maxcode)
2028             return codecvt_base::error;
2029         if (c1 < 0x80)
2030         {
2031             *to_nxt = static_cast<uint32_t>(c1);
2032             ++frm_nxt;
2033         }
2034         else if (c1 < 0xC2)
2035         {
2036             return codecvt_base::error;
2037         }
2038         else if (c1 < 0xE0)
2039         {
2040             if (frm_end-frm_nxt < 2)
2041                 return codecvt_base::partial;
2042             uint8_t c2 = frm_nxt[1];
2043             if ((c2 & 0xC0) != 0x80)
2044                 return codecvt_base::error;
2045             uint16_t t = static_cast<uint16_t>(((c1 & 0x1F) << 6) | (c2 & 0x3F));
2046             if (t > Maxcode)
2047                 return codecvt_base::error;
2048             *to_nxt = static_cast<uint32_t>(t);
2049             frm_nxt += 2;
2050         }
2051         else if (c1 < 0xF0)
2052         {
2053             if (frm_end-frm_nxt < 3)
2054                 return codecvt_base::partial;
2055             uint8_t c2 = frm_nxt[1];
2056             uint8_t c3 = frm_nxt[2];
2057             switch (c1)
2058             {
2059             case 0xE0:
2060                 if ((c2 & 0xE0) != 0xA0)
2061                     return codecvt_base::error;
2062                  break;
2063             case 0xED:
2064                 if ((c2 & 0xE0) != 0x80)
2065                     return codecvt_base::error;
2066                  break;
2067             default:
2068                 if ((c2 & 0xC0) != 0x80)
2069                     return codecvt_base::error;
2070                  break;
2071             }
2072             if ((c3 & 0xC0) != 0x80)
2073                 return codecvt_base::error;
2074             uint16_t t = static_cast<uint16_t>(((c1 & 0x0F) << 12)
2075                                              | ((c2 & 0x3F) << 6)
2076                                              |  (c3 & 0x3F));
2077             if (t > Maxcode)
2078                 return codecvt_base::error;
2079             *to_nxt = static_cast<uint32_t>(t);
2080             frm_nxt += 3;
2081         }
2082         else if (c1 < 0xF5)
2083         {
2084             if (frm_end-frm_nxt < 4)
2085                 return codecvt_base::partial;
2086             uint8_t c2 = frm_nxt[1];
2087             uint8_t c3 = frm_nxt[2];
2088             uint8_t c4 = frm_nxt[3];
2089             switch (c1)
2090             {
2091             case 0xF0:
2092                 if (!(0x90 <= c2 && c2 <= 0xBF))
2093                     return codecvt_base::error;
2094                  break;
2095             case 0xF4:
2096                 if ((c2 & 0xF0) != 0x80)
2097                     return codecvt_base::error;
2098                  break;
2099             default:
2100                 if ((c2 & 0xC0) != 0x80)
2101                     return codecvt_base::error;
2102                  break;
2103             }
2104             if ((c3 & 0xC0) != 0x80 || (c4 & 0xC0) != 0x80)
2105                 return codecvt_base::error;
2106             if (to_end-to_nxt < 2)
2107                 return codecvt_base::partial;
2108             if ((((c1 & 7UL) << 18) +
2109                 ((c2 & 0x3FUL) << 12) +
2110                 ((c3 & 0x3FUL) << 6) + (c4 & 0x3F)) > Maxcode)
2111                 return codecvt_base::error;
2112             *to_nxt = static_cast<uint32_t>(
2113                     0xD800
2114                   | (((((c1 & 0x07) << 2) | ((c2 & 0x30) >> 4)) - 1) << 6)
2115                   | ((c2 & 0x0F) << 2)
2116                   | ((c3 & 0x30) >> 4));
2117             *++to_nxt = static_cast<uint32_t>(
2118                     0xDC00
2119                   | ((c3 & 0x0F) << 6)
2120                   |  (c4 & 0x3F));
2121             frm_nxt += 4;
2122         }
2123         else
2124         {
2125             return codecvt_base::error;
2126         }
2127     }
2128     return frm_nxt < frm_end ? codecvt_base::partial : codecvt_base::ok;
2129 }
2130 
2131 static
2132 int
utf8_to_utf16_length(const uint8_t * frm,const uint8_t * frm_end,size_t mx,unsigned long Maxcode=0x10FFFF,codecvt_mode mode=codecvt_mode (0))2133 utf8_to_utf16_length(const uint8_t* frm, const uint8_t* frm_end,
2134                      size_t mx, unsigned long Maxcode = 0x10FFFF,
2135                      codecvt_mode mode = codecvt_mode(0))
2136 {
2137     const uint8_t* frm_nxt = frm;
2138     if (mode & consume_header)
2139     {
2140         if (frm_end-frm_nxt >= 3 && frm_nxt[0] == 0xEF && frm_nxt[1] == 0xBB &&
2141                                                           frm_nxt[2] == 0xBF)
2142             frm_nxt += 3;
2143     }
2144     for (size_t nchar16_t = 0; frm_nxt < frm_end && nchar16_t < mx; ++nchar16_t)
2145     {
2146         uint8_t c1 = *frm_nxt;
2147         if (c1 > Maxcode)
2148             break;
2149         if (c1 < 0x80)
2150         {
2151             ++frm_nxt;
2152         }
2153         else if (c1 < 0xC2)
2154         {
2155             break;
2156         }
2157         else if (c1 < 0xE0)
2158         {
2159             if ((frm_end-frm_nxt < 2) || (frm_nxt[1] & 0xC0) != 0x80)
2160                 break;
2161             uint16_t t = static_cast<uint16_t>(((c1 & 0x1F) << 6) | (frm_nxt[1] & 0x3F));
2162             if (t > Maxcode)
2163                 break;
2164             frm_nxt += 2;
2165         }
2166         else if (c1 < 0xF0)
2167         {
2168             if (frm_end-frm_nxt < 3)
2169                 break;
2170             uint8_t c2 = frm_nxt[1];
2171             uint8_t c3 = frm_nxt[2];
2172             switch (c1)
2173             {
2174             case 0xE0:
2175                 if ((c2 & 0xE0) != 0xA0)
2176                     return static_cast<int>(frm_nxt - frm);
2177                 break;
2178             case 0xED:
2179                 if ((c2 & 0xE0) != 0x80)
2180                     return static_cast<int>(frm_nxt - frm);
2181                  break;
2182             default:
2183                 if ((c2 & 0xC0) != 0x80)
2184                     return static_cast<int>(frm_nxt - frm);
2185                  break;
2186             }
2187             if ((c3 & 0xC0) != 0x80)
2188                 break;
2189             if ((((c1 & 0x0Fu) << 12) | ((c2 & 0x3Fu) << 6) | (c3 & 0x3Fu)) > Maxcode)
2190                 break;
2191             frm_nxt += 3;
2192         }
2193         else if (c1 < 0xF5)
2194         {
2195             if (frm_end-frm_nxt < 4 || mx-nchar16_t < 2)
2196                 break;
2197             uint8_t c2 = frm_nxt[1];
2198             uint8_t c3 = frm_nxt[2];
2199             uint8_t c4 = frm_nxt[3];
2200             switch (c1)
2201             {
2202             case 0xF0:
2203                 if (!(0x90 <= c2 && c2 <= 0xBF))
2204                     return static_cast<int>(frm_nxt - frm);
2205                  break;
2206             case 0xF4:
2207                 if ((c2 & 0xF0) != 0x80)
2208                     return static_cast<int>(frm_nxt - frm);
2209                  break;
2210             default:
2211                 if ((c2 & 0xC0) != 0x80)
2212                     return static_cast<int>(frm_nxt - frm);
2213                  break;
2214             }
2215             if ((c3 & 0xC0) != 0x80 || (c4 & 0xC0) != 0x80)
2216                 break;
2217             if ((((c1 & 7UL) << 18) +
2218                 ((c2 & 0x3FUL) << 12) +
2219                 ((c3 & 0x3FUL) << 6) + (c4 & 0x3F)) > Maxcode)
2220                 break;
2221             ++nchar16_t;
2222             frm_nxt += 4;
2223         }
2224         else
2225         {
2226             break;
2227         }
2228     }
2229     return static_cast<int>(frm_nxt - frm);
2230 }
2231 
2232 static
2233 codecvt_base::result
ucs4_to_utf8(const uint32_t * frm,const uint32_t * frm_end,const uint32_t * & frm_nxt,uint8_t * to,uint8_t * to_end,uint8_t * & to_nxt,unsigned long Maxcode=0x10FFFF,codecvt_mode mode=codecvt_mode (0))2234 ucs4_to_utf8(const uint32_t* frm, const uint32_t* frm_end, const uint32_t*& frm_nxt,
2235              uint8_t* to, uint8_t* to_end, uint8_t*& to_nxt,
2236              unsigned long Maxcode = 0x10FFFF, codecvt_mode mode = codecvt_mode(0))
2237 {
2238     frm_nxt = frm;
2239     to_nxt = to;
2240     if (mode & generate_header)
2241     {
2242         if (to_end-to_nxt < 3)
2243             return codecvt_base::partial;
2244         *to_nxt++ = static_cast<uint8_t>(0xEF);
2245         *to_nxt++ = static_cast<uint8_t>(0xBB);
2246         *to_nxt++ = static_cast<uint8_t>(0xBF);
2247     }
2248     for (; frm_nxt < frm_end; ++frm_nxt)
2249     {
2250         uint32_t wc = *frm_nxt;
2251         if ((wc & 0xFFFFF800) == 0x00D800 || wc > Maxcode)
2252             return codecvt_base::error;
2253         if (wc < 0x000080)
2254         {
2255             if (to_end-to_nxt < 1)
2256                 return codecvt_base::partial;
2257             *to_nxt++ = static_cast<uint8_t>(wc);
2258         }
2259         else if (wc < 0x000800)
2260         {
2261             if (to_end-to_nxt < 2)
2262                 return codecvt_base::partial;
2263             *to_nxt++ = static_cast<uint8_t>(0xC0 | (wc >> 6));
2264             *to_nxt++ = static_cast<uint8_t>(0x80 | (wc & 0x03F));
2265         }
2266         else if (wc < 0x010000)
2267         {
2268             if (to_end-to_nxt < 3)
2269                 return codecvt_base::partial;
2270             *to_nxt++ = static_cast<uint8_t>(0xE0 |  (wc >> 12));
2271             *to_nxt++ = static_cast<uint8_t>(0x80 | ((wc & 0x0FC0) >> 6));
2272             *to_nxt++ = static_cast<uint8_t>(0x80 |  (wc & 0x003F));
2273         }
2274         else // if (wc < 0x110000)
2275         {
2276             if (to_end-to_nxt < 4)
2277                 return codecvt_base::partial;
2278             *to_nxt++ = static_cast<uint8_t>(0xF0 |  (wc >> 18));
2279             *to_nxt++ = static_cast<uint8_t>(0x80 | ((wc & 0x03F000) >> 12));
2280             *to_nxt++ = static_cast<uint8_t>(0x80 | ((wc & 0x000FC0) >> 6));
2281             *to_nxt++ = static_cast<uint8_t>(0x80 |  (wc & 0x00003F));
2282         }
2283     }
2284     return codecvt_base::ok;
2285 }
2286 
2287 static
2288 codecvt_base::result
utf8_to_ucs4(const uint8_t * frm,const uint8_t * frm_end,const uint8_t * & frm_nxt,uint32_t * to,uint32_t * to_end,uint32_t * & to_nxt,unsigned long Maxcode=0x10FFFF,codecvt_mode mode=codecvt_mode (0))2289 utf8_to_ucs4(const uint8_t* frm, const uint8_t* frm_end, const uint8_t*& frm_nxt,
2290              uint32_t* to, uint32_t* to_end, uint32_t*& to_nxt,
2291              unsigned long Maxcode = 0x10FFFF, codecvt_mode mode = codecvt_mode(0))
2292 {
2293     frm_nxt = frm;
2294     to_nxt = to;
2295     if (mode & consume_header)
2296     {
2297         if (frm_end-frm_nxt >= 3 && frm_nxt[0] == 0xEF && frm_nxt[1] == 0xBB &&
2298                                                           frm_nxt[2] == 0xBF)
2299             frm_nxt += 3;
2300     }
2301     for (; frm_nxt < frm_end && to_nxt < to_end; ++to_nxt)
2302     {
2303         uint8_t c1 = static_cast<uint8_t>(*frm_nxt);
2304         if (c1 < 0x80)
2305         {
2306             if (c1 > Maxcode)
2307                 return codecvt_base::error;
2308             *to_nxt = static_cast<uint32_t>(c1);
2309             ++frm_nxt;
2310         }
2311         else if (c1 < 0xC2)
2312         {
2313             return codecvt_base::error;
2314         }
2315         else if (c1 < 0xE0)
2316         {
2317             if (frm_end-frm_nxt < 2)
2318                 return codecvt_base::partial;
2319             uint8_t c2 = frm_nxt[1];
2320             if ((c2 & 0xC0) != 0x80)
2321                 return codecvt_base::error;
2322             uint32_t t = static_cast<uint32_t>(((c1 & 0x1F) << 6)
2323                                               | (c2 & 0x3F));
2324             if (t > Maxcode)
2325                 return codecvt_base::error;
2326             *to_nxt = t;
2327             frm_nxt += 2;
2328         }
2329         else if (c1 < 0xF0)
2330         {
2331             if (frm_end-frm_nxt < 3)
2332                 return codecvt_base::partial;
2333             uint8_t c2 = frm_nxt[1];
2334             uint8_t c3 = frm_nxt[2];
2335             switch (c1)
2336             {
2337             case 0xE0:
2338                 if ((c2 & 0xE0) != 0xA0)
2339                     return codecvt_base::error;
2340                  break;
2341             case 0xED:
2342                 if ((c2 & 0xE0) != 0x80)
2343                     return codecvt_base::error;
2344                  break;
2345             default:
2346                 if ((c2 & 0xC0) != 0x80)
2347                     return codecvt_base::error;
2348                  break;
2349             }
2350             if ((c3 & 0xC0) != 0x80)
2351                 return codecvt_base::error;
2352             uint32_t t = static_cast<uint32_t>(((c1 & 0x0F) << 12)
2353                                              | ((c2 & 0x3F) << 6)
2354                                              |  (c3 & 0x3F));
2355             if (t > Maxcode)
2356                 return codecvt_base::error;
2357             *to_nxt = t;
2358             frm_nxt += 3;
2359         }
2360         else if (c1 < 0xF5)
2361         {
2362             if (frm_end-frm_nxt < 4)
2363                 return codecvt_base::partial;
2364             uint8_t c2 = frm_nxt[1];
2365             uint8_t c3 = frm_nxt[2];
2366             uint8_t c4 = frm_nxt[3];
2367             switch (c1)
2368             {
2369             case 0xF0:
2370                 if (!(0x90 <= c2 && c2 <= 0xBF))
2371                     return codecvt_base::error;
2372                  break;
2373             case 0xF4:
2374                 if ((c2 & 0xF0) != 0x80)
2375                     return codecvt_base::error;
2376                  break;
2377             default:
2378                 if ((c2 & 0xC0) != 0x80)
2379                     return codecvt_base::error;
2380                  break;
2381             }
2382             if ((c3 & 0xC0) != 0x80 || (c4 & 0xC0) != 0x80)
2383                 return codecvt_base::error;
2384             uint32_t t = static_cast<uint32_t>(((c1 & 0x07) << 18)
2385                                              | ((c2 & 0x3F) << 12)
2386                                              | ((c3 & 0x3F) << 6)
2387                                              |  (c4 & 0x3F));
2388             if (t > Maxcode)
2389                 return codecvt_base::error;
2390             *to_nxt = t;
2391             frm_nxt += 4;
2392         }
2393         else
2394         {
2395             return codecvt_base::error;
2396         }
2397     }
2398     return frm_nxt < frm_end ? codecvt_base::partial : codecvt_base::ok;
2399 }
2400 
2401 static
2402 int
utf8_to_ucs4_length(const uint8_t * frm,const uint8_t * frm_end,size_t mx,unsigned long Maxcode=0x10FFFF,codecvt_mode mode=codecvt_mode (0))2403 utf8_to_ucs4_length(const uint8_t* frm, const uint8_t* frm_end,
2404                     size_t mx, unsigned long Maxcode = 0x10FFFF,
2405                     codecvt_mode mode = codecvt_mode(0))
2406 {
2407     const uint8_t* frm_nxt = frm;
2408     if (mode & consume_header)
2409     {
2410         if (frm_end-frm_nxt >= 3 && frm_nxt[0] == 0xEF && frm_nxt[1] == 0xBB &&
2411                                                           frm_nxt[2] == 0xBF)
2412             frm_nxt += 3;
2413     }
2414     for (size_t nchar32_t = 0; frm_nxt < frm_end && nchar32_t < mx; ++nchar32_t)
2415     {
2416         uint8_t c1 = static_cast<uint8_t>(*frm_nxt);
2417         if (c1 < 0x80)
2418         {
2419             if (c1 > Maxcode)
2420                 break;
2421             ++frm_nxt;
2422         }
2423         else if (c1 < 0xC2)
2424         {
2425             break;
2426         }
2427         else if (c1 < 0xE0)
2428         {
2429             if ((frm_end-frm_nxt < 2) || ((frm_nxt[1] & 0xC0) != 0x80))
2430                 break;
2431             if ((((c1 & 0x1Fu) << 6) | (frm_nxt[1] & 0x3Fu)) > Maxcode)
2432                 break;
2433             frm_nxt += 2;
2434         }
2435         else if (c1 < 0xF0)
2436         {
2437             if (frm_end-frm_nxt < 3)
2438                 break;
2439             uint8_t c2 = frm_nxt[1];
2440             uint8_t c3 = frm_nxt[2];
2441             switch (c1)
2442             {
2443             case 0xE0:
2444                 if ((c2 & 0xE0) != 0xA0)
2445                     return static_cast<int>(frm_nxt - frm);
2446                 break;
2447             case 0xED:
2448                 if ((c2 & 0xE0) != 0x80)
2449                     return static_cast<int>(frm_nxt - frm);
2450                  break;
2451             default:
2452                 if ((c2 & 0xC0) != 0x80)
2453                     return static_cast<int>(frm_nxt - frm);
2454                  break;
2455             }
2456             if ((c3 & 0xC0) != 0x80)
2457                 break;
2458             if ((((c1 & 0x0Fu) << 12) | ((c2 & 0x3Fu) << 6) | (c3 & 0x3Fu)) > Maxcode)
2459                 break;
2460             frm_nxt += 3;
2461         }
2462         else if (c1 < 0xF5)
2463         {
2464             if (frm_end-frm_nxt < 4)
2465                 break;
2466             uint8_t c2 = frm_nxt[1];
2467             uint8_t c3 = frm_nxt[2];
2468             uint8_t c4 = frm_nxt[3];
2469             switch (c1)
2470             {
2471             case 0xF0:
2472                 if (!(0x90 <= c2 && c2 <= 0xBF))
2473                     return static_cast<int>(frm_nxt - frm);
2474                  break;
2475             case 0xF4:
2476                 if ((c2 & 0xF0) != 0x80)
2477                     return static_cast<int>(frm_nxt - frm);
2478                  break;
2479             default:
2480                 if ((c2 & 0xC0) != 0x80)
2481                     return static_cast<int>(frm_nxt - frm);
2482                  break;
2483             }
2484             if ((c3 & 0xC0) != 0x80 || (c4 & 0xC0) != 0x80)
2485                 break;
2486             if ((((c1 & 0x07u) << 18) | ((c2 & 0x3Fu) << 12) |
2487                  ((c3 & 0x3Fu) << 6)  |  (c4 & 0x3Fu)) > Maxcode)
2488                 break;
2489             frm_nxt += 4;
2490         }
2491         else
2492         {
2493             break;
2494         }
2495     }
2496     return static_cast<int>(frm_nxt - frm);
2497 }
2498 
2499 static
2500 codecvt_base::result
ucs2_to_utf8(const uint16_t * frm,const uint16_t * frm_end,const uint16_t * & frm_nxt,uint8_t * to,uint8_t * to_end,uint8_t * & to_nxt,unsigned long Maxcode=0x10FFFF,codecvt_mode mode=codecvt_mode (0))2501 ucs2_to_utf8(const uint16_t* frm, const uint16_t* frm_end, const uint16_t*& frm_nxt,
2502              uint8_t* to, uint8_t* to_end, uint8_t*& to_nxt,
2503              unsigned long Maxcode = 0x10FFFF, codecvt_mode mode = codecvt_mode(0))
2504 {
2505     frm_nxt = frm;
2506     to_nxt = to;
2507     if (mode & generate_header)
2508     {
2509         if (to_end-to_nxt < 3)
2510             return codecvt_base::partial;
2511         *to_nxt++ = static_cast<uint8_t>(0xEF);
2512         *to_nxt++ = static_cast<uint8_t>(0xBB);
2513         *to_nxt++ = static_cast<uint8_t>(0xBF);
2514     }
2515     for (; frm_nxt < frm_end; ++frm_nxt)
2516     {
2517         uint16_t wc = *frm_nxt;
2518         if ((wc & 0xF800) == 0xD800 || wc > Maxcode)
2519             return codecvt_base::error;
2520         if (wc < 0x0080)
2521         {
2522             if (to_end-to_nxt < 1)
2523                 return codecvt_base::partial;
2524             *to_nxt++ = static_cast<uint8_t>(wc);
2525         }
2526         else if (wc < 0x0800)
2527         {
2528             if (to_end-to_nxt < 2)
2529                 return codecvt_base::partial;
2530             *to_nxt++ = static_cast<uint8_t>(0xC0 | (wc >> 6));
2531             *to_nxt++ = static_cast<uint8_t>(0x80 | (wc & 0x03F));
2532         }
2533         else // if (wc <= 0xFFFF)
2534         {
2535             if (to_end-to_nxt < 3)
2536                 return codecvt_base::partial;
2537             *to_nxt++ = static_cast<uint8_t>(0xE0 |  (wc >> 12));
2538             *to_nxt++ = static_cast<uint8_t>(0x80 | ((wc & 0x0FC0) >> 6));
2539             *to_nxt++ = static_cast<uint8_t>(0x80 |  (wc & 0x003F));
2540         }
2541     }
2542     return codecvt_base::ok;
2543 }
2544 
2545 static
2546 codecvt_base::result
utf8_to_ucs2(const uint8_t * frm,const uint8_t * frm_end,const uint8_t * & frm_nxt,uint16_t * to,uint16_t * to_end,uint16_t * & to_nxt,unsigned long Maxcode=0x10FFFF,codecvt_mode mode=codecvt_mode (0))2547 utf8_to_ucs2(const uint8_t* frm, const uint8_t* frm_end, const uint8_t*& frm_nxt,
2548              uint16_t* to, uint16_t* to_end, uint16_t*& to_nxt,
2549              unsigned long Maxcode = 0x10FFFF, codecvt_mode mode = codecvt_mode(0))
2550 {
2551     frm_nxt = frm;
2552     to_nxt = to;
2553     if (mode & consume_header)
2554     {
2555         if (frm_end-frm_nxt >= 3 && frm_nxt[0] == 0xEF && frm_nxt[1] == 0xBB &&
2556                                                           frm_nxt[2] == 0xBF)
2557             frm_nxt += 3;
2558     }
2559     for (; frm_nxt < frm_end && to_nxt < to_end; ++to_nxt)
2560     {
2561         uint8_t c1 = static_cast<uint8_t>(*frm_nxt);
2562         if (c1 < 0x80)
2563         {
2564             if (c1 > Maxcode)
2565                 return codecvt_base::error;
2566             *to_nxt = static_cast<uint16_t>(c1);
2567             ++frm_nxt;
2568         }
2569         else if (c1 < 0xC2)
2570         {
2571             return codecvt_base::error;
2572         }
2573         else if (c1 < 0xE0)
2574         {
2575             if (frm_end-frm_nxt < 2)
2576                 return codecvt_base::partial;
2577             uint8_t c2 = frm_nxt[1];
2578             if ((c2 & 0xC0) != 0x80)
2579                 return codecvt_base::error;
2580             uint16_t t = static_cast<uint16_t>(((c1 & 0x1F) << 6)
2581                                               | (c2 & 0x3F));
2582             if (t > Maxcode)
2583                 return codecvt_base::error;
2584             *to_nxt = t;
2585             frm_nxt += 2;
2586         }
2587         else if (c1 < 0xF0)
2588         {
2589             if (frm_end-frm_nxt < 3)
2590                 return codecvt_base::partial;
2591             uint8_t c2 = frm_nxt[1];
2592             uint8_t c3 = frm_nxt[2];
2593             switch (c1)
2594             {
2595             case 0xE0:
2596                 if ((c2 & 0xE0) != 0xA0)
2597                     return codecvt_base::error;
2598                  break;
2599             case 0xED:
2600                 if ((c2 & 0xE0) != 0x80)
2601                     return codecvt_base::error;
2602                  break;
2603             default:
2604                 if ((c2 & 0xC0) != 0x80)
2605                     return codecvt_base::error;
2606                  break;
2607             }
2608             if ((c3 & 0xC0) != 0x80)
2609                 return codecvt_base::error;
2610             uint16_t t = static_cast<uint16_t>(((c1 & 0x0F) << 12)
2611                                              | ((c2 & 0x3F) << 6)
2612                                              |  (c3 & 0x3F));
2613             if (t > Maxcode)
2614                 return codecvt_base::error;
2615             *to_nxt = t;
2616             frm_nxt += 3;
2617         }
2618         else
2619         {
2620             return codecvt_base::error;
2621         }
2622     }
2623     return frm_nxt < frm_end ? codecvt_base::partial : codecvt_base::ok;
2624 }
2625 
2626 static
2627 int
utf8_to_ucs2_length(const uint8_t * frm,const uint8_t * frm_end,size_t mx,unsigned long Maxcode=0x10FFFF,codecvt_mode mode=codecvt_mode (0))2628 utf8_to_ucs2_length(const uint8_t* frm, const uint8_t* frm_end,
2629                     size_t mx, unsigned long Maxcode = 0x10FFFF,
2630                     codecvt_mode mode = codecvt_mode(0))
2631 {
2632     const uint8_t* frm_nxt = frm;
2633     if (mode & consume_header)
2634     {
2635         if (frm_end-frm_nxt >= 3 && frm_nxt[0] == 0xEF && frm_nxt[1] == 0xBB &&
2636                                                           frm_nxt[2] == 0xBF)
2637             frm_nxt += 3;
2638     }
2639     for (size_t nchar32_t = 0; frm_nxt < frm_end && nchar32_t < mx; ++nchar32_t)
2640     {
2641         uint8_t c1 = static_cast<uint8_t>(*frm_nxt);
2642         if (c1 < 0x80)
2643         {
2644             if (c1 > Maxcode)
2645                 break;
2646             ++frm_nxt;
2647         }
2648         else if (c1 < 0xC2)
2649         {
2650             break;
2651         }
2652         else if (c1 < 0xE0)
2653         {
2654             if ((frm_end-frm_nxt < 2) || ((frm_nxt[1] & 0xC0) != 0x80))
2655                 break;
2656             if ((((c1 & 0x1Fu) << 6) | (frm_nxt[1] & 0x3Fu)) > Maxcode)
2657                 break;
2658             frm_nxt += 2;
2659         }
2660         else if (c1 < 0xF0)
2661         {
2662             if (frm_end-frm_nxt < 3)
2663                 break;
2664             uint8_t c2 = frm_nxt[1];
2665             uint8_t c3 = frm_nxt[2];
2666             switch (c1)
2667             {
2668             case 0xE0:
2669                 if ((c2 & 0xE0) != 0xA0)
2670                     return static_cast<int>(frm_nxt - frm);
2671                 break;
2672             case 0xED:
2673                 if ((c2 & 0xE0) != 0x80)
2674                     return static_cast<int>(frm_nxt - frm);
2675                  break;
2676             default:
2677                 if ((c2 & 0xC0) != 0x80)
2678                     return static_cast<int>(frm_nxt - frm);
2679                  break;
2680             }
2681             if ((c3 & 0xC0) != 0x80)
2682                 break;
2683             if ((((c1 & 0x0Fu) << 12) | ((c2 & 0x3Fu) << 6) | (c3 & 0x3Fu)) > Maxcode)
2684                 break;
2685             frm_nxt += 3;
2686         }
2687         else
2688         {
2689             break;
2690         }
2691     }
2692     return static_cast<int>(frm_nxt - frm);
2693 }
2694 
2695 static
2696 codecvt_base::result
ucs4_to_utf16be(const uint32_t * frm,const uint32_t * frm_end,const uint32_t * & frm_nxt,uint8_t * to,uint8_t * to_end,uint8_t * & to_nxt,unsigned long Maxcode=0x10FFFF,codecvt_mode mode=codecvt_mode (0))2697 ucs4_to_utf16be(const uint32_t* frm, const uint32_t* frm_end, const uint32_t*& frm_nxt,
2698                 uint8_t* to, uint8_t* to_end, uint8_t*& to_nxt,
2699                 unsigned long Maxcode = 0x10FFFF, codecvt_mode mode = codecvt_mode(0))
2700 {
2701     frm_nxt = frm;
2702     to_nxt = to;
2703     if (mode & generate_header)
2704     {
2705         if (to_end-to_nxt < 2)
2706             return codecvt_base::partial;
2707         *to_nxt++ = static_cast<uint8_t>(0xFE);
2708         *to_nxt++ = static_cast<uint8_t>(0xFF);
2709     }
2710     for (; frm_nxt < frm_end; ++frm_nxt)
2711     {
2712         uint32_t wc = *frm_nxt;
2713         if ((wc & 0xFFFFF800) == 0x00D800 || wc > Maxcode)
2714             return codecvt_base::error;
2715         if (wc < 0x010000)
2716         {
2717             if (to_end-to_nxt < 2)
2718                 return codecvt_base::partial;
2719             *to_nxt++ = static_cast<uint8_t>(wc >> 8);
2720             *to_nxt++ = static_cast<uint8_t>(wc);
2721         }
2722         else
2723         {
2724             if (to_end-to_nxt < 4)
2725                 return codecvt_base::partial;
2726             uint16_t t = static_cast<uint16_t>(
2727                     0xD800
2728                   | ((((wc & 0x1F0000) >> 16) - 1) << 6)
2729                   |   ((wc & 0x00FC00) >> 10));
2730             *to_nxt++ = static_cast<uint8_t>(t >> 8);
2731             *to_nxt++ = static_cast<uint8_t>(t);
2732             t = static_cast<uint16_t>(0xDC00 | (wc & 0x03FF));
2733             *to_nxt++ = static_cast<uint8_t>(t >> 8);
2734             *to_nxt++ = static_cast<uint8_t>(t);
2735         }
2736     }
2737     return codecvt_base::ok;
2738 }
2739 
2740 static
2741 codecvt_base::result
utf16be_to_ucs4(const uint8_t * frm,const uint8_t * frm_end,const uint8_t * & frm_nxt,uint32_t * to,uint32_t * to_end,uint32_t * & to_nxt,unsigned long Maxcode=0x10FFFF,codecvt_mode mode=codecvt_mode (0))2742 utf16be_to_ucs4(const uint8_t* frm, const uint8_t* frm_end, const uint8_t*& frm_nxt,
2743                 uint32_t* to, uint32_t* to_end, uint32_t*& to_nxt,
2744                 unsigned long Maxcode = 0x10FFFF, codecvt_mode mode = codecvt_mode(0))
2745 {
2746     frm_nxt = frm;
2747     to_nxt = to;
2748     if (mode & consume_header)
2749     {
2750         if (frm_end-frm_nxt >= 2 && frm_nxt[0] == 0xFE && frm_nxt[1] == 0xFF)
2751             frm_nxt += 2;
2752     }
2753     for (; frm_nxt < frm_end - 1 && to_nxt < to_end; ++to_nxt)
2754     {
2755         uint16_t c1 = static_cast<uint16_t>(frm_nxt[0] << 8 | frm_nxt[1]);
2756         if ((c1 & 0xFC00) == 0xDC00)
2757             return codecvt_base::error;
2758         if ((c1 & 0xFC00) != 0xD800)
2759         {
2760             if (c1 > Maxcode)
2761                 return codecvt_base::error;
2762             *to_nxt = static_cast<uint32_t>(c1);
2763             frm_nxt += 2;
2764         }
2765         else
2766         {
2767             if (frm_end-frm_nxt < 4)
2768                 return codecvt_base::partial;
2769             uint16_t c2 = static_cast<uint16_t>(frm_nxt[2] << 8 | frm_nxt[3]);
2770             if ((c2 & 0xFC00) != 0xDC00)
2771                 return codecvt_base::error;
2772             uint32_t t = static_cast<uint32_t>(
2773                     ((((c1 & 0x03C0) >> 6) + 1) << 16)
2774                   |   ((c1 & 0x003F) << 10)
2775                   |    (c2 & 0x03FF));
2776             if (t > Maxcode)
2777                 return codecvt_base::error;
2778             *to_nxt = t;
2779             frm_nxt += 4;
2780         }
2781     }
2782     return frm_nxt < frm_end ? codecvt_base::partial : codecvt_base::ok;
2783 }
2784 
2785 static
2786 int
utf16be_to_ucs4_length(const uint8_t * frm,const uint8_t * frm_end,size_t mx,unsigned long Maxcode=0x10FFFF,codecvt_mode mode=codecvt_mode (0))2787 utf16be_to_ucs4_length(const uint8_t* frm, const uint8_t* frm_end,
2788                        size_t mx, unsigned long Maxcode = 0x10FFFF,
2789                        codecvt_mode mode = codecvt_mode(0))
2790 {
2791     const uint8_t* frm_nxt = frm;
2792     if (mode & consume_header)
2793     {
2794         if (frm_end-frm_nxt >= 2 && frm_nxt[0] == 0xFE && frm_nxt[1] == 0xFF)
2795             frm_nxt += 2;
2796     }
2797     for (size_t nchar32_t = 0; frm_nxt < frm_end - 1 && nchar32_t < mx; ++nchar32_t)
2798     {
2799         uint16_t c1 = static_cast<uint16_t>(frm_nxt[0] << 8 | frm_nxt[1]);
2800         if ((c1 & 0xFC00) == 0xDC00)
2801             break;
2802         if ((c1 & 0xFC00) != 0xD800)
2803         {
2804             if (c1 > Maxcode)
2805                 break;
2806             frm_nxt += 2;
2807         }
2808         else
2809         {
2810             if (frm_end-frm_nxt < 4)
2811                 break;
2812             uint16_t c2 = static_cast<uint16_t>(frm_nxt[2] << 8 | frm_nxt[3]);
2813             if ((c2 & 0xFC00) != 0xDC00)
2814                 break;
2815             uint32_t t = static_cast<uint32_t>(
2816                     ((((c1 & 0x03C0) >> 6) + 1) << 16)
2817                   |   ((c1 & 0x003F) << 10)
2818                   |    (c2 & 0x03FF));
2819             if (t > Maxcode)
2820                 break;
2821             frm_nxt += 4;
2822         }
2823     }
2824     return static_cast<int>(frm_nxt - frm);
2825 }
2826 
2827 static
2828 codecvt_base::result
ucs4_to_utf16le(const uint32_t * frm,const uint32_t * frm_end,const uint32_t * & frm_nxt,uint8_t * to,uint8_t * to_end,uint8_t * & to_nxt,unsigned long Maxcode=0x10FFFF,codecvt_mode mode=codecvt_mode (0))2829 ucs4_to_utf16le(const uint32_t* frm, const uint32_t* frm_end, const uint32_t*& frm_nxt,
2830                 uint8_t* to, uint8_t* to_end, uint8_t*& to_nxt,
2831                 unsigned long Maxcode = 0x10FFFF, codecvt_mode mode = codecvt_mode(0))
2832 {
2833     frm_nxt = frm;
2834     to_nxt = to;
2835     if (mode & generate_header)
2836     {
2837         if (to_end - to_nxt < 2)
2838             return codecvt_base::partial;
2839         *to_nxt++ = static_cast<uint8_t>(0xFF);
2840         *to_nxt++ = static_cast<uint8_t>(0xFE);
2841     }
2842     for (; frm_nxt < frm_end; ++frm_nxt)
2843     {
2844         uint32_t wc = *frm_nxt;
2845         if ((wc & 0xFFFFF800) == 0x00D800 || wc > Maxcode)
2846             return codecvt_base::error;
2847         if (wc < 0x010000)
2848         {
2849             if (to_end-to_nxt < 2)
2850                 return codecvt_base::partial;
2851             *to_nxt++ = static_cast<uint8_t>(wc);
2852             *to_nxt++ = static_cast<uint8_t>(wc >> 8);
2853         }
2854         else
2855         {
2856             if (to_end-to_nxt < 4)
2857                 return codecvt_base::partial;
2858             uint16_t t = static_cast<uint16_t>(
2859                     0xD800
2860                   | ((((wc & 0x1F0000) >> 16) - 1) << 6)
2861                   |   ((wc & 0x00FC00) >> 10));
2862             *to_nxt++ = static_cast<uint8_t>(t);
2863             *to_nxt++ = static_cast<uint8_t>(t >> 8);
2864             t = static_cast<uint16_t>(0xDC00 | (wc & 0x03FF));
2865             *to_nxt++ = static_cast<uint8_t>(t);
2866             *to_nxt++ = static_cast<uint8_t>(t >> 8);
2867         }
2868     }
2869     return codecvt_base::ok;
2870 }
2871 
2872 static
2873 codecvt_base::result
utf16le_to_ucs4(const uint8_t * frm,const uint8_t * frm_end,const uint8_t * & frm_nxt,uint32_t * to,uint32_t * to_end,uint32_t * & to_nxt,unsigned long Maxcode=0x10FFFF,codecvt_mode mode=codecvt_mode (0))2874 utf16le_to_ucs4(const uint8_t* frm, const uint8_t* frm_end, const uint8_t*& frm_nxt,
2875                 uint32_t* to, uint32_t* to_end, uint32_t*& to_nxt,
2876                 unsigned long Maxcode = 0x10FFFF, codecvt_mode mode = codecvt_mode(0))
2877 {
2878     frm_nxt = frm;
2879     to_nxt = to;
2880     if (mode & consume_header)
2881     {
2882         if (frm_end-frm_nxt >= 2 && frm_nxt[0] == 0xFF && frm_nxt[1] == 0xFE)
2883             frm_nxt += 2;
2884     }
2885     for (; frm_nxt < frm_end - 1 && to_nxt < to_end; ++to_nxt)
2886     {
2887         uint16_t c1 = static_cast<uint16_t>(frm_nxt[1] << 8 | frm_nxt[0]);
2888         if ((c1 & 0xFC00) == 0xDC00)
2889             return codecvt_base::error;
2890         if ((c1 & 0xFC00) != 0xD800)
2891         {
2892             if (c1 > Maxcode)
2893                 return codecvt_base::error;
2894             *to_nxt = static_cast<uint32_t>(c1);
2895             frm_nxt += 2;
2896         }
2897         else
2898         {
2899             if (frm_end-frm_nxt < 4)
2900                 return codecvt_base::partial;
2901             uint16_t c2 = static_cast<uint16_t>(frm_nxt[3] << 8 | frm_nxt[2]);
2902             if ((c2 & 0xFC00) != 0xDC00)
2903                 return codecvt_base::error;
2904             uint32_t t = static_cast<uint32_t>(
2905                     ((((c1 & 0x03C0) >> 6) + 1) << 16)
2906                   |   ((c1 & 0x003F) << 10)
2907                   |    (c2 & 0x03FF));
2908             if (t > Maxcode)
2909                 return codecvt_base::error;
2910             *to_nxt = t;
2911             frm_nxt += 4;
2912         }
2913     }
2914     return frm_nxt < frm_end ? codecvt_base::partial : codecvt_base::ok;
2915 }
2916 
2917 static
2918 int
utf16le_to_ucs4_length(const uint8_t * frm,const uint8_t * frm_end,size_t mx,unsigned long Maxcode=0x10FFFF,codecvt_mode mode=codecvt_mode (0))2919 utf16le_to_ucs4_length(const uint8_t* frm, const uint8_t* frm_end,
2920                        size_t mx, unsigned long Maxcode = 0x10FFFF,
2921                        codecvt_mode mode = codecvt_mode(0))
2922 {
2923     const uint8_t* frm_nxt = frm;
2924     if (mode & consume_header)
2925     {
2926         if (frm_end-frm_nxt >= 2 && frm_nxt[0] == 0xFF && frm_nxt[1] == 0xFE)
2927             frm_nxt += 2;
2928     }
2929     for (size_t nchar32_t = 0; frm_nxt < frm_end - 1 && nchar32_t < mx; ++nchar32_t)
2930     {
2931         uint16_t c1 = static_cast<uint16_t>(frm_nxt[1] << 8 | frm_nxt[0]);
2932         if ((c1 & 0xFC00) == 0xDC00)
2933             break;
2934         if ((c1 & 0xFC00) != 0xD800)
2935         {
2936             if (c1 > Maxcode)
2937                 break;
2938             frm_nxt += 2;
2939         }
2940         else
2941         {
2942             if (frm_end-frm_nxt < 4)
2943                 break;
2944             uint16_t c2 = static_cast<uint16_t>(frm_nxt[3] << 8 | frm_nxt[2]);
2945             if ((c2 & 0xFC00) != 0xDC00)
2946                 break;
2947             uint32_t t = static_cast<uint32_t>(
2948                     ((((c1 & 0x03C0) >> 6) + 1) << 16)
2949                   |   ((c1 & 0x003F) << 10)
2950                   |    (c2 & 0x03FF));
2951             if (t > Maxcode)
2952                 break;
2953             frm_nxt += 4;
2954         }
2955     }
2956     return static_cast<int>(frm_nxt - frm);
2957 }
2958 
2959 static
2960 codecvt_base::result
ucs2_to_utf16be(const uint16_t * frm,const uint16_t * frm_end,const uint16_t * & frm_nxt,uint8_t * to,uint8_t * to_end,uint8_t * & to_nxt,unsigned long Maxcode=0x10FFFF,codecvt_mode mode=codecvt_mode (0))2961 ucs2_to_utf16be(const uint16_t* frm, const uint16_t* frm_end, const uint16_t*& frm_nxt,
2962                 uint8_t* to, uint8_t* to_end, uint8_t*& to_nxt,
2963                 unsigned long Maxcode = 0x10FFFF, codecvt_mode mode = codecvt_mode(0))
2964 {
2965     frm_nxt = frm;
2966     to_nxt = to;
2967     if (mode & generate_header)
2968     {
2969         if (to_end-to_nxt < 2)
2970             return codecvt_base::partial;
2971         *to_nxt++ = static_cast<uint8_t>(0xFE);
2972         *to_nxt++ = static_cast<uint8_t>(0xFF);
2973     }
2974     for (; frm_nxt < frm_end; ++frm_nxt)
2975     {
2976         uint16_t wc = *frm_nxt;
2977         if ((wc & 0xF800) == 0xD800 || wc > Maxcode)
2978             return codecvt_base::error;
2979         if (to_end-to_nxt < 2)
2980             return codecvt_base::partial;
2981         *to_nxt++ = static_cast<uint8_t>(wc >> 8);
2982         *to_nxt++ = static_cast<uint8_t>(wc);
2983     }
2984     return codecvt_base::ok;
2985 }
2986 
2987 static
2988 codecvt_base::result
utf16be_to_ucs2(const uint8_t * frm,const uint8_t * frm_end,const uint8_t * & frm_nxt,uint16_t * to,uint16_t * to_end,uint16_t * & to_nxt,unsigned long Maxcode=0x10FFFF,codecvt_mode mode=codecvt_mode (0))2989 utf16be_to_ucs2(const uint8_t* frm, const uint8_t* frm_end, const uint8_t*& frm_nxt,
2990                 uint16_t* to, uint16_t* to_end, uint16_t*& to_nxt,
2991                 unsigned long Maxcode = 0x10FFFF, codecvt_mode mode = codecvt_mode(0))
2992 {
2993     frm_nxt = frm;
2994     to_nxt = to;
2995     if (mode & consume_header)
2996     {
2997         if (frm_end-frm_nxt >= 2 && frm_nxt[0] == 0xFE && frm_nxt[1] == 0xFF)
2998             frm_nxt += 2;
2999     }
3000     for (; frm_nxt < frm_end - 1 && to_nxt < to_end; ++to_nxt)
3001     {
3002         uint16_t c1 = static_cast<uint16_t>(frm_nxt[0] << 8 | frm_nxt[1]);
3003         if ((c1 & 0xF800) == 0xD800 || c1 > Maxcode)
3004             return codecvt_base::error;
3005         *to_nxt = c1;
3006         frm_nxt += 2;
3007     }
3008     return frm_nxt < frm_end ? codecvt_base::partial : codecvt_base::ok;
3009 }
3010 
3011 static
3012 int
utf16be_to_ucs2_length(const uint8_t * frm,const uint8_t * frm_end,size_t mx,unsigned long Maxcode=0x10FFFF,codecvt_mode mode=codecvt_mode (0))3013 utf16be_to_ucs2_length(const uint8_t* frm, const uint8_t* frm_end,
3014                        size_t mx, unsigned long Maxcode = 0x10FFFF,
3015                        codecvt_mode mode = codecvt_mode(0))
3016 {
3017     const uint8_t* frm_nxt = frm;
3018     if (mode & consume_header)
3019     {
3020         if (frm_end-frm_nxt >= 2 && frm_nxt[0] == 0xFE && frm_nxt[1] == 0xFF)
3021             frm_nxt += 2;
3022     }
3023     for (size_t nchar16_t = 0; frm_nxt < frm_end - 1 && nchar16_t < mx; ++nchar16_t)
3024     {
3025         uint16_t c1 = static_cast<uint16_t>(frm_nxt[0] << 8 | frm_nxt[1]);
3026         if ((c1 & 0xF800) == 0xD800 || c1 > Maxcode)
3027             break;
3028         frm_nxt += 2;
3029     }
3030     return static_cast<int>(frm_nxt - frm);
3031 }
3032 
3033 static
3034 codecvt_base::result
ucs2_to_utf16le(const uint16_t * frm,const uint16_t * frm_end,const uint16_t * & frm_nxt,uint8_t * to,uint8_t * to_end,uint8_t * & to_nxt,unsigned long Maxcode=0x10FFFF,codecvt_mode mode=codecvt_mode (0))3035 ucs2_to_utf16le(const uint16_t* frm, const uint16_t* frm_end, const uint16_t*& frm_nxt,
3036                 uint8_t* to, uint8_t* to_end, uint8_t*& to_nxt,
3037                 unsigned long Maxcode = 0x10FFFF, codecvt_mode mode = codecvt_mode(0))
3038 {
3039     frm_nxt = frm;
3040     to_nxt = to;
3041     if (mode & generate_header)
3042     {
3043         if (to_end-to_nxt < 2)
3044             return codecvt_base::partial;
3045         *to_nxt++ = static_cast<uint8_t>(0xFF);
3046         *to_nxt++ = static_cast<uint8_t>(0xFE);
3047     }
3048     for (; frm_nxt < frm_end; ++frm_nxt)
3049     {
3050         uint16_t wc = *frm_nxt;
3051         if ((wc & 0xF800) == 0xD800 || wc > Maxcode)
3052             return codecvt_base::error;
3053         if (to_end-to_nxt < 2)
3054             return codecvt_base::partial;
3055         *to_nxt++ = static_cast<uint8_t>(wc);
3056         *to_nxt++ = static_cast<uint8_t>(wc >> 8);
3057     }
3058     return codecvt_base::ok;
3059 }
3060 
3061 static
3062 codecvt_base::result
utf16le_to_ucs2(const uint8_t * frm,const uint8_t * frm_end,const uint8_t * & frm_nxt,uint16_t * to,uint16_t * to_end,uint16_t * & to_nxt,unsigned long Maxcode=0x10FFFF,codecvt_mode mode=codecvt_mode (0))3063 utf16le_to_ucs2(const uint8_t* frm, const uint8_t* frm_end, const uint8_t*& frm_nxt,
3064                 uint16_t* to, uint16_t* to_end, uint16_t*& to_nxt,
3065                 unsigned long Maxcode = 0x10FFFF, codecvt_mode mode = codecvt_mode(0))
3066 {
3067     frm_nxt = frm;
3068     to_nxt = to;
3069     if (mode & consume_header)
3070     {
3071         if (frm_end-frm_nxt >= 2 && frm_nxt[0] == 0xFF && frm_nxt[1] == 0xFE)
3072             frm_nxt += 2;
3073     }
3074     for (; frm_nxt < frm_end - 1 && to_nxt < to_end; ++to_nxt)
3075     {
3076         uint16_t c1 = static_cast<uint16_t>(frm_nxt[1] << 8 | frm_nxt[0]);
3077         if ((c1 & 0xF800) == 0xD800 || c1 > Maxcode)
3078             return codecvt_base::error;
3079         *to_nxt = c1;
3080         frm_nxt += 2;
3081     }
3082     return frm_nxt < frm_end ? codecvt_base::partial : codecvt_base::ok;
3083 }
3084 
3085 static
3086 int
utf16le_to_ucs2_length(const uint8_t * frm,const uint8_t * frm_end,size_t mx,unsigned long Maxcode=0x10FFFF,codecvt_mode mode=codecvt_mode (0))3087 utf16le_to_ucs2_length(const uint8_t* frm, const uint8_t* frm_end,
3088                        size_t mx, unsigned long Maxcode = 0x10FFFF,
3089                        codecvt_mode mode = codecvt_mode(0))
3090 {
3091     const uint8_t* frm_nxt = frm;
3092     frm_nxt = frm;
3093     if (mode & consume_header)
3094     {
3095         if (frm_end-frm_nxt >= 2 && frm_nxt[0] == 0xFF && frm_nxt[1] == 0xFE)
3096             frm_nxt += 2;
3097     }
3098     for (size_t nchar16_t = 0; frm_nxt < frm_end - 1 && nchar16_t < mx; ++nchar16_t)
3099     {
3100         uint16_t c1 = static_cast<uint16_t>(frm_nxt[1] << 8 | frm_nxt[0]);
3101         if ((c1 & 0xF800) == 0xD800 || c1 > Maxcode)
3102             break;
3103         frm_nxt += 2;
3104     }
3105     return static_cast<int>(frm_nxt - frm);
3106 }
3107 
3108 // template <> class codecvt<char16_t, char, mbstate_t>
3109 
3110 locale::id codecvt<char16_t, char, mbstate_t>::id;
3111 
~codecvt()3112 codecvt<char16_t, char, mbstate_t>::~codecvt()
3113 {
3114 }
3115 
3116 codecvt<char16_t, char, mbstate_t>::result
do_out(state_type &,const intern_type * frm,const intern_type * frm_end,const intern_type * & frm_nxt,extern_type * to,extern_type * to_end,extern_type * & to_nxt) const3117 codecvt<char16_t, char, mbstate_t>::do_out(state_type&,
3118     const intern_type* frm, const intern_type* frm_end, const intern_type*& frm_nxt,
3119     extern_type* to, extern_type* to_end, extern_type*& to_nxt) const
3120 {
3121     const uint16_t* _frm = reinterpret_cast<const uint16_t*>(frm);
3122     const uint16_t* _frm_end = reinterpret_cast<const uint16_t*>(frm_end);
3123     const uint16_t* _frm_nxt = _frm;
3124     uint8_t* _to = reinterpret_cast<uint8_t*>(to);
3125     uint8_t* _to_end = reinterpret_cast<uint8_t*>(to_end);
3126     uint8_t* _to_nxt = _to;
3127     result r = utf16_to_utf8(_frm, _frm_end, _frm_nxt, _to, _to_end, _to_nxt);
3128     frm_nxt = frm + (_frm_nxt - _frm);
3129     to_nxt = to + (_to_nxt - _to);
3130     return r;
3131 }
3132 
3133 codecvt<char16_t, char, mbstate_t>::result
do_in(state_type &,const extern_type * frm,const extern_type * frm_end,const extern_type * & frm_nxt,intern_type * to,intern_type * to_end,intern_type * & to_nxt) const3134 codecvt<char16_t, char, mbstate_t>::do_in(state_type&,
3135     const extern_type* frm, const extern_type* frm_end, const extern_type*& frm_nxt,
3136     intern_type* to, intern_type* to_end, intern_type*& to_nxt) const
3137 {
3138     const uint8_t* _frm = reinterpret_cast<const uint8_t*>(frm);
3139     const uint8_t* _frm_end = reinterpret_cast<const uint8_t*>(frm_end);
3140     const uint8_t* _frm_nxt = _frm;
3141     uint16_t* _to = reinterpret_cast<uint16_t*>(to);
3142     uint16_t* _to_end = reinterpret_cast<uint16_t*>(to_end);
3143     uint16_t* _to_nxt = _to;
3144     result r = utf8_to_utf16(_frm, _frm_end, _frm_nxt, _to, _to_end, _to_nxt);
3145     frm_nxt = frm + (_frm_nxt - _frm);
3146     to_nxt = to + (_to_nxt - _to);
3147     return r;
3148 }
3149 
3150 codecvt<char16_t, char, mbstate_t>::result
do_unshift(state_type &,extern_type * to,extern_type *,extern_type * & to_nxt) const3151 codecvt<char16_t, char, mbstate_t>::do_unshift(state_type&,
3152     extern_type* to, extern_type*, extern_type*& to_nxt) const
3153 {
3154     to_nxt = to;
3155     return noconv;
3156 }
3157 
3158 int
do_encoding() const3159 codecvt<char16_t, char, mbstate_t>::do_encoding() const  _NOEXCEPT
3160 {
3161     return 0;
3162 }
3163 
3164 bool
do_always_noconv() const3165 codecvt<char16_t, char, mbstate_t>::do_always_noconv() const  _NOEXCEPT
3166 {
3167     return false;
3168 }
3169 
3170 int
do_length(state_type &,const extern_type * frm,const extern_type * frm_end,size_t mx) const3171 codecvt<char16_t, char, mbstate_t>::do_length(state_type&,
3172     const extern_type* frm, const extern_type* frm_end, size_t mx) const
3173 {
3174     const uint8_t* _frm = reinterpret_cast<const uint8_t*>(frm);
3175     const uint8_t* _frm_end = reinterpret_cast<const uint8_t*>(frm_end);
3176     return utf8_to_utf16_length(_frm, _frm_end, mx);
3177 }
3178 
3179 int
do_max_length() const3180 codecvt<char16_t, char, mbstate_t>::do_max_length() const  _NOEXCEPT
3181 {
3182     return 4;
3183 }
3184 
3185 // template <> class codecvt<char32_t, char, mbstate_t>
3186 
3187 locale::id codecvt<char32_t, char, mbstate_t>::id;
3188 
~codecvt()3189 codecvt<char32_t, char, mbstate_t>::~codecvt()
3190 {
3191 }
3192 
3193 codecvt<char32_t, char, mbstate_t>::result
do_out(state_type &,const intern_type * frm,const intern_type * frm_end,const intern_type * & frm_nxt,extern_type * to,extern_type * to_end,extern_type * & to_nxt) const3194 codecvt<char32_t, char, mbstate_t>::do_out(state_type&,
3195     const intern_type* frm, const intern_type* frm_end, const intern_type*& frm_nxt,
3196     extern_type* to, extern_type* to_end, extern_type*& to_nxt) const
3197 {
3198     const uint32_t* _frm = reinterpret_cast<const uint32_t*>(frm);
3199     const uint32_t* _frm_end = reinterpret_cast<const uint32_t*>(frm_end);
3200     const uint32_t* _frm_nxt = _frm;
3201     uint8_t* _to = reinterpret_cast<uint8_t*>(to);
3202     uint8_t* _to_end = reinterpret_cast<uint8_t*>(to_end);
3203     uint8_t* _to_nxt = _to;
3204     result r = ucs4_to_utf8(_frm, _frm_end, _frm_nxt, _to, _to_end, _to_nxt);
3205     frm_nxt = frm + (_frm_nxt - _frm);
3206     to_nxt = to + (_to_nxt - _to);
3207     return r;
3208 }
3209 
3210 codecvt<char32_t, char, mbstate_t>::result
do_in(state_type &,const extern_type * frm,const extern_type * frm_end,const extern_type * & frm_nxt,intern_type * to,intern_type * to_end,intern_type * & to_nxt) const3211 codecvt<char32_t, char, mbstate_t>::do_in(state_type&,
3212     const extern_type* frm, const extern_type* frm_end, const extern_type*& frm_nxt,
3213     intern_type* to, intern_type* to_end, intern_type*& to_nxt) const
3214 {
3215     const uint8_t* _frm = reinterpret_cast<const uint8_t*>(frm);
3216     const uint8_t* _frm_end = reinterpret_cast<const uint8_t*>(frm_end);
3217     const uint8_t* _frm_nxt = _frm;
3218     uint32_t* _to = reinterpret_cast<uint32_t*>(to);
3219     uint32_t* _to_end = reinterpret_cast<uint32_t*>(to_end);
3220     uint32_t* _to_nxt = _to;
3221     result r = utf8_to_ucs4(_frm, _frm_end, _frm_nxt, _to, _to_end, _to_nxt);
3222     frm_nxt = frm + (_frm_nxt - _frm);
3223     to_nxt = to + (_to_nxt - _to);
3224     return r;
3225 }
3226 
3227 codecvt<char32_t, char, mbstate_t>::result
do_unshift(state_type &,extern_type * to,extern_type *,extern_type * & to_nxt) const3228 codecvt<char32_t, char, mbstate_t>::do_unshift(state_type&,
3229     extern_type* to, extern_type*, extern_type*& to_nxt) const
3230 {
3231     to_nxt = to;
3232     return noconv;
3233 }
3234 
3235 int
do_encoding() const3236 codecvt<char32_t, char, mbstate_t>::do_encoding() const  _NOEXCEPT
3237 {
3238     return 0;
3239 }
3240 
3241 bool
do_always_noconv() const3242 codecvt<char32_t, char, mbstate_t>::do_always_noconv() const  _NOEXCEPT
3243 {
3244     return false;
3245 }
3246 
3247 int
do_length(state_type &,const extern_type * frm,const extern_type * frm_end,size_t mx) const3248 codecvt<char32_t, char, mbstate_t>::do_length(state_type&,
3249     const extern_type* frm, const extern_type* frm_end, size_t mx) const
3250 {
3251     const uint8_t* _frm = reinterpret_cast<const uint8_t*>(frm);
3252     const uint8_t* _frm_end = reinterpret_cast<const uint8_t*>(frm_end);
3253     return utf8_to_ucs4_length(_frm, _frm_end, mx);
3254 }
3255 
3256 int
do_max_length() const3257 codecvt<char32_t, char, mbstate_t>::do_max_length() const  _NOEXCEPT
3258 {
3259     return 4;
3260 }
3261 
3262 // __codecvt_utf8<wchar_t>
3263 
3264 __codecvt_utf8<wchar_t>::result
do_out(state_type &,const intern_type * frm,const intern_type * frm_end,const intern_type * & frm_nxt,extern_type * to,extern_type * to_end,extern_type * & to_nxt) const3265 __codecvt_utf8<wchar_t>::do_out(state_type&,
3266     const intern_type* frm, const intern_type* frm_end, const intern_type*& frm_nxt,
3267     extern_type* to, extern_type* to_end, extern_type*& to_nxt) const
3268 {
3269 #if defined(_LIBCPP_SHORT_WCHAR)
3270     const uint16_t* _frm = reinterpret_cast<const uint16_t*>(frm);
3271     const uint16_t* _frm_end = reinterpret_cast<const uint16_t*>(frm_end);
3272     const uint16_t* _frm_nxt = _frm;
3273 #else
3274     const uint32_t* _frm = reinterpret_cast<const uint32_t*>(frm);
3275     const uint32_t* _frm_end = reinterpret_cast<const uint32_t*>(frm_end);
3276     const uint32_t* _frm_nxt = _frm;
3277 #endif
3278     uint8_t* _to = reinterpret_cast<uint8_t*>(to);
3279     uint8_t* _to_end = reinterpret_cast<uint8_t*>(to_end);
3280     uint8_t* _to_nxt = _to;
3281 #if defined(_LIBCPP_SHORT_WCHAR)
3282     result r = ucs2_to_utf8(_frm, _frm_end, _frm_nxt, _to, _to_end, _to_nxt,
3283                             _Maxcode_, _Mode_);
3284 #else
3285     result r = ucs4_to_utf8(_frm, _frm_end, _frm_nxt, _to, _to_end, _to_nxt,
3286                             _Maxcode_, _Mode_);
3287 #endif
3288     frm_nxt = frm + (_frm_nxt - _frm);
3289     to_nxt = to + (_to_nxt - _to);
3290     return r;
3291 }
3292 
3293 __codecvt_utf8<wchar_t>::result
do_in(state_type &,const extern_type * frm,const extern_type * frm_end,const extern_type * & frm_nxt,intern_type * to,intern_type * to_end,intern_type * & to_nxt) const3294 __codecvt_utf8<wchar_t>::do_in(state_type&,
3295     const extern_type* frm, const extern_type* frm_end, const extern_type*& frm_nxt,
3296     intern_type* to, intern_type* to_end, intern_type*& to_nxt) const
3297 {
3298     const uint8_t* _frm = reinterpret_cast<const uint8_t*>(frm);
3299     const uint8_t* _frm_end = reinterpret_cast<const uint8_t*>(frm_end);
3300     const uint8_t* _frm_nxt = _frm;
3301 #if defined(_LIBCPP_SHORT_WCHAR)
3302     uint16_t* _to = reinterpret_cast<uint16_t*>(to);
3303     uint16_t* _to_end = reinterpret_cast<uint16_t*>(to_end);
3304     uint16_t* _to_nxt = _to;
3305     result r = utf8_to_ucs2(_frm, _frm_end, _frm_nxt, _to, _to_end, _to_nxt,
3306                             _Maxcode_, _Mode_);
3307 #else
3308     uint32_t* _to = reinterpret_cast<uint32_t*>(to);
3309     uint32_t* _to_end = reinterpret_cast<uint32_t*>(to_end);
3310     uint32_t* _to_nxt = _to;
3311     result r = utf8_to_ucs4(_frm, _frm_end, _frm_nxt, _to, _to_end, _to_nxt,
3312                             _Maxcode_, _Mode_);
3313 #endif
3314     frm_nxt = frm + (_frm_nxt - _frm);
3315     to_nxt = to + (_to_nxt - _to);
3316     return r;
3317 }
3318 
3319 __codecvt_utf8<wchar_t>::result
do_unshift(state_type &,extern_type * to,extern_type *,extern_type * & to_nxt) const3320 __codecvt_utf8<wchar_t>::do_unshift(state_type&,
3321     extern_type* to, extern_type*, extern_type*& to_nxt) const
3322 {
3323     to_nxt = to;
3324     return noconv;
3325 }
3326 
3327 int
do_encoding() const3328 __codecvt_utf8<wchar_t>::do_encoding() const  _NOEXCEPT
3329 {
3330     return 0;
3331 }
3332 
3333 bool
do_always_noconv() const3334 __codecvt_utf8<wchar_t>::do_always_noconv() const  _NOEXCEPT
3335 {
3336     return false;
3337 }
3338 
3339 int
do_length(state_type &,const extern_type * frm,const extern_type * frm_end,size_t mx) const3340 __codecvt_utf8<wchar_t>::do_length(state_type&,
3341     const extern_type* frm, const extern_type* frm_end, size_t mx) const
3342 {
3343     const uint8_t* _frm = reinterpret_cast<const uint8_t*>(frm);
3344     const uint8_t* _frm_end = reinterpret_cast<const uint8_t*>(frm_end);
3345     return utf8_to_ucs4_length(_frm, _frm_end, mx, _Maxcode_, _Mode_);
3346 }
3347 
3348 int
do_max_length() const3349 __codecvt_utf8<wchar_t>::do_max_length() const  _NOEXCEPT
3350 {
3351     if (_Mode_ & consume_header)
3352         return 7;
3353     return 4;
3354 }
3355 
3356 // __codecvt_utf8<char16_t>
3357 
3358 __codecvt_utf8<char16_t>::result
do_out(state_type &,const intern_type * frm,const intern_type * frm_end,const intern_type * & frm_nxt,extern_type * to,extern_type * to_end,extern_type * & to_nxt) const3359 __codecvt_utf8<char16_t>::do_out(state_type&,
3360     const intern_type* frm, const intern_type* frm_end, const intern_type*& frm_nxt,
3361     extern_type* to, extern_type* to_end, extern_type*& to_nxt) const
3362 {
3363     const uint16_t* _frm = reinterpret_cast<const uint16_t*>(frm);
3364     const uint16_t* _frm_end = reinterpret_cast<const uint16_t*>(frm_end);
3365     const uint16_t* _frm_nxt = _frm;
3366     uint8_t* _to = reinterpret_cast<uint8_t*>(to);
3367     uint8_t* _to_end = reinterpret_cast<uint8_t*>(to_end);
3368     uint8_t* _to_nxt = _to;
3369     result r = ucs2_to_utf8(_frm, _frm_end, _frm_nxt, _to, _to_end, _to_nxt,
3370                             _Maxcode_, _Mode_);
3371     frm_nxt = frm + (_frm_nxt - _frm);
3372     to_nxt = to + (_to_nxt - _to);
3373     return r;
3374 }
3375 
3376 __codecvt_utf8<char16_t>::result
do_in(state_type &,const extern_type * frm,const extern_type * frm_end,const extern_type * & frm_nxt,intern_type * to,intern_type * to_end,intern_type * & to_nxt) const3377 __codecvt_utf8<char16_t>::do_in(state_type&,
3378     const extern_type* frm, const extern_type* frm_end, const extern_type*& frm_nxt,
3379     intern_type* to, intern_type* to_end, intern_type*& to_nxt) const
3380 {
3381     const uint8_t* _frm = reinterpret_cast<const uint8_t*>(frm);
3382     const uint8_t* _frm_end = reinterpret_cast<const uint8_t*>(frm_end);
3383     const uint8_t* _frm_nxt = _frm;
3384     uint16_t* _to = reinterpret_cast<uint16_t*>(to);
3385     uint16_t* _to_end = reinterpret_cast<uint16_t*>(to_end);
3386     uint16_t* _to_nxt = _to;
3387     result r = utf8_to_ucs2(_frm, _frm_end, _frm_nxt, _to, _to_end, _to_nxt,
3388                             _Maxcode_, _Mode_);
3389     frm_nxt = frm + (_frm_nxt - _frm);
3390     to_nxt = to + (_to_nxt - _to);
3391     return r;
3392 }
3393 
3394 __codecvt_utf8<char16_t>::result
do_unshift(state_type &,extern_type * to,extern_type *,extern_type * & to_nxt) const3395 __codecvt_utf8<char16_t>::do_unshift(state_type&,
3396     extern_type* to, extern_type*, extern_type*& to_nxt) const
3397 {
3398     to_nxt = to;
3399     return noconv;
3400 }
3401 
3402 int
do_encoding() const3403 __codecvt_utf8<char16_t>::do_encoding() const  _NOEXCEPT
3404 {
3405     return 0;
3406 }
3407 
3408 bool
do_always_noconv() const3409 __codecvt_utf8<char16_t>::do_always_noconv() const  _NOEXCEPT
3410 {
3411     return false;
3412 }
3413 
3414 int
do_length(state_type &,const extern_type * frm,const extern_type * frm_end,size_t mx) const3415 __codecvt_utf8<char16_t>::do_length(state_type&,
3416     const extern_type* frm, const extern_type* frm_end, size_t mx) const
3417 {
3418     const uint8_t* _frm = reinterpret_cast<const uint8_t*>(frm);
3419     const uint8_t* _frm_end = reinterpret_cast<const uint8_t*>(frm_end);
3420     return utf8_to_ucs2_length(_frm, _frm_end, mx, _Maxcode_, _Mode_);
3421 }
3422 
3423 int
do_max_length() const3424 __codecvt_utf8<char16_t>::do_max_length() const  _NOEXCEPT
3425 {
3426     if (_Mode_ & consume_header)
3427         return 6;
3428     return 3;
3429 }
3430 
3431 // __codecvt_utf8<char32_t>
3432 
3433 __codecvt_utf8<char32_t>::result
do_out(state_type &,const intern_type * frm,const intern_type * frm_end,const intern_type * & frm_nxt,extern_type * to,extern_type * to_end,extern_type * & to_nxt) const3434 __codecvt_utf8<char32_t>::do_out(state_type&,
3435     const intern_type* frm, const intern_type* frm_end, const intern_type*& frm_nxt,
3436     extern_type* to, extern_type* to_end, extern_type*& to_nxt) const
3437 {
3438     const uint32_t* _frm = reinterpret_cast<const uint32_t*>(frm);
3439     const uint32_t* _frm_end = reinterpret_cast<const uint32_t*>(frm_end);
3440     const uint32_t* _frm_nxt = _frm;
3441     uint8_t* _to = reinterpret_cast<uint8_t*>(to);
3442     uint8_t* _to_end = reinterpret_cast<uint8_t*>(to_end);
3443     uint8_t* _to_nxt = _to;
3444     result r = ucs4_to_utf8(_frm, _frm_end, _frm_nxt, _to, _to_end, _to_nxt,
3445                             _Maxcode_, _Mode_);
3446     frm_nxt = frm + (_frm_nxt - _frm);
3447     to_nxt = to + (_to_nxt - _to);
3448     return r;
3449 }
3450 
3451 __codecvt_utf8<char32_t>::result
do_in(state_type &,const extern_type * frm,const extern_type * frm_end,const extern_type * & frm_nxt,intern_type * to,intern_type * to_end,intern_type * & to_nxt) const3452 __codecvt_utf8<char32_t>::do_in(state_type&,
3453     const extern_type* frm, const extern_type* frm_end, const extern_type*& frm_nxt,
3454     intern_type* to, intern_type* to_end, intern_type*& to_nxt) const
3455 {
3456     const uint8_t* _frm = reinterpret_cast<const uint8_t*>(frm);
3457     const uint8_t* _frm_end = reinterpret_cast<const uint8_t*>(frm_end);
3458     const uint8_t* _frm_nxt = _frm;
3459     uint32_t* _to = reinterpret_cast<uint32_t*>(to);
3460     uint32_t* _to_end = reinterpret_cast<uint32_t*>(to_end);
3461     uint32_t* _to_nxt = _to;
3462     result r = utf8_to_ucs4(_frm, _frm_end, _frm_nxt, _to, _to_end, _to_nxt,
3463                             _Maxcode_, _Mode_);
3464     frm_nxt = frm + (_frm_nxt - _frm);
3465     to_nxt = to + (_to_nxt - _to);
3466     return r;
3467 }
3468 
3469 __codecvt_utf8<char32_t>::result
do_unshift(state_type &,extern_type * to,extern_type *,extern_type * & to_nxt) const3470 __codecvt_utf8<char32_t>::do_unshift(state_type&,
3471     extern_type* to, extern_type*, extern_type*& to_nxt) const
3472 {
3473     to_nxt = to;
3474     return noconv;
3475 }
3476 
3477 int
do_encoding() const3478 __codecvt_utf8<char32_t>::do_encoding() const  _NOEXCEPT
3479 {
3480     return 0;
3481 }
3482 
3483 bool
do_always_noconv() const3484 __codecvt_utf8<char32_t>::do_always_noconv() const  _NOEXCEPT
3485 {
3486     return false;
3487 }
3488 
3489 int
do_length(state_type &,const extern_type * frm,const extern_type * frm_end,size_t mx) const3490 __codecvt_utf8<char32_t>::do_length(state_type&,
3491     const extern_type* frm, const extern_type* frm_end, size_t mx) const
3492 {
3493     const uint8_t* _frm = reinterpret_cast<const uint8_t*>(frm);
3494     const uint8_t* _frm_end = reinterpret_cast<const uint8_t*>(frm_end);
3495     return utf8_to_ucs4_length(_frm, _frm_end, mx, _Maxcode_, _Mode_);
3496 }
3497 
3498 int
do_max_length() const3499 __codecvt_utf8<char32_t>::do_max_length() const  _NOEXCEPT
3500 {
3501     if (_Mode_ & consume_header)
3502         return 7;
3503     return 4;
3504 }
3505 
3506 // __codecvt_utf16<wchar_t, false>
3507 
3508 __codecvt_utf16<wchar_t, false>::result
do_out(state_type &,const intern_type * frm,const intern_type * frm_end,const intern_type * & frm_nxt,extern_type * to,extern_type * to_end,extern_type * & to_nxt) const3509 __codecvt_utf16<wchar_t, false>::do_out(state_type&,
3510     const intern_type* frm, const intern_type* frm_end, const intern_type*& frm_nxt,
3511     extern_type* to, extern_type* to_end, extern_type*& to_nxt) const
3512 {
3513     const uint32_t* _frm = reinterpret_cast<const uint32_t*>(frm);
3514     const uint32_t* _frm_end = reinterpret_cast<const uint32_t*>(frm_end);
3515     const uint32_t* _frm_nxt = _frm;
3516     uint8_t* _to = reinterpret_cast<uint8_t*>(to);
3517     uint8_t* _to_end = reinterpret_cast<uint8_t*>(to_end);
3518     uint8_t* _to_nxt = _to;
3519     result r = ucs4_to_utf16be(_frm, _frm_end, _frm_nxt, _to, _to_end, _to_nxt,
3520                                _Maxcode_, _Mode_);
3521     frm_nxt = frm + (_frm_nxt - _frm);
3522     to_nxt = to + (_to_nxt - _to);
3523     return r;
3524 }
3525 
3526 __codecvt_utf16<wchar_t, false>::result
do_in(state_type &,const extern_type * frm,const extern_type * frm_end,const extern_type * & frm_nxt,intern_type * to,intern_type * to_end,intern_type * & to_nxt) const3527 __codecvt_utf16<wchar_t, false>::do_in(state_type&,
3528     const extern_type* frm, const extern_type* frm_end, const extern_type*& frm_nxt,
3529     intern_type* to, intern_type* to_end, intern_type*& to_nxt) const
3530 {
3531     const uint8_t* _frm = reinterpret_cast<const uint8_t*>(frm);
3532     const uint8_t* _frm_end = reinterpret_cast<const uint8_t*>(frm_end);
3533     const uint8_t* _frm_nxt = _frm;
3534     uint32_t* _to = reinterpret_cast<uint32_t*>(to);
3535     uint32_t* _to_end = reinterpret_cast<uint32_t*>(to_end);
3536     uint32_t* _to_nxt = _to;
3537     result r = utf16be_to_ucs4(_frm, _frm_end, _frm_nxt, _to, _to_end, _to_nxt,
3538                                _Maxcode_, _Mode_);
3539     frm_nxt = frm + (_frm_nxt - _frm);
3540     to_nxt = to + (_to_nxt - _to);
3541     return r;
3542 }
3543 
3544 __codecvt_utf16<wchar_t, false>::result
do_unshift(state_type &,extern_type * to,extern_type *,extern_type * & to_nxt) const3545 __codecvt_utf16<wchar_t, false>::do_unshift(state_type&,
3546     extern_type* to, extern_type*, extern_type*& to_nxt) const
3547 {
3548     to_nxt = to;
3549     return noconv;
3550 }
3551 
3552 int
do_encoding() const3553 __codecvt_utf16<wchar_t, false>::do_encoding() const  _NOEXCEPT
3554 {
3555     return 0;
3556 }
3557 
3558 bool
do_always_noconv() const3559 __codecvt_utf16<wchar_t, false>::do_always_noconv() const  _NOEXCEPT
3560 {
3561     return false;
3562 }
3563 
3564 int
do_length(state_type &,const extern_type * frm,const extern_type * frm_end,size_t mx) const3565 __codecvt_utf16<wchar_t, false>::do_length(state_type&,
3566     const extern_type* frm, const extern_type* frm_end, size_t mx) const
3567 {
3568     const uint8_t* _frm = reinterpret_cast<const uint8_t*>(frm);
3569     const uint8_t* _frm_end = reinterpret_cast<const uint8_t*>(frm_end);
3570     return utf16be_to_ucs4_length(_frm, _frm_end, mx, _Maxcode_, _Mode_);
3571 }
3572 
3573 int
do_max_length() const3574 __codecvt_utf16<wchar_t, false>::do_max_length() const  _NOEXCEPT
3575 {
3576     if (_Mode_ & consume_header)
3577         return 6;
3578     return 4;
3579 }
3580 
3581 // __codecvt_utf16<wchar_t, true>
3582 
3583 __codecvt_utf16<wchar_t, true>::result
do_out(state_type &,const intern_type * frm,const intern_type * frm_end,const intern_type * & frm_nxt,extern_type * to,extern_type * to_end,extern_type * & to_nxt) const3584 __codecvt_utf16<wchar_t, true>::do_out(state_type&,
3585     const intern_type* frm, const intern_type* frm_end, const intern_type*& frm_nxt,
3586     extern_type* to, extern_type* to_end, extern_type*& to_nxt) const
3587 {
3588     const uint32_t* _frm = reinterpret_cast<const uint32_t*>(frm);
3589     const uint32_t* _frm_end = reinterpret_cast<const uint32_t*>(frm_end);
3590     const uint32_t* _frm_nxt = _frm;
3591     uint8_t* _to = reinterpret_cast<uint8_t*>(to);
3592     uint8_t* _to_end = reinterpret_cast<uint8_t*>(to_end);
3593     uint8_t* _to_nxt = _to;
3594     result r = ucs4_to_utf16le(_frm, _frm_end, _frm_nxt, _to, _to_end, _to_nxt,
3595                                _Maxcode_, _Mode_);
3596     frm_nxt = frm + (_frm_nxt - _frm);
3597     to_nxt = to + (_to_nxt - _to);
3598     return r;
3599 }
3600 
3601 __codecvt_utf16<wchar_t, true>::result
do_in(state_type &,const extern_type * frm,const extern_type * frm_end,const extern_type * & frm_nxt,intern_type * to,intern_type * to_end,intern_type * & to_nxt) const3602 __codecvt_utf16<wchar_t, true>::do_in(state_type&,
3603     const extern_type* frm, const extern_type* frm_end, const extern_type*& frm_nxt,
3604     intern_type* to, intern_type* to_end, intern_type*& to_nxt) const
3605 {
3606     const uint8_t* _frm = reinterpret_cast<const uint8_t*>(frm);
3607     const uint8_t* _frm_end = reinterpret_cast<const uint8_t*>(frm_end);
3608     const uint8_t* _frm_nxt = _frm;
3609     uint32_t* _to = reinterpret_cast<uint32_t*>(to);
3610     uint32_t* _to_end = reinterpret_cast<uint32_t*>(to_end);
3611     uint32_t* _to_nxt = _to;
3612     result r = utf16le_to_ucs4(_frm, _frm_end, _frm_nxt, _to, _to_end, _to_nxt,
3613                                _Maxcode_, _Mode_);
3614     frm_nxt = frm + (_frm_nxt - _frm);
3615     to_nxt = to + (_to_nxt - _to);
3616     return r;
3617 }
3618 
3619 __codecvt_utf16<wchar_t, true>::result
do_unshift(state_type &,extern_type * to,extern_type *,extern_type * & to_nxt) const3620 __codecvt_utf16<wchar_t, true>::do_unshift(state_type&,
3621     extern_type* to, extern_type*, extern_type*& to_nxt) const
3622 {
3623     to_nxt = to;
3624     return noconv;
3625 }
3626 
3627 int
do_encoding() const3628 __codecvt_utf16<wchar_t, true>::do_encoding() const  _NOEXCEPT
3629 {
3630     return 0;
3631 }
3632 
3633 bool
do_always_noconv() const3634 __codecvt_utf16<wchar_t, true>::do_always_noconv() const  _NOEXCEPT
3635 {
3636     return false;
3637 }
3638 
3639 int
do_length(state_type &,const extern_type * frm,const extern_type * frm_end,size_t mx) const3640 __codecvt_utf16<wchar_t, true>::do_length(state_type&,
3641     const extern_type* frm, const extern_type* frm_end, size_t mx) const
3642 {
3643     const uint8_t* _frm = reinterpret_cast<const uint8_t*>(frm);
3644     const uint8_t* _frm_end = reinterpret_cast<const uint8_t*>(frm_end);
3645     return utf16le_to_ucs4_length(_frm, _frm_end, mx, _Maxcode_, _Mode_);
3646 }
3647 
3648 int
do_max_length() const3649 __codecvt_utf16<wchar_t, true>::do_max_length() const  _NOEXCEPT
3650 {
3651     if (_Mode_ & consume_header)
3652         return 6;
3653     return 4;
3654 }
3655 
3656 // __codecvt_utf16<char16_t, false>
3657 
3658 __codecvt_utf16<char16_t, false>::result
do_out(state_type &,const intern_type * frm,const intern_type * frm_end,const intern_type * & frm_nxt,extern_type * to,extern_type * to_end,extern_type * & to_nxt) const3659 __codecvt_utf16<char16_t, false>::do_out(state_type&,
3660     const intern_type* frm, const intern_type* frm_end, const intern_type*& frm_nxt,
3661     extern_type* to, extern_type* to_end, extern_type*& to_nxt) const
3662 {
3663     const uint16_t* _frm = reinterpret_cast<const uint16_t*>(frm);
3664     const uint16_t* _frm_end = reinterpret_cast<const uint16_t*>(frm_end);
3665     const uint16_t* _frm_nxt = _frm;
3666     uint8_t* _to = reinterpret_cast<uint8_t*>(to);
3667     uint8_t* _to_end = reinterpret_cast<uint8_t*>(to_end);
3668     uint8_t* _to_nxt = _to;
3669     result r = ucs2_to_utf16be(_frm, _frm_end, _frm_nxt, _to, _to_end, _to_nxt,
3670                                _Maxcode_, _Mode_);
3671     frm_nxt = frm + (_frm_nxt - _frm);
3672     to_nxt = to + (_to_nxt - _to);
3673     return r;
3674 }
3675 
3676 __codecvt_utf16<char16_t, false>::result
do_in(state_type &,const extern_type * frm,const extern_type * frm_end,const extern_type * & frm_nxt,intern_type * to,intern_type * to_end,intern_type * & to_nxt) const3677 __codecvt_utf16<char16_t, false>::do_in(state_type&,
3678     const extern_type* frm, const extern_type* frm_end, const extern_type*& frm_nxt,
3679     intern_type* to, intern_type* to_end, intern_type*& to_nxt) const
3680 {
3681     const uint8_t* _frm = reinterpret_cast<const uint8_t*>(frm);
3682     const uint8_t* _frm_end = reinterpret_cast<const uint8_t*>(frm_end);
3683     const uint8_t* _frm_nxt = _frm;
3684     uint16_t* _to = reinterpret_cast<uint16_t*>(to);
3685     uint16_t* _to_end = reinterpret_cast<uint16_t*>(to_end);
3686     uint16_t* _to_nxt = _to;
3687     result r = utf16be_to_ucs2(_frm, _frm_end, _frm_nxt, _to, _to_end, _to_nxt,
3688                                _Maxcode_, _Mode_);
3689     frm_nxt = frm + (_frm_nxt - _frm);
3690     to_nxt = to + (_to_nxt - _to);
3691     return r;
3692 }
3693 
3694 __codecvt_utf16<char16_t, false>::result
do_unshift(state_type &,extern_type * to,extern_type *,extern_type * & to_nxt) const3695 __codecvt_utf16<char16_t, false>::do_unshift(state_type&,
3696     extern_type* to, extern_type*, extern_type*& to_nxt) const
3697 {
3698     to_nxt = to;
3699     return noconv;
3700 }
3701 
3702 int
do_encoding() const3703 __codecvt_utf16<char16_t, false>::do_encoding() const  _NOEXCEPT
3704 {
3705     return 0;
3706 }
3707 
3708 bool
do_always_noconv() const3709 __codecvt_utf16<char16_t, false>::do_always_noconv() const  _NOEXCEPT
3710 {
3711     return false;
3712 }
3713 
3714 int
do_length(state_type &,const extern_type * frm,const extern_type * frm_end,size_t mx) const3715 __codecvt_utf16<char16_t, false>::do_length(state_type&,
3716     const extern_type* frm, const extern_type* frm_end, size_t mx) const
3717 {
3718     const uint8_t* _frm = reinterpret_cast<const uint8_t*>(frm);
3719     const uint8_t* _frm_end = reinterpret_cast<const uint8_t*>(frm_end);
3720     return utf16be_to_ucs2_length(_frm, _frm_end, mx, _Maxcode_, _Mode_);
3721 }
3722 
3723 int
do_max_length() const3724 __codecvt_utf16<char16_t, false>::do_max_length() const  _NOEXCEPT
3725 {
3726     if (_Mode_ & consume_header)
3727         return 4;
3728     return 2;
3729 }
3730 
3731 // __codecvt_utf16<char16_t, true>
3732 
3733 __codecvt_utf16<char16_t, true>::result
do_out(state_type &,const intern_type * frm,const intern_type * frm_end,const intern_type * & frm_nxt,extern_type * to,extern_type * to_end,extern_type * & to_nxt) const3734 __codecvt_utf16<char16_t, true>::do_out(state_type&,
3735     const intern_type* frm, const intern_type* frm_end, const intern_type*& frm_nxt,
3736     extern_type* to, extern_type* to_end, extern_type*& to_nxt) const
3737 {
3738     const uint16_t* _frm = reinterpret_cast<const uint16_t*>(frm);
3739     const uint16_t* _frm_end = reinterpret_cast<const uint16_t*>(frm_end);
3740     const uint16_t* _frm_nxt = _frm;
3741     uint8_t* _to = reinterpret_cast<uint8_t*>(to);
3742     uint8_t* _to_end = reinterpret_cast<uint8_t*>(to_end);
3743     uint8_t* _to_nxt = _to;
3744     result r = ucs2_to_utf16le(_frm, _frm_end, _frm_nxt, _to, _to_end, _to_nxt,
3745                                _Maxcode_, _Mode_);
3746     frm_nxt = frm + (_frm_nxt - _frm);
3747     to_nxt = to + (_to_nxt - _to);
3748     return r;
3749 }
3750 
3751 __codecvt_utf16<char16_t, true>::result
do_in(state_type &,const extern_type * frm,const extern_type * frm_end,const extern_type * & frm_nxt,intern_type * to,intern_type * to_end,intern_type * & to_nxt) const3752 __codecvt_utf16<char16_t, true>::do_in(state_type&,
3753     const extern_type* frm, const extern_type* frm_end, const extern_type*& frm_nxt,
3754     intern_type* to, intern_type* to_end, intern_type*& to_nxt) const
3755 {
3756     const uint8_t* _frm = reinterpret_cast<const uint8_t*>(frm);
3757     const uint8_t* _frm_end = reinterpret_cast<const uint8_t*>(frm_end);
3758     const uint8_t* _frm_nxt = _frm;
3759     uint16_t* _to = reinterpret_cast<uint16_t*>(to);
3760     uint16_t* _to_end = reinterpret_cast<uint16_t*>(to_end);
3761     uint16_t* _to_nxt = _to;
3762     result r = utf16le_to_ucs2(_frm, _frm_end, _frm_nxt, _to, _to_end, _to_nxt,
3763                                _Maxcode_, _Mode_);
3764     frm_nxt = frm + (_frm_nxt - _frm);
3765     to_nxt = to + (_to_nxt - _to);
3766     return r;
3767 }
3768 
3769 __codecvt_utf16<char16_t, true>::result
do_unshift(state_type &,extern_type * to,extern_type *,extern_type * & to_nxt) const3770 __codecvt_utf16<char16_t, true>::do_unshift(state_type&,
3771     extern_type* to, extern_type*, extern_type*& to_nxt) const
3772 {
3773     to_nxt = to;
3774     return noconv;
3775 }
3776 
3777 int
do_encoding() const3778 __codecvt_utf16<char16_t, true>::do_encoding() const  _NOEXCEPT
3779 {
3780     return 0;
3781 }
3782 
3783 bool
do_always_noconv() const3784 __codecvt_utf16<char16_t, true>::do_always_noconv() const  _NOEXCEPT
3785 {
3786     return false;
3787 }
3788 
3789 int
do_length(state_type &,const extern_type * frm,const extern_type * frm_end,size_t mx) const3790 __codecvt_utf16<char16_t, true>::do_length(state_type&,
3791     const extern_type* frm, const extern_type* frm_end, size_t mx) const
3792 {
3793     const uint8_t* _frm = reinterpret_cast<const uint8_t*>(frm);
3794     const uint8_t* _frm_end = reinterpret_cast<const uint8_t*>(frm_end);
3795     return utf16le_to_ucs2_length(_frm, _frm_end, mx, _Maxcode_, _Mode_);
3796 }
3797 
3798 int
do_max_length() const3799 __codecvt_utf16<char16_t, true>::do_max_length() const  _NOEXCEPT
3800 {
3801     if (_Mode_ & consume_header)
3802         return 4;
3803     return 2;
3804 }
3805 
3806 // __codecvt_utf16<char32_t, false>
3807 
3808 __codecvt_utf16<char32_t, false>::result
do_out(state_type &,const intern_type * frm,const intern_type * frm_end,const intern_type * & frm_nxt,extern_type * to,extern_type * to_end,extern_type * & to_nxt) const3809 __codecvt_utf16<char32_t, false>::do_out(state_type&,
3810     const intern_type* frm, const intern_type* frm_end, const intern_type*& frm_nxt,
3811     extern_type* to, extern_type* to_end, extern_type*& to_nxt) const
3812 {
3813     const uint32_t* _frm = reinterpret_cast<const uint32_t*>(frm);
3814     const uint32_t* _frm_end = reinterpret_cast<const uint32_t*>(frm_end);
3815     const uint32_t* _frm_nxt = _frm;
3816     uint8_t* _to = reinterpret_cast<uint8_t*>(to);
3817     uint8_t* _to_end = reinterpret_cast<uint8_t*>(to_end);
3818     uint8_t* _to_nxt = _to;
3819     result r = ucs4_to_utf16be(_frm, _frm_end, _frm_nxt, _to, _to_end, _to_nxt,
3820                                _Maxcode_, _Mode_);
3821     frm_nxt = frm + (_frm_nxt - _frm);
3822     to_nxt = to + (_to_nxt - _to);
3823     return r;
3824 }
3825 
3826 __codecvt_utf16<char32_t, false>::result
do_in(state_type &,const extern_type * frm,const extern_type * frm_end,const extern_type * & frm_nxt,intern_type * to,intern_type * to_end,intern_type * & to_nxt) const3827 __codecvt_utf16<char32_t, false>::do_in(state_type&,
3828     const extern_type* frm, const extern_type* frm_end, const extern_type*& frm_nxt,
3829     intern_type* to, intern_type* to_end, intern_type*& to_nxt) const
3830 {
3831     const uint8_t* _frm = reinterpret_cast<const uint8_t*>(frm);
3832     const uint8_t* _frm_end = reinterpret_cast<const uint8_t*>(frm_end);
3833     const uint8_t* _frm_nxt = _frm;
3834     uint32_t* _to = reinterpret_cast<uint32_t*>(to);
3835     uint32_t* _to_end = reinterpret_cast<uint32_t*>(to_end);
3836     uint32_t* _to_nxt = _to;
3837     result r = utf16be_to_ucs4(_frm, _frm_end, _frm_nxt, _to, _to_end, _to_nxt,
3838                                _Maxcode_, _Mode_);
3839     frm_nxt = frm + (_frm_nxt - _frm);
3840     to_nxt = to + (_to_nxt - _to);
3841     return r;
3842 }
3843 
3844 __codecvt_utf16<char32_t, false>::result
do_unshift(state_type &,extern_type * to,extern_type *,extern_type * & to_nxt) const3845 __codecvt_utf16<char32_t, false>::do_unshift(state_type&,
3846     extern_type* to, extern_type*, extern_type*& to_nxt) const
3847 {
3848     to_nxt = to;
3849     return noconv;
3850 }
3851 
3852 int
do_encoding() const3853 __codecvt_utf16<char32_t, false>::do_encoding() const  _NOEXCEPT
3854 {
3855     return 0;
3856 }
3857 
3858 bool
do_always_noconv() const3859 __codecvt_utf16<char32_t, false>::do_always_noconv() const  _NOEXCEPT
3860 {
3861     return false;
3862 }
3863 
3864 int
do_length(state_type &,const extern_type * frm,const extern_type * frm_end,size_t mx) const3865 __codecvt_utf16<char32_t, false>::do_length(state_type&,
3866     const extern_type* frm, const extern_type* frm_end, size_t mx) const
3867 {
3868     const uint8_t* _frm = reinterpret_cast<const uint8_t*>(frm);
3869     const uint8_t* _frm_end = reinterpret_cast<const uint8_t*>(frm_end);
3870     return utf16be_to_ucs4_length(_frm, _frm_end, mx, _Maxcode_, _Mode_);
3871 }
3872 
3873 int
do_max_length() const3874 __codecvt_utf16<char32_t, false>::do_max_length() const  _NOEXCEPT
3875 {
3876     if (_Mode_ & consume_header)
3877         return 6;
3878     return 4;
3879 }
3880 
3881 // __codecvt_utf16<char32_t, true>
3882 
3883 __codecvt_utf16<char32_t, true>::result
do_out(state_type &,const intern_type * frm,const intern_type * frm_end,const intern_type * & frm_nxt,extern_type * to,extern_type * to_end,extern_type * & to_nxt) const3884 __codecvt_utf16<char32_t, true>::do_out(state_type&,
3885     const intern_type* frm, const intern_type* frm_end, const intern_type*& frm_nxt,
3886     extern_type* to, extern_type* to_end, extern_type*& to_nxt) const
3887 {
3888     const uint32_t* _frm = reinterpret_cast<const uint32_t*>(frm);
3889     const uint32_t* _frm_end = reinterpret_cast<const uint32_t*>(frm_end);
3890     const uint32_t* _frm_nxt = _frm;
3891     uint8_t* _to = reinterpret_cast<uint8_t*>(to);
3892     uint8_t* _to_end = reinterpret_cast<uint8_t*>(to_end);
3893     uint8_t* _to_nxt = _to;
3894     result r = ucs4_to_utf16le(_frm, _frm_end, _frm_nxt, _to, _to_end, _to_nxt,
3895                                _Maxcode_, _Mode_);
3896     frm_nxt = frm + (_frm_nxt - _frm);
3897     to_nxt = to + (_to_nxt - _to);
3898     return r;
3899 }
3900 
3901 __codecvt_utf16<char32_t, true>::result
do_in(state_type &,const extern_type * frm,const extern_type * frm_end,const extern_type * & frm_nxt,intern_type * to,intern_type * to_end,intern_type * & to_nxt) const3902 __codecvt_utf16<char32_t, true>::do_in(state_type&,
3903     const extern_type* frm, const extern_type* frm_end, const extern_type*& frm_nxt,
3904     intern_type* to, intern_type* to_end, intern_type*& to_nxt) const
3905 {
3906     const uint8_t* _frm = reinterpret_cast<const uint8_t*>(frm);
3907     const uint8_t* _frm_end = reinterpret_cast<const uint8_t*>(frm_end);
3908     const uint8_t* _frm_nxt = _frm;
3909     uint32_t* _to = reinterpret_cast<uint32_t*>(to);
3910     uint32_t* _to_end = reinterpret_cast<uint32_t*>(to_end);
3911     uint32_t* _to_nxt = _to;
3912     result r = utf16le_to_ucs4(_frm, _frm_end, _frm_nxt, _to, _to_end, _to_nxt,
3913                                _Maxcode_, _Mode_);
3914     frm_nxt = frm + (_frm_nxt - _frm);
3915     to_nxt = to + (_to_nxt - _to);
3916     return r;
3917 }
3918 
3919 __codecvt_utf16<char32_t, true>::result
do_unshift(state_type &,extern_type * to,extern_type *,extern_type * & to_nxt) const3920 __codecvt_utf16<char32_t, true>::do_unshift(state_type&,
3921     extern_type* to, extern_type*, extern_type*& to_nxt) const
3922 {
3923     to_nxt = to;
3924     return noconv;
3925 }
3926 
3927 int
do_encoding() const3928 __codecvt_utf16<char32_t, true>::do_encoding() const  _NOEXCEPT
3929 {
3930     return 0;
3931 }
3932 
3933 bool
do_always_noconv() const3934 __codecvt_utf16<char32_t, true>::do_always_noconv() const  _NOEXCEPT
3935 {
3936     return false;
3937 }
3938 
3939 int
do_length(state_type &,const extern_type * frm,const extern_type * frm_end,size_t mx) const3940 __codecvt_utf16<char32_t, true>::do_length(state_type&,
3941     const extern_type* frm, const extern_type* frm_end, size_t mx) const
3942 {
3943     const uint8_t* _frm = reinterpret_cast<const uint8_t*>(frm);
3944     const uint8_t* _frm_end = reinterpret_cast<const uint8_t*>(frm_end);
3945     return utf16le_to_ucs4_length(_frm, _frm_end, mx, _Maxcode_, _Mode_);
3946 }
3947 
3948 int
do_max_length() const3949 __codecvt_utf16<char32_t, true>::do_max_length() const  _NOEXCEPT
3950 {
3951     if (_Mode_ & consume_header)
3952         return 6;
3953     return 4;
3954 }
3955 
3956 // __codecvt_utf8_utf16<wchar_t>
3957 
3958 __codecvt_utf8_utf16<wchar_t>::result
do_out(state_type &,const intern_type * frm,const intern_type * frm_end,const intern_type * & frm_nxt,extern_type * to,extern_type * to_end,extern_type * & to_nxt) const3959 __codecvt_utf8_utf16<wchar_t>::do_out(state_type&,
3960     const intern_type* frm, const intern_type* frm_end, const intern_type*& frm_nxt,
3961     extern_type* to, extern_type* to_end, extern_type*& to_nxt) const
3962 {
3963     const uint32_t* _frm = reinterpret_cast<const uint32_t*>(frm);
3964     const uint32_t* _frm_end = reinterpret_cast<const uint32_t*>(frm_end);
3965     const uint32_t* _frm_nxt = _frm;
3966     uint8_t* _to = reinterpret_cast<uint8_t*>(to);
3967     uint8_t* _to_end = reinterpret_cast<uint8_t*>(to_end);
3968     uint8_t* _to_nxt = _to;
3969     result r = utf16_to_utf8(_frm, _frm_end, _frm_nxt, _to, _to_end, _to_nxt,
3970                              _Maxcode_, _Mode_);
3971     frm_nxt = frm + (_frm_nxt - _frm);
3972     to_nxt = to + (_to_nxt - _to);
3973     return r;
3974 }
3975 
3976 __codecvt_utf8_utf16<wchar_t>::result
do_in(state_type &,const extern_type * frm,const extern_type * frm_end,const extern_type * & frm_nxt,intern_type * to,intern_type * to_end,intern_type * & to_nxt) const3977 __codecvt_utf8_utf16<wchar_t>::do_in(state_type&,
3978     const extern_type* frm, const extern_type* frm_end, const extern_type*& frm_nxt,
3979     intern_type* to, intern_type* to_end, intern_type*& to_nxt) const
3980 {
3981     const uint8_t* _frm = reinterpret_cast<const uint8_t*>(frm);
3982     const uint8_t* _frm_end = reinterpret_cast<const uint8_t*>(frm_end);
3983     const uint8_t* _frm_nxt = _frm;
3984     uint32_t* _to = reinterpret_cast<uint32_t*>(to);
3985     uint32_t* _to_end = reinterpret_cast<uint32_t*>(to_end);
3986     uint32_t* _to_nxt = _to;
3987     result r = utf8_to_utf16(_frm, _frm_end, _frm_nxt, _to, _to_end, _to_nxt,
3988                              _Maxcode_, _Mode_);
3989     frm_nxt = frm + (_frm_nxt - _frm);
3990     to_nxt = to + (_to_nxt - _to);
3991     return r;
3992 }
3993 
3994 __codecvt_utf8_utf16<wchar_t>::result
do_unshift(state_type &,extern_type * to,extern_type *,extern_type * & to_nxt) const3995 __codecvt_utf8_utf16<wchar_t>::do_unshift(state_type&,
3996     extern_type* to, extern_type*, extern_type*& to_nxt) const
3997 {
3998     to_nxt = to;
3999     return noconv;
4000 }
4001 
4002 int
do_encoding() const4003 __codecvt_utf8_utf16<wchar_t>::do_encoding() const  _NOEXCEPT
4004 {
4005     return 0;
4006 }
4007 
4008 bool
do_always_noconv() const4009 __codecvt_utf8_utf16<wchar_t>::do_always_noconv() const  _NOEXCEPT
4010 {
4011     return false;
4012 }
4013 
4014 int
do_length(state_type &,const extern_type * frm,const extern_type * frm_end,size_t mx) const4015 __codecvt_utf8_utf16<wchar_t>::do_length(state_type&,
4016     const extern_type* frm, const extern_type* frm_end, size_t mx) const
4017 {
4018     const uint8_t* _frm = reinterpret_cast<const uint8_t*>(frm);
4019     const uint8_t* _frm_end = reinterpret_cast<const uint8_t*>(frm_end);
4020     return utf8_to_utf16_length(_frm, _frm_end, mx, _Maxcode_, _Mode_);
4021 }
4022 
4023 int
do_max_length() const4024 __codecvt_utf8_utf16<wchar_t>::do_max_length() const  _NOEXCEPT
4025 {
4026     if (_Mode_ & consume_header)
4027         return 7;
4028     return 4;
4029 }
4030 
4031 // __codecvt_utf8_utf16<char16_t>
4032 
4033 __codecvt_utf8_utf16<char16_t>::result
do_out(state_type &,const intern_type * frm,const intern_type * frm_end,const intern_type * & frm_nxt,extern_type * to,extern_type * to_end,extern_type * & to_nxt) const4034 __codecvt_utf8_utf16<char16_t>::do_out(state_type&,
4035     const intern_type* frm, const intern_type* frm_end, const intern_type*& frm_nxt,
4036     extern_type* to, extern_type* to_end, extern_type*& to_nxt) const
4037 {
4038     const uint16_t* _frm = reinterpret_cast<const uint16_t*>(frm);
4039     const uint16_t* _frm_end = reinterpret_cast<const uint16_t*>(frm_end);
4040     const uint16_t* _frm_nxt = _frm;
4041     uint8_t* _to = reinterpret_cast<uint8_t*>(to);
4042     uint8_t* _to_end = reinterpret_cast<uint8_t*>(to_end);
4043     uint8_t* _to_nxt = _to;
4044     result r = utf16_to_utf8(_frm, _frm_end, _frm_nxt, _to, _to_end, _to_nxt,
4045                              _Maxcode_, _Mode_);
4046     frm_nxt = frm + (_frm_nxt - _frm);
4047     to_nxt = to + (_to_nxt - _to);
4048     return r;
4049 }
4050 
4051 __codecvt_utf8_utf16<char16_t>::result
do_in(state_type &,const extern_type * frm,const extern_type * frm_end,const extern_type * & frm_nxt,intern_type * to,intern_type * to_end,intern_type * & to_nxt) const4052 __codecvt_utf8_utf16<char16_t>::do_in(state_type&,
4053     const extern_type* frm, const extern_type* frm_end, const extern_type*& frm_nxt,
4054     intern_type* to, intern_type* to_end, intern_type*& to_nxt) const
4055 {
4056     const uint8_t* _frm = reinterpret_cast<const uint8_t*>(frm);
4057     const uint8_t* _frm_end = reinterpret_cast<const uint8_t*>(frm_end);
4058     const uint8_t* _frm_nxt = _frm;
4059     uint16_t* _to = reinterpret_cast<uint16_t*>(to);
4060     uint16_t* _to_end = reinterpret_cast<uint16_t*>(to_end);
4061     uint16_t* _to_nxt = _to;
4062     result r = utf8_to_utf16(_frm, _frm_end, _frm_nxt, _to, _to_end, _to_nxt,
4063                              _Maxcode_, _Mode_);
4064     frm_nxt = frm + (_frm_nxt - _frm);
4065     to_nxt = to + (_to_nxt - _to);
4066     return r;
4067 }
4068 
4069 __codecvt_utf8_utf16<char16_t>::result
do_unshift(state_type &,extern_type * to,extern_type *,extern_type * & to_nxt) const4070 __codecvt_utf8_utf16<char16_t>::do_unshift(state_type&,
4071     extern_type* to, extern_type*, extern_type*& to_nxt) const
4072 {
4073     to_nxt = to;
4074     return noconv;
4075 }
4076 
4077 int
do_encoding() const4078 __codecvt_utf8_utf16<char16_t>::do_encoding() const  _NOEXCEPT
4079 {
4080     return 0;
4081 }
4082 
4083 bool
do_always_noconv() const4084 __codecvt_utf8_utf16<char16_t>::do_always_noconv() const  _NOEXCEPT
4085 {
4086     return false;
4087 }
4088 
4089 int
do_length(state_type &,const extern_type * frm,const extern_type * frm_end,size_t mx) const4090 __codecvt_utf8_utf16<char16_t>::do_length(state_type&,
4091     const extern_type* frm, const extern_type* frm_end, size_t mx) const
4092 {
4093     const uint8_t* _frm = reinterpret_cast<const uint8_t*>(frm);
4094     const uint8_t* _frm_end = reinterpret_cast<const uint8_t*>(frm_end);
4095     return utf8_to_utf16_length(_frm, _frm_end, mx, _Maxcode_, _Mode_);
4096 }
4097 
4098 int
do_max_length() const4099 __codecvt_utf8_utf16<char16_t>::do_max_length() const  _NOEXCEPT
4100 {
4101     if (_Mode_ & consume_header)
4102         return 7;
4103     return 4;
4104 }
4105 
4106 // __codecvt_utf8_utf16<char32_t>
4107 
4108 __codecvt_utf8_utf16<char32_t>::result
do_out(state_type &,const intern_type * frm,const intern_type * frm_end,const intern_type * & frm_nxt,extern_type * to,extern_type * to_end,extern_type * & to_nxt) const4109 __codecvt_utf8_utf16<char32_t>::do_out(state_type&,
4110     const intern_type* frm, const intern_type* frm_end, const intern_type*& frm_nxt,
4111     extern_type* to, extern_type* to_end, extern_type*& to_nxt) const
4112 {
4113     const uint32_t* _frm = reinterpret_cast<const uint32_t*>(frm);
4114     const uint32_t* _frm_end = reinterpret_cast<const uint32_t*>(frm_end);
4115     const uint32_t* _frm_nxt = _frm;
4116     uint8_t* _to = reinterpret_cast<uint8_t*>(to);
4117     uint8_t* _to_end = reinterpret_cast<uint8_t*>(to_end);
4118     uint8_t* _to_nxt = _to;
4119     result r = utf16_to_utf8(_frm, _frm_end, _frm_nxt, _to, _to_end, _to_nxt,
4120                              _Maxcode_, _Mode_);
4121     frm_nxt = frm + (_frm_nxt - _frm);
4122     to_nxt = to + (_to_nxt - _to);
4123     return r;
4124 }
4125 
4126 __codecvt_utf8_utf16<char32_t>::result
do_in(state_type &,const extern_type * frm,const extern_type * frm_end,const extern_type * & frm_nxt,intern_type * to,intern_type * to_end,intern_type * & to_nxt) const4127 __codecvt_utf8_utf16<char32_t>::do_in(state_type&,
4128     const extern_type* frm, const extern_type* frm_end, const extern_type*& frm_nxt,
4129     intern_type* to, intern_type* to_end, intern_type*& to_nxt) const
4130 {
4131     const uint8_t* _frm = reinterpret_cast<const uint8_t*>(frm);
4132     const uint8_t* _frm_end = reinterpret_cast<const uint8_t*>(frm_end);
4133     const uint8_t* _frm_nxt = _frm;
4134     uint32_t* _to = reinterpret_cast<uint32_t*>(to);
4135     uint32_t* _to_end = reinterpret_cast<uint32_t*>(to_end);
4136     uint32_t* _to_nxt = _to;
4137     result r = utf8_to_utf16(_frm, _frm_end, _frm_nxt, _to, _to_end, _to_nxt,
4138                              _Maxcode_, _Mode_);
4139     frm_nxt = frm + (_frm_nxt - _frm);
4140     to_nxt = to + (_to_nxt - _to);
4141     return r;
4142 }
4143 
4144 __codecvt_utf8_utf16<char32_t>::result
do_unshift(state_type &,extern_type * to,extern_type *,extern_type * & to_nxt) const4145 __codecvt_utf8_utf16<char32_t>::do_unshift(state_type&,
4146     extern_type* to, extern_type*, extern_type*& to_nxt) const
4147 {
4148     to_nxt = to;
4149     return noconv;
4150 }
4151 
4152 int
do_encoding() const4153 __codecvt_utf8_utf16<char32_t>::do_encoding() const  _NOEXCEPT
4154 {
4155     return 0;
4156 }
4157 
4158 bool
do_always_noconv() const4159 __codecvt_utf8_utf16<char32_t>::do_always_noconv() const  _NOEXCEPT
4160 {
4161     return false;
4162 }
4163 
4164 int
do_length(state_type &,const extern_type * frm,const extern_type * frm_end,size_t mx) const4165 __codecvt_utf8_utf16<char32_t>::do_length(state_type&,
4166     const extern_type* frm, const extern_type* frm_end, size_t mx) const
4167 {
4168     const uint8_t* _frm = reinterpret_cast<const uint8_t*>(frm);
4169     const uint8_t* _frm_end = reinterpret_cast<const uint8_t*>(frm_end);
4170     return utf8_to_utf16_length(_frm, _frm_end, mx, _Maxcode_, _Mode_);
4171 }
4172 
4173 int
do_max_length() const4174 __codecvt_utf8_utf16<char32_t>::do_max_length() const  _NOEXCEPT
4175 {
4176     if (_Mode_ & consume_header)
4177         return 7;
4178     return 4;
4179 }
4180 
4181 // __narrow_to_utf8<16>
4182 
~__narrow_to_utf8()4183 __narrow_to_utf8<16>::~__narrow_to_utf8()
4184 {
4185 }
4186 
4187 // __narrow_to_utf8<32>
4188 
~__narrow_to_utf8()4189 __narrow_to_utf8<32>::~__narrow_to_utf8()
4190 {
4191 }
4192 
4193 // __widen_from_utf8<16>
4194 
~__widen_from_utf8()4195 __widen_from_utf8<16>::~__widen_from_utf8()
4196 {
4197 }
4198 
4199 // __widen_from_utf8<32>
4200 
~__widen_from_utf8()4201 __widen_from_utf8<32>::~__widen_from_utf8()
4202 {
4203 }
4204 
4205 
checked_string_to_wchar_convert(wchar_t & dest,const char * ptr,locale_t loc)4206 static bool checked_string_to_wchar_convert(wchar_t& dest,
4207                                             const char* ptr,
4208                                             locale_t loc) {
4209   if (*ptr == '\0')
4210     return false;
4211   mbstate_t mb = {};
4212   wchar_t out;
4213   size_t ret = __libcpp_mbrtowc_l(&out, ptr, strlen(ptr), &mb, loc);
4214   if (ret == static_cast<size_t>(-1) || ret == static_cast<size_t>(-2)) {
4215     return false;
4216   }
4217   dest = out;
4218   return true;
4219 }
4220 
checked_string_to_char_convert(char & dest,const char * ptr,locale_t __loc)4221 static bool checked_string_to_char_convert(char& dest,
4222                                            const char* ptr,
4223                                            locale_t __loc) {
4224   if (*ptr == '\0')
4225     return false;
4226   if (!ptr[1]) {
4227     dest = *ptr;
4228     return true;
4229   }
4230   // First convert the MBS into a wide char then attempt to narrow it using
4231   // wctob_l.
4232   wchar_t wout;
4233   if (!checked_string_to_wchar_convert(wout, ptr, __loc))
4234     return false;
4235   int res;
4236   if ((res = __libcpp_wctob_l(wout, __loc)) != char_traits<char>::eof()) {
4237     dest = res;
4238     return true;
4239   }
4240   // FIXME: Work around specific multibyte sequences that we can reasonable
4241   // translate into a different single byte.
4242   switch (wout) {
4243   case L'\u202F': // narrow non-breaking space
4244   case L'\u00A0': // non-breaking space
4245     dest = ' ';
4246     return true;
4247   default:
4248     return false;
4249   }
4250   _LIBCPP_UNREACHABLE();
4251 }
4252 
4253 
4254 // numpunct<char> && numpunct<wchar_t>
4255 
4256 locale::id numpunct< char  >::id;
4257 locale::id numpunct<wchar_t>::id;
4258 
numpunct(size_t refs)4259 numpunct<char>::numpunct(size_t refs)
4260     : locale::facet(refs),
4261       __decimal_point_('.'),
4262       __thousands_sep_(',')
4263 {
4264 }
4265 
numpunct(size_t refs)4266 numpunct<wchar_t>::numpunct(size_t refs)
4267     : locale::facet(refs),
4268       __decimal_point_(L'.'),
4269       __thousands_sep_(L',')
4270 {
4271 }
4272 
~numpunct()4273 numpunct<char>::~numpunct()
4274 {
4275 }
4276 
~numpunct()4277 numpunct<wchar_t>::~numpunct()
4278 {
4279 }
4280 
do_decimal_point() const4281  char   numpunct< char  >::do_decimal_point() const {return __decimal_point_;}
do_decimal_point() const4282 wchar_t numpunct<wchar_t>::do_decimal_point() const {return __decimal_point_;}
4283 
do_thousands_sep() const4284  char   numpunct< char  >::do_thousands_sep() const {return __thousands_sep_;}
do_thousands_sep() const4285 wchar_t numpunct<wchar_t>::do_thousands_sep() const {return __thousands_sep_;}
4286 
do_grouping() const4287 string numpunct< char  >::do_grouping() const {return __grouping_;}
do_grouping() const4288 string numpunct<wchar_t>::do_grouping() const {return __grouping_;}
4289 
do_truename() const4290  string numpunct< char  >::do_truename() const {return "true";}
do_truename() const4291 wstring numpunct<wchar_t>::do_truename() const {return L"true";}
4292 
do_falsename() const4293  string numpunct< char  >::do_falsename() const {return "false";}
do_falsename() const4294 wstring numpunct<wchar_t>::do_falsename() const {return L"false";}
4295 
4296 // numpunct_byname<char>
4297 
numpunct_byname(const char * nm,size_t refs)4298 numpunct_byname<char>::numpunct_byname(const char* nm, size_t refs)
4299     : numpunct<char>(refs)
4300 {
4301     __init(nm);
4302 }
4303 
numpunct_byname(const string & nm,size_t refs)4304 numpunct_byname<char>::numpunct_byname(const string& nm, size_t refs)
4305     : numpunct<char>(refs)
4306 {
4307     __init(nm.c_str());
4308 }
4309 
~numpunct_byname()4310 numpunct_byname<char>::~numpunct_byname()
4311 {
4312 }
4313 
4314 void
__init(const char * nm)4315 numpunct_byname<char>::__init(const char* nm)
4316 {
4317     if (strcmp(nm, "C") != 0)
4318     {
4319         __libcpp_unique_locale loc(nm);
4320         if (!loc)
4321             __throw_runtime_error("numpunct_byname<char>::numpunct_byname"
4322                                 " failed to construct for " + string(nm));
4323 
4324         lconv* lc = __libcpp_localeconv_l(loc.get());
4325         checked_string_to_char_convert(__decimal_point_, lc->decimal_point,
4326                                        loc.get());
4327         checked_string_to_char_convert(__thousands_sep_, lc->thousands_sep,
4328                                        loc.get());
4329         __grouping_ = lc->grouping;
4330         // localization for truename and falsename is not available
4331     }
4332 }
4333 
4334 // numpunct_byname<wchar_t>
4335 
numpunct_byname(const char * nm,size_t refs)4336 numpunct_byname<wchar_t>::numpunct_byname(const char* nm, size_t refs)
4337     : numpunct<wchar_t>(refs)
4338 {
4339     __init(nm);
4340 }
4341 
numpunct_byname(const string & nm,size_t refs)4342 numpunct_byname<wchar_t>::numpunct_byname(const string& nm, size_t refs)
4343     : numpunct<wchar_t>(refs)
4344 {
4345     __init(nm.c_str());
4346 }
4347 
~numpunct_byname()4348 numpunct_byname<wchar_t>::~numpunct_byname()
4349 {
4350 }
4351 
4352 void
__init(const char * nm)4353 numpunct_byname<wchar_t>::__init(const char* nm)
4354 {
4355     if (strcmp(nm, "C") != 0)
4356     {
4357         __libcpp_unique_locale loc(nm);
4358         if (!loc)
4359             __throw_runtime_error("numpunct_byname<wchar_t>::numpunct_byname"
4360                                 " failed to construct for " + string(nm));
4361 
4362         lconv* lc = __libcpp_localeconv_l(loc.get());
4363         checked_string_to_wchar_convert(__decimal_point_, lc->decimal_point,
4364                                         loc.get());
4365         checked_string_to_wchar_convert(__thousands_sep_, lc->thousands_sep,
4366                                         loc.get());
4367         __grouping_ = lc->grouping;
4368         // localization for truename and falsename is not available
4369     }
4370 }
4371 
4372 // num_get helpers
4373 
4374 int
__get_base(ios_base & iob)4375 __num_get_base::__get_base(ios_base& iob)
4376 {
4377     ios_base::fmtflags __basefield = iob.flags() & ios_base::basefield;
4378     if (__basefield == ios_base::oct)
4379         return 8;
4380     else if (__basefield == ios_base::hex)
4381         return 16;
4382     else if (__basefield == 0)
4383         return 0;
4384     return 10;
4385 }
4386 
4387 const char __num_get_base::__src[33] = "0123456789abcdefABCDEFxX+-pPiInN";
4388 
4389 void
__check_grouping(const string & __grouping,unsigned * __g,unsigned * __g_end,ios_base::iostate & __err)4390 __check_grouping(const string& __grouping, unsigned* __g, unsigned* __g_end,
4391                  ios_base::iostate& __err)
4392 {
4393     if (__grouping.size() != 0)
4394     {
4395         reverse(__g, __g_end);
4396         const char* __ig = __grouping.data();
4397         const char* __eg = __ig + __grouping.size();
4398         for (unsigned* __r = __g; __r < __g_end-1; ++__r)
4399         {
4400             if (0 < *__ig && *__ig < numeric_limits<char>::max())
4401             {
4402                 if (static_cast<unsigned>(*__ig) != *__r)
4403                 {
4404                     __err = ios_base::failbit;
4405                     return;
4406                 }
4407             }
4408             if (__eg - __ig > 1)
4409                 ++__ig;
4410         }
4411         if (0 < *__ig && *__ig < numeric_limits<char>::max())
4412         {
4413             if (static_cast<unsigned>(*__ig) < __g_end[-1] || __g_end[-1] == 0)
4414                 __err = ios_base::failbit;
4415         }
4416     }
4417 }
4418 
4419 void
__format_int(char * __fmtp,const char * __len,bool __signd,ios_base::fmtflags __flags)4420 __num_put_base::__format_int(char* __fmtp, const char* __len, bool __signd,
4421                              ios_base::fmtflags __flags)
4422 {
4423     if (__flags & ios_base::showpos)
4424         *__fmtp++ = '+';
4425     if (__flags & ios_base::showbase)
4426         *__fmtp++ = '#';
4427     while(*__len)
4428         *__fmtp++ = *__len++;
4429     if ((__flags & ios_base::basefield) == ios_base::oct)
4430         *__fmtp = 'o';
4431     else if ((__flags & ios_base::basefield) == ios_base::hex)
4432     {
4433         if (__flags & ios_base::uppercase)
4434             *__fmtp = 'X';
4435         else
4436             *__fmtp = 'x';
4437     }
4438     else if (__signd)
4439         *__fmtp = 'd';
4440     else
4441         *__fmtp = 'u';
4442 }
4443 
4444 bool
__format_float(char * __fmtp,const char * __len,ios_base::fmtflags __flags)4445 __num_put_base::__format_float(char* __fmtp, const char* __len,
4446                                ios_base::fmtflags __flags)
4447 {
4448     bool specify_precision = true;
4449     if (__flags & ios_base::showpos)
4450         *__fmtp++ = '+';
4451     if (__flags & ios_base::showpoint)
4452         *__fmtp++ = '#';
4453     ios_base::fmtflags floatfield = __flags & ios_base::floatfield;
4454     bool uppercase = (__flags & ios_base::uppercase) != 0;
4455     if (floatfield == (ios_base::fixed | ios_base::scientific))
4456         specify_precision = false;
4457     else
4458     {
4459         *__fmtp++ = '.';
4460         *__fmtp++ = '*';
4461     }
4462     while(*__len)
4463         *__fmtp++ = *__len++;
4464     if (floatfield == ios_base::fixed)
4465     {
4466         if (uppercase)
4467             *__fmtp = 'F';
4468         else
4469             *__fmtp = 'f';
4470     }
4471     else if (floatfield == ios_base::scientific)
4472     {
4473         if (uppercase)
4474             *__fmtp = 'E';
4475         else
4476             *__fmtp = 'e';
4477     }
4478     else if (floatfield == (ios_base::fixed | ios_base::scientific))
4479     {
4480         if (uppercase)
4481             *__fmtp = 'A';
4482         else
4483             *__fmtp = 'a';
4484     }
4485     else
4486     {
4487         if (uppercase)
4488             *__fmtp = 'G';
4489         else
4490             *__fmtp = 'g';
4491     }
4492     return specify_precision;
4493 }
4494 
4495 char*
__identify_padding(char * __nb,char * __ne,const ios_base & __iob)4496 __num_put_base::__identify_padding(char* __nb, char* __ne,
4497                                    const ios_base& __iob)
4498 {
4499     switch (__iob.flags() & ios_base::adjustfield)
4500     {
4501     case ios_base::internal:
4502         if (__nb[0] == '-' || __nb[0] == '+')
4503             return __nb+1;
4504         if (__ne - __nb >= 2 && __nb[0] == '0'
4505                             && (__nb[1] == 'x' || __nb[1] == 'X'))
4506             return __nb+2;
4507         break;
4508     case ios_base::left:
4509         return __ne;
4510     case ios_base::right:
4511     default:
4512         break;
4513     }
4514     return __nb;
4515 }
4516 
4517 // time_get
4518 
4519 static
4520 string*
init_weeks()4521 init_weeks()
4522 {
4523     static string weeks[14];
4524     weeks[0]  = "Sunday";
4525     weeks[1]  = "Monday";
4526     weeks[2]  = "Tuesday";
4527     weeks[3]  = "Wednesday";
4528     weeks[4]  = "Thursday";
4529     weeks[5]  = "Friday";
4530     weeks[6]  = "Saturday";
4531     weeks[7]  = "Sun";
4532     weeks[8]  = "Mon";
4533     weeks[9]  = "Tue";
4534     weeks[10] = "Wed";
4535     weeks[11] = "Thu";
4536     weeks[12] = "Fri";
4537     weeks[13] = "Sat";
4538     return weeks;
4539 }
4540 
4541 static
4542 wstring*
init_wweeks()4543 init_wweeks()
4544 {
4545     static wstring weeks[14];
4546     weeks[0]  = L"Sunday";
4547     weeks[1]  = L"Monday";
4548     weeks[2]  = L"Tuesday";
4549     weeks[3]  = L"Wednesday";
4550     weeks[4]  = L"Thursday";
4551     weeks[5]  = L"Friday";
4552     weeks[6]  = L"Saturday";
4553     weeks[7]  = L"Sun";
4554     weeks[8]  = L"Mon";
4555     weeks[9]  = L"Tue";
4556     weeks[10] = L"Wed";
4557     weeks[11] = L"Thu";
4558     weeks[12] = L"Fri";
4559     weeks[13] = L"Sat";
4560     return weeks;
4561 }
4562 
4563 template <>
4564 const string*
__weeks() const4565 __time_get_c_storage<char>::__weeks() const
4566 {
4567     static const string* weeks = init_weeks();
4568     return weeks;
4569 }
4570 
4571 template <>
4572 const wstring*
__weeks() const4573 __time_get_c_storage<wchar_t>::__weeks() const
4574 {
4575     static const wstring* weeks = init_wweeks();
4576     return weeks;
4577 }
4578 
4579 static
4580 string*
init_months()4581 init_months()
4582 {
4583     static string months[24];
4584     months[0]  = "January";
4585     months[1]  = "February";
4586     months[2]  = "March";
4587     months[3]  = "April";
4588     months[4]  = "May";
4589     months[5]  = "June";
4590     months[6]  = "July";
4591     months[7]  = "August";
4592     months[8]  = "September";
4593     months[9]  = "October";
4594     months[10] = "November";
4595     months[11] = "December";
4596     months[12] = "Jan";
4597     months[13] = "Feb";
4598     months[14] = "Mar";
4599     months[15] = "Apr";
4600     months[16] = "May";
4601     months[17] = "Jun";
4602     months[18] = "Jul";
4603     months[19] = "Aug";
4604     months[20] = "Sep";
4605     months[21] = "Oct";
4606     months[22] = "Nov";
4607     months[23] = "Dec";
4608     return months;
4609 }
4610 
4611 static
4612 wstring*
init_wmonths()4613 init_wmonths()
4614 {
4615     static wstring months[24];
4616     months[0]  = L"January";
4617     months[1]  = L"February";
4618     months[2]  = L"March";
4619     months[3]  = L"April";
4620     months[4]  = L"May";
4621     months[5]  = L"June";
4622     months[6]  = L"July";
4623     months[7]  = L"August";
4624     months[8]  = L"September";
4625     months[9]  = L"October";
4626     months[10] = L"November";
4627     months[11] = L"December";
4628     months[12] = L"Jan";
4629     months[13] = L"Feb";
4630     months[14] = L"Mar";
4631     months[15] = L"Apr";
4632     months[16] = L"May";
4633     months[17] = L"Jun";
4634     months[18] = L"Jul";
4635     months[19] = L"Aug";
4636     months[20] = L"Sep";
4637     months[21] = L"Oct";
4638     months[22] = L"Nov";
4639     months[23] = L"Dec";
4640     return months;
4641 }
4642 
4643 template <>
4644 const string*
__months() const4645 __time_get_c_storage<char>::__months() const
4646 {
4647     static const string* months = init_months();
4648     return months;
4649 }
4650 
4651 template <>
4652 const wstring*
__months() const4653 __time_get_c_storage<wchar_t>::__months() const
4654 {
4655     static const wstring* months = init_wmonths();
4656     return months;
4657 }
4658 
4659 static
4660 string*
init_am_pm()4661 init_am_pm()
4662 {
4663     static string am_pm[2];
4664     am_pm[0]  = "AM";
4665     am_pm[1]  = "PM";
4666     return am_pm;
4667 }
4668 
4669 static
4670 wstring*
init_wam_pm()4671 init_wam_pm()
4672 {
4673     static wstring am_pm[2];
4674     am_pm[0]  = L"AM";
4675     am_pm[1]  = L"PM";
4676     return am_pm;
4677 }
4678 
4679 template <>
4680 const string*
__am_pm() const4681 __time_get_c_storage<char>::__am_pm() const
4682 {
4683     static const string* am_pm = init_am_pm();
4684     return am_pm;
4685 }
4686 
4687 template <>
4688 const wstring*
__am_pm() const4689 __time_get_c_storage<wchar_t>::__am_pm() const
4690 {
4691     static const wstring* am_pm = init_wam_pm();
4692     return am_pm;
4693 }
4694 
4695 template <>
4696 const string&
__x() const4697 __time_get_c_storage<char>::__x() const
4698 {
4699     static string s("%m/%d/%y");
4700     return s;
4701 }
4702 
4703 template <>
4704 const wstring&
__x() const4705 __time_get_c_storage<wchar_t>::__x() const
4706 {
4707     static wstring s(L"%m/%d/%y");
4708     return s;
4709 }
4710 
4711 template <>
4712 const string&
__X() const4713 __time_get_c_storage<char>::__X() const
4714 {
4715     static string s("%H:%M:%S");
4716     return s;
4717 }
4718 
4719 template <>
4720 const wstring&
__X() const4721 __time_get_c_storage<wchar_t>::__X() const
4722 {
4723     static wstring s(L"%H:%M:%S");
4724     return s;
4725 }
4726 
4727 template <>
4728 const string&
__c() const4729 __time_get_c_storage<char>::__c() const
4730 {
4731     static string s("%a %b %d %H:%M:%S %Y");
4732     return s;
4733 }
4734 
4735 template <>
4736 const wstring&
__c() const4737 __time_get_c_storage<wchar_t>::__c() const
4738 {
4739     static wstring s(L"%a %b %d %H:%M:%S %Y");
4740     return s;
4741 }
4742 
4743 template <>
4744 const string&
__r() const4745 __time_get_c_storage<char>::__r() const
4746 {
4747     static string s("%I:%M:%S %p");
4748     return s;
4749 }
4750 
4751 template <>
4752 const wstring&
__r() const4753 __time_get_c_storage<wchar_t>::__r() const
4754 {
4755     static wstring s(L"%I:%M:%S %p");
4756     return s;
4757 }
4758 
4759 // time_get_byname
4760 
__time_get(const char * nm)4761 __time_get::__time_get(const char* nm)
4762     : __loc_(newlocale(LC_ALL_MASK, nm, 0))
4763 {
4764     if (__loc_ == 0)
4765         __throw_runtime_error("time_get_byname"
4766                             " failed to construct for " + string(nm));
4767 }
4768 
__time_get(const string & nm)4769 __time_get::__time_get(const string& nm)
4770     : __loc_(newlocale(LC_ALL_MASK, nm.c_str(), 0))
4771 {
4772     if (__loc_ == 0)
4773         __throw_runtime_error("time_get_byname"
4774                             " failed to construct for " + nm);
4775 }
4776 
~__time_get()4777 __time_get::~__time_get()
4778 {
4779     freelocale(__loc_);
4780 }
4781 #if defined(__clang__)
4782 #pragma clang diagnostic ignored "-Wmissing-field-initializers"
4783 #endif
4784 #if defined(__GNUG__)
4785 #pragma GCC   diagnostic ignored "-Wmissing-field-initializers"
4786 #endif
4787 
4788 template <>
4789 string
__analyze(char fmt,const ctype<char> & ct)4790 __time_get_storage<char>::__analyze(char fmt, const ctype<char>& ct)
4791 {
4792     tm t = {0};
4793     t.tm_sec = 59;
4794     t.tm_min = 55;
4795     t.tm_hour = 23;
4796     t.tm_mday = 31;
4797     t.tm_mon = 11;
4798     t.tm_year = 161;
4799     t.tm_wday = 6;
4800     t.tm_yday = 364;
4801     t.tm_isdst = -1;
4802     char buf[100];
4803     char f[3] = {0};
4804     f[0] = '%';
4805     f[1] = fmt;
4806     size_t n = strftime_l(buf, countof(buf), f, &t, __loc_);
4807     char* bb = buf;
4808     char* be = buf + n;
4809     string result;
4810     while (bb != be)
4811     {
4812         if (ct.is(ctype_base::space, *bb))
4813         {
4814             result.push_back(' ');
4815             for (++bb; bb != be && ct.is(ctype_base::space, *bb); ++bb)
4816                 ;
4817             continue;
4818         }
4819         char* w = bb;
4820         ios_base::iostate err = ios_base::goodbit;
4821         ptrdiff_t i = __scan_keyword(w, be, this->__weeks_, this->__weeks_+14,
4822                                ct, err, false)
4823                                - this->__weeks_;
4824         if (i < 14)
4825         {
4826             result.push_back('%');
4827             if (i < 7)
4828                 result.push_back('A');
4829             else
4830                 result.push_back('a');
4831             bb = w;
4832             continue;
4833         }
4834         w = bb;
4835         i = __scan_keyword(w, be, this->__months_, this->__months_+24,
4836                            ct, err, false)
4837                            - this->__months_;
4838         if (i < 24)
4839         {
4840             result.push_back('%');
4841             if (i < 12)
4842                 result.push_back('B');
4843             else
4844                 result.push_back('b');
4845             if (fmt == 'x' && ct.is(ctype_base::digit, this->__months_[i][0]))
4846                 result.back() = 'm';
4847             bb = w;
4848             continue;
4849         }
4850         if (this->__am_pm_[0].size() + this->__am_pm_[1].size() > 0)
4851         {
4852             w = bb;
4853             i = __scan_keyword(w, be, this->__am_pm_, this->__am_pm_+2,
4854                                ct, err, false) - this->__am_pm_;
4855             if (i < 2)
4856             {
4857                 result.push_back('%');
4858                 result.push_back('p');
4859                 bb = w;
4860                 continue;
4861             }
4862         }
4863         w = bb;
4864         if (ct.is(ctype_base::digit, *bb))
4865         {
4866             switch(__get_up_to_n_digits(bb, be, err, ct, 4))
4867             {
4868             case 6:
4869                 result.push_back('%');
4870                 result.push_back('w');
4871                 break;
4872             case 7:
4873                 result.push_back('%');
4874                 result.push_back('u');
4875                 break;
4876             case 11:
4877                 result.push_back('%');
4878                 result.push_back('I');
4879                 break;
4880             case 12:
4881                 result.push_back('%');
4882                 result.push_back('m');
4883                 break;
4884             case 23:
4885                 result.push_back('%');
4886                 result.push_back('H');
4887                 break;
4888             case 31:
4889                 result.push_back('%');
4890                 result.push_back('d');
4891                 break;
4892             case 55:
4893                 result.push_back('%');
4894                 result.push_back('M');
4895                 break;
4896             case 59:
4897                 result.push_back('%');
4898                 result.push_back('S');
4899                 break;
4900             case 61:
4901                 result.push_back('%');
4902                 result.push_back('y');
4903                 break;
4904             case 364:
4905                 result.push_back('%');
4906                 result.push_back('j');
4907                 break;
4908             case 2061:
4909                 result.push_back('%');
4910                 result.push_back('Y');
4911                 break;
4912             default:
4913                 for (; w != bb; ++w)
4914                     result.push_back(*w);
4915                 break;
4916             }
4917             continue;
4918         }
4919         if (*bb == '%')
4920         {
4921             result.push_back('%');
4922             result.push_back('%');
4923             ++bb;
4924             continue;
4925         }
4926         result.push_back(*bb);
4927         ++bb;
4928     }
4929     return result;
4930 }
4931 
4932 #if defined(__clang__)
4933 #pragma clang diagnostic ignored "-Wmissing-braces"
4934 #endif
4935 
4936 template <>
4937 wstring
__analyze(char fmt,const ctype<wchar_t> & ct)4938 __time_get_storage<wchar_t>::__analyze(char fmt, const ctype<wchar_t>& ct)
4939 {
4940     tm t = {0};
4941     t.tm_sec = 59;
4942     t.tm_min = 55;
4943     t.tm_hour = 23;
4944     t.tm_mday = 31;
4945     t.tm_mon = 11;
4946     t.tm_year = 161;
4947     t.tm_wday = 6;
4948     t.tm_yday = 364;
4949     t.tm_isdst = -1;
4950     char buf[100];
4951     char f[3] = {0};
4952     f[0] = '%';
4953     f[1] = fmt;
4954     strftime_l(buf, countof(buf), f, &t, __loc_);
4955     wchar_t wbuf[100];
4956     wchar_t* wbb = wbuf;
4957     mbstate_t mb = {0};
4958     const char* bb = buf;
4959     size_t j = __libcpp_mbsrtowcs_l( wbb, &bb, countof(wbuf), &mb, __loc_);
4960     if (j == size_t(-1))
4961         __throw_runtime_error("locale not supported");
4962     wchar_t* wbe = wbb + j;
4963     wstring result;
4964     while (wbb != wbe)
4965     {
4966         if (ct.is(ctype_base::space, *wbb))
4967         {
4968             result.push_back(L' ');
4969             for (++wbb; wbb != wbe && ct.is(ctype_base::space, *wbb); ++wbb)
4970                 ;
4971             continue;
4972         }
4973         wchar_t* w = wbb;
4974         ios_base::iostate err = ios_base::goodbit;
4975         ptrdiff_t i = __scan_keyword(w, wbe, this->__weeks_, this->__weeks_+14,
4976                                ct, err, false)
4977                                - this->__weeks_;
4978         if (i < 14)
4979         {
4980             result.push_back(L'%');
4981             if (i < 7)
4982                 result.push_back(L'A');
4983             else
4984                 result.push_back(L'a');
4985             wbb = w;
4986             continue;
4987         }
4988         w = wbb;
4989         i = __scan_keyword(w, wbe, this->__months_, this->__months_+24,
4990                            ct, err, false)
4991                            - this->__months_;
4992         if (i < 24)
4993         {
4994             result.push_back(L'%');
4995             if (i < 12)
4996                 result.push_back(L'B');
4997             else
4998                 result.push_back(L'b');
4999             if (fmt == 'x' && ct.is(ctype_base::digit, this->__months_[i][0]))
5000                 result.back() = L'm';
5001             wbb = w;
5002             continue;
5003         }
5004         if (this->__am_pm_[0].size() + this->__am_pm_[1].size() > 0)
5005         {
5006             w = wbb;
5007             i = __scan_keyword(w, wbe, this->__am_pm_, this->__am_pm_+2,
5008                                ct, err, false) - this->__am_pm_;
5009             if (i < 2)
5010             {
5011                 result.push_back(L'%');
5012                 result.push_back(L'p');
5013                 wbb = w;
5014                 continue;
5015             }
5016         }
5017         w = wbb;
5018         if (ct.is(ctype_base::digit, *wbb))
5019         {
5020             switch(__get_up_to_n_digits(wbb, wbe, err, ct, 4))
5021             {
5022             case 6:
5023                 result.push_back(L'%');
5024                 result.push_back(L'w');
5025                 break;
5026             case 7:
5027                 result.push_back(L'%');
5028                 result.push_back(L'u');
5029                 break;
5030             case 11:
5031                 result.push_back(L'%');
5032                 result.push_back(L'I');
5033                 break;
5034             case 12:
5035                 result.push_back(L'%');
5036                 result.push_back(L'm');
5037                 break;
5038             case 23:
5039                 result.push_back(L'%');
5040                 result.push_back(L'H');
5041                 break;
5042             case 31:
5043                 result.push_back(L'%');
5044                 result.push_back(L'd');
5045                 break;
5046             case 55:
5047                 result.push_back(L'%');
5048                 result.push_back(L'M');
5049                 break;
5050             case 59:
5051                 result.push_back(L'%');
5052                 result.push_back(L'S');
5053                 break;
5054             case 61:
5055                 result.push_back(L'%');
5056                 result.push_back(L'y');
5057                 break;
5058             case 364:
5059                 result.push_back(L'%');
5060                 result.push_back(L'j');
5061                 break;
5062             case 2061:
5063                 result.push_back(L'%');
5064                 result.push_back(L'Y');
5065                 break;
5066             default:
5067                 for (; w != wbb; ++w)
5068                     result.push_back(*w);
5069                 break;
5070             }
5071             continue;
5072         }
5073         if (ct.narrow(*wbb, 0) == '%')
5074         {
5075             result.push_back(L'%');
5076             result.push_back(L'%');
5077             ++wbb;
5078             continue;
5079         }
5080         result.push_back(*wbb);
5081         ++wbb;
5082     }
5083     return result;
5084 }
5085 
5086 template <>
5087 void
init(const ctype<char> & ct)5088 __time_get_storage<char>::init(const ctype<char>& ct)
5089 {
5090     tm t = {0};
5091     char buf[100];
5092     // __weeks_
5093     for (int i = 0; i < 7; ++i)
5094     {
5095         t.tm_wday = i;
5096         strftime_l(buf, countof(buf), "%A", &t, __loc_);
5097         __weeks_[i] = buf;
5098         strftime_l(buf, countof(buf), "%a", &t, __loc_);
5099         __weeks_[i+7] = buf;
5100     }
5101     // __months_
5102     for (int i = 0; i < 12; ++i)
5103     {
5104         t.tm_mon = i;
5105         strftime_l(buf, countof(buf), "%B", &t, __loc_);
5106         __months_[i] = buf;
5107         strftime_l(buf, countof(buf), "%b", &t, __loc_);
5108         __months_[i+12] = buf;
5109     }
5110     // __am_pm_
5111     t.tm_hour = 1;
5112     strftime_l(buf, countof(buf), "%p", &t, __loc_);
5113     __am_pm_[0] = buf;
5114     t.tm_hour = 13;
5115     strftime_l(buf, countof(buf), "%p", &t, __loc_);
5116     __am_pm_[1] = buf;
5117     __c_ = __analyze('c', ct);
5118     __r_ = __analyze('r', ct);
5119     __x_ = __analyze('x', ct);
5120     __X_ = __analyze('X', ct);
5121 }
5122 
5123 template <>
5124 void
init(const ctype<wchar_t> & ct)5125 __time_get_storage<wchar_t>::init(const ctype<wchar_t>& ct)
5126 {
5127     tm t = {0};
5128     char buf[100];
5129     wchar_t wbuf[100];
5130     wchar_t* wbe;
5131     mbstate_t mb = {0};
5132     // __weeks_
5133     for (int i = 0; i < 7; ++i)
5134     {
5135         t.tm_wday = i;
5136         strftime_l(buf, countof(buf), "%A", &t, __loc_);
5137         mb = mbstate_t();
5138         const char* bb = buf;
5139         size_t j = __libcpp_mbsrtowcs_l(wbuf, &bb, countof(wbuf), &mb, __loc_);
5140         if (j == size_t(-1))
5141             __throw_runtime_error("locale not supported");
5142         wbe = wbuf + j;
5143         __weeks_[i].assign(wbuf, wbe);
5144         strftime_l(buf, countof(buf), "%a", &t, __loc_);
5145         mb = mbstate_t();
5146         bb = buf;
5147         j = __libcpp_mbsrtowcs_l(wbuf, &bb, countof(wbuf), &mb, __loc_);
5148         if (j == size_t(-1))
5149             __throw_runtime_error("locale not supported");
5150         wbe = wbuf + j;
5151         __weeks_[i+7].assign(wbuf, wbe);
5152     }
5153     // __months_
5154     for (int i = 0; i < 12; ++i)
5155     {
5156         t.tm_mon = i;
5157         strftime_l(buf, countof(buf), "%B", &t, __loc_);
5158         mb = mbstate_t();
5159         const char* bb = buf;
5160         size_t j = __libcpp_mbsrtowcs_l(wbuf, &bb, countof(wbuf), &mb, __loc_);
5161         if (j == size_t(-1))
5162             __throw_runtime_error("locale not supported");
5163         wbe = wbuf + j;
5164         __months_[i].assign(wbuf, wbe);
5165         strftime_l(buf, countof(buf), "%b", &t, __loc_);
5166         mb = mbstate_t();
5167         bb = buf;
5168         j = __libcpp_mbsrtowcs_l(wbuf, &bb, countof(wbuf), &mb, __loc_);
5169         if (j == size_t(-1))
5170             __throw_runtime_error("locale not supported");
5171         wbe = wbuf + j;
5172         __months_[i+12].assign(wbuf, wbe);
5173     }
5174     // __am_pm_
5175     t.tm_hour = 1;
5176     strftime_l(buf, countof(buf), "%p", &t, __loc_);
5177     mb = mbstate_t();
5178     const char* bb = buf;
5179     size_t j = __libcpp_mbsrtowcs_l(wbuf, &bb, countof(wbuf), &mb, __loc_);
5180     if (j == size_t(-1))
5181         __throw_runtime_error("locale not supported");
5182     wbe = wbuf + j;
5183     __am_pm_[0].assign(wbuf, wbe);
5184     t.tm_hour = 13;
5185     strftime_l(buf, countof(buf), "%p", &t, __loc_);
5186     mb = mbstate_t();
5187     bb = buf;
5188     j = __libcpp_mbsrtowcs_l(wbuf, &bb, countof(wbuf), &mb, __loc_);
5189     if (j == size_t(-1))
5190         __throw_runtime_error("locale not supported");
5191     wbe = wbuf + j;
5192     __am_pm_[1].assign(wbuf, wbe);
5193     __c_ = __analyze('c', ct);
5194     __r_ = __analyze('r', ct);
5195     __x_ = __analyze('x', ct);
5196     __X_ = __analyze('X', ct);
5197 }
5198 
5199 template <class CharT>
5200 struct _LIBCPP_HIDDEN __time_get_temp
5201     : public ctype_byname<CharT>
5202 {
__time_get_temp__time_get_temp5203     explicit __time_get_temp(const char* nm)
5204         : ctype_byname<CharT>(nm, 1) {}
__time_get_temp__time_get_temp5205     explicit __time_get_temp(const string& nm)
5206         : ctype_byname<CharT>(nm, 1) {}
5207 };
5208 
5209 template <>
__time_get_storage(const char * __nm)5210 __time_get_storage<char>::__time_get_storage(const char* __nm)
5211     : __time_get(__nm)
5212 {
5213     const __time_get_temp<char> ct(__nm);
5214     init(ct);
5215 }
5216 
5217 template <>
__time_get_storage(const string & __nm)5218 __time_get_storage<char>::__time_get_storage(const string& __nm)
5219     : __time_get(__nm)
5220 {
5221     const __time_get_temp<char> ct(__nm);
5222     init(ct);
5223 }
5224 
5225 template <>
__time_get_storage(const char * __nm)5226 __time_get_storage<wchar_t>::__time_get_storage(const char* __nm)
5227     : __time_get(__nm)
5228 {
5229     const __time_get_temp<wchar_t> ct(__nm);
5230     init(ct);
5231 }
5232 
5233 template <>
__time_get_storage(const string & __nm)5234 __time_get_storage<wchar_t>::__time_get_storage(const string& __nm)
5235     : __time_get(__nm)
5236 {
5237     const __time_get_temp<wchar_t> ct(__nm);
5238     init(ct);
5239 }
5240 
5241 template <>
5242 time_base::dateorder
__do_date_order() const5243 __time_get_storage<char>::__do_date_order() const
5244 {
5245     unsigned i;
5246     for (i = 0; i < __x_.size(); ++i)
5247         if (__x_[i] == '%')
5248             break;
5249     ++i;
5250     switch (__x_[i])
5251     {
5252     case 'y':
5253     case 'Y':
5254         for (++i; i < __x_.size(); ++i)
5255             if (__x_[i] == '%')
5256                 break;
5257         if (i == __x_.size())
5258             break;
5259         ++i;
5260         switch (__x_[i])
5261         {
5262         case 'm':
5263             for (++i; i < __x_.size(); ++i)
5264                 if (__x_[i] == '%')
5265                     break;
5266             if (i == __x_.size())
5267                 break;
5268             ++i;
5269             if (__x_[i] == 'd')
5270                 return time_base::ymd;
5271             break;
5272         case 'd':
5273             for (++i; i < __x_.size(); ++i)
5274                 if (__x_[i] == '%')
5275                     break;
5276             if (i == __x_.size())
5277                 break;
5278             ++i;
5279             if (__x_[i] == 'm')
5280                 return time_base::ydm;
5281             break;
5282         }
5283         break;
5284     case 'm':
5285         for (++i; i < __x_.size(); ++i)
5286             if (__x_[i] == '%')
5287                 break;
5288         if (i == __x_.size())
5289             break;
5290         ++i;
5291         if (__x_[i] == 'd')
5292         {
5293             for (++i; i < __x_.size(); ++i)
5294                 if (__x_[i] == '%')
5295                     break;
5296             if (i == __x_.size())
5297                 break;
5298             ++i;
5299             if (__x_[i] == 'y' || __x_[i] == 'Y')
5300                 return time_base::mdy;
5301             break;
5302         }
5303         break;
5304     case 'd':
5305         for (++i; i < __x_.size(); ++i)
5306             if (__x_[i] == '%')
5307                 break;
5308         if (i == __x_.size())
5309             break;
5310         ++i;
5311         if (__x_[i] == 'm')
5312         {
5313             for (++i; i < __x_.size(); ++i)
5314                 if (__x_[i] == '%')
5315                     break;
5316             if (i == __x_.size())
5317                 break;
5318             ++i;
5319             if (__x_[i] == 'y' || __x_[i] == 'Y')
5320                 return time_base::dmy;
5321             break;
5322         }
5323         break;
5324     }
5325     return time_base::no_order;
5326 }
5327 
5328 template <>
5329 time_base::dateorder
__do_date_order() const5330 __time_get_storage<wchar_t>::__do_date_order() const
5331 {
5332     unsigned i;
5333     for (i = 0; i < __x_.size(); ++i)
5334         if (__x_[i] == L'%')
5335             break;
5336     ++i;
5337     switch (__x_[i])
5338     {
5339     case L'y':
5340     case L'Y':
5341         for (++i; i < __x_.size(); ++i)
5342             if (__x_[i] == L'%')
5343                 break;
5344         if (i == __x_.size())
5345             break;
5346         ++i;
5347         switch (__x_[i])
5348         {
5349         case L'm':
5350             for (++i; i < __x_.size(); ++i)
5351                 if (__x_[i] == L'%')
5352                     break;
5353             if (i == __x_.size())
5354                 break;
5355             ++i;
5356             if (__x_[i] == L'd')
5357                 return time_base::ymd;
5358             break;
5359         case L'd':
5360             for (++i; i < __x_.size(); ++i)
5361                 if (__x_[i] == L'%')
5362                     break;
5363             if (i == __x_.size())
5364                 break;
5365             ++i;
5366             if (__x_[i] == L'm')
5367                 return time_base::ydm;
5368             break;
5369         }
5370         break;
5371     case L'm':
5372         for (++i; i < __x_.size(); ++i)
5373             if (__x_[i] == L'%')
5374                 break;
5375         if (i == __x_.size())
5376             break;
5377         ++i;
5378         if (__x_[i] == L'd')
5379         {
5380             for (++i; i < __x_.size(); ++i)
5381                 if (__x_[i] == L'%')
5382                     break;
5383             if (i == __x_.size())
5384                 break;
5385             ++i;
5386             if (__x_[i] == L'y' || __x_[i] == L'Y')
5387                 return time_base::mdy;
5388             break;
5389         }
5390         break;
5391     case L'd':
5392         for (++i; i < __x_.size(); ++i)
5393             if (__x_[i] == L'%')
5394                 break;
5395         if (i == __x_.size())
5396             break;
5397         ++i;
5398         if (__x_[i] == L'm')
5399         {
5400             for (++i; i < __x_.size(); ++i)
5401                 if (__x_[i] == L'%')
5402                     break;
5403             if (i == __x_.size())
5404                 break;
5405             ++i;
5406             if (__x_[i] == L'y' || __x_[i] == L'Y')
5407                 return time_base::dmy;
5408             break;
5409         }
5410         break;
5411     }
5412     return time_base::no_order;
5413 }
5414 
5415 // time_put
5416 
__time_put(const char * nm)5417 __time_put::__time_put(const char* nm)
5418     : __loc_(newlocale(LC_ALL_MASK, nm, 0))
5419 {
5420     if (__loc_ == 0)
5421         __throw_runtime_error("time_put_byname"
5422                             " failed to construct for " + string(nm));
5423 }
5424 
__time_put(const string & nm)5425 __time_put::__time_put(const string& nm)
5426     : __loc_(newlocale(LC_ALL_MASK, nm.c_str(), 0))
5427 {
5428     if (__loc_ == 0)
5429         __throw_runtime_error("time_put_byname"
5430                             " failed to construct for " + nm);
5431 }
5432 
~__time_put()5433 __time_put::~__time_put()
5434 {
5435     if (__loc_ != _LIBCPP_GET_C_LOCALE)
5436         freelocale(__loc_);
5437 }
5438 
5439 void
__do_put(char * __nb,char * & __ne,const tm * __tm,char __fmt,char __mod) const5440 __time_put::__do_put(char* __nb, char*& __ne, const tm* __tm,
5441                      char __fmt, char __mod) const
5442 {
5443     char fmt[] = {'%', __fmt, __mod, 0};
5444     if (__mod != 0)
5445         swap(fmt[1], fmt[2]);
5446     size_t n = strftime_l(__nb, countof(__nb, __ne), fmt, __tm, __loc_);
5447     __ne = __nb + n;
5448 }
5449 
5450 void
__do_put(wchar_t * __wb,wchar_t * & __we,const tm * __tm,char __fmt,char __mod) const5451 __time_put::__do_put(wchar_t* __wb, wchar_t*& __we, const tm* __tm,
5452                      char __fmt, char __mod) const
5453 {
5454     char __nar[100];
5455     char* __ne = __nar + 100;
5456     __do_put(__nar, __ne, __tm, __fmt, __mod);
5457     mbstate_t mb = {0};
5458     const char* __nb = __nar;
5459     size_t j = __libcpp_mbsrtowcs_l(__wb, &__nb, countof(__wb, __we), &mb, __loc_);
5460     if (j == size_t(-1))
5461         __throw_runtime_error("locale not supported");
5462     __we = __wb + j;
5463 }
5464 
5465 // moneypunct_byname
5466 
5467 template <class charT>
5468 static
5469 void
__init_pat(money_base::pattern & pat,basic_string<charT> & __curr_symbol_,bool intl,char cs_precedes,char sep_by_space,char sign_posn,charT space_char)5470 __init_pat(money_base::pattern& pat, basic_string<charT>& __curr_symbol_,
5471            bool intl, char cs_precedes, char sep_by_space, char sign_posn,
5472            charT space_char)
5473 {
5474     const char sign = static_cast<char>(money_base::sign);
5475     const char space = static_cast<char>(money_base::space);
5476     const char none = static_cast<char>(money_base::none);
5477     const char symbol = static_cast<char>(money_base::symbol);
5478     const char value = static_cast<char>(money_base::value);
5479     const bool symbol_contains_sep = intl && __curr_symbol_.size() == 4;
5480 
5481     // Comments on case branches reflect 'C11 7.11.2.1 The localeconv
5482     // function'. "Space between sign and symbol or value" means that
5483     // if the sign is adjacent to the symbol, there's a space between
5484     // them, and otherwise there's a space between the sign and value.
5485     //
5486     // C11's localeconv specifies that the fourth character of an
5487     // international curr_symbol is used to separate the sign and
5488     // value when sep_by_space says to do so. C++ can't represent
5489     // that, so we just use a space.  When sep_by_space says to
5490     // separate the symbol and value-or-sign with a space, we rearrange the
5491     // curr_symbol to put its spacing character on the correct side of
5492     // the symbol.
5493     //
5494     // We also need to avoid adding an extra space between the sign
5495     // and value when the currency symbol is suppressed (by not
5496     // setting showbase).  We match glibc's strfmon by interpreting
5497     // sep_by_space==1 as "omit the space when the currency symbol is
5498     // absent".
5499     //
5500     // Users who want to get this right should use ICU instead.
5501 
5502     switch (cs_precedes)
5503     {
5504     case 0:  // value before curr_symbol
5505         if (symbol_contains_sep) {
5506             // Move the separator to before the symbol, to place it
5507             // between the value and symbol.
5508             rotate(__curr_symbol_.begin(), __curr_symbol_.begin() + 3,
5509                    __curr_symbol_.end());
5510         }
5511         switch (sign_posn)
5512         {
5513         case 0:  // Parentheses surround the quantity and currency symbol.
5514             pat.field[0] = sign;
5515             pat.field[1] = value;
5516             pat.field[2] = none;  // Any space appears in the symbol.
5517             pat.field[3] = symbol;
5518             switch (sep_by_space)
5519             {
5520             case 0:  // No space separates the currency symbol and value.
5521                 // This case may have changed between C99 and C11;
5522                 // assume the currency symbol matches the intention.
5523             case 2:  // Space between sign and currency or value.
5524                 // The "sign" is two parentheses, so no space here either.
5525                 return;
5526             case 1:  // Space between currency-and-sign or currency and value.
5527                 if (!symbol_contains_sep) {
5528                     // We insert the space into the symbol instead of
5529                     // setting pat.field[2]=space so that when
5530                     // showbase is not set, the space goes away too.
5531                     __curr_symbol_.insert(0, 1, space_char);
5532                 }
5533                 return;
5534             default:
5535                 break;
5536             }
5537             break;
5538         case 1:  // The sign string precedes the quantity and currency symbol.
5539             pat.field[0] = sign;
5540             pat.field[3] = symbol;
5541             switch (sep_by_space)
5542             {
5543             case 0:  // No space separates the currency symbol and value.
5544                 pat.field[1] = value;
5545                 pat.field[2] = none;
5546                 return;
5547             case 1:  // Space between currency-and-sign or currency and value.
5548                 pat.field[1] = value;
5549                 pat.field[2] = none;
5550                 if (!symbol_contains_sep) {
5551                     // We insert the space into the symbol instead of
5552                     // setting pat.field[2]=space so that when
5553                     // showbase is not set, the space goes away too.
5554                     __curr_symbol_.insert(0, 1, space_char);
5555                 }
5556                 return;
5557             case 2:  // Space between sign and currency or value.
5558                 pat.field[1] = space;
5559                 pat.field[2] = value;
5560                 if (symbol_contains_sep) {
5561                     // Remove the separator from the symbol, since it
5562                     // has already appeared after the sign.
5563                     __curr_symbol_.erase(__curr_symbol_.begin());
5564                 }
5565                 return;
5566             default:
5567                 break;
5568             }
5569             break;
5570         case 2:  // The sign string succeeds the quantity and currency symbol.
5571             pat.field[0] = value;
5572             pat.field[3] = sign;
5573             switch (sep_by_space)
5574             {
5575             case 0:  // No space separates the currency symbol and value.
5576                 pat.field[1] = none;
5577                 pat.field[2] = symbol;
5578                 return;
5579             case 1:  // Space between currency-and-sign or currency and value.
5580                 if (!symbol_contains_sep) {
5581                     // We insert the space into the symbol instead of
5582                     // setting pat.field[1]=space so that when
5583                     // showbase is not set, the space goes away too.
5584                     __curr_symbol_.insert(0, 1, space_char);
5585                 }
5586                 pat.field[1] = none;
5587                 pat.field[2] = symbol;
5588                 return;
5589             case 2:  // Space between sign and currency or value.
5590                 pat.field[1] = symbol;
5591                 pat.field[2] = space;
5592                 if (symbol_contains_sep) {
5593                     // Remove the separator from the symbol, since it
5594                     // should not be removed if showbase is absent.
5595                     __curr_symbol_.erase(__curr_symbol_.begin());
5596                 }
5597                 return;
5598             default:
5599                 break;
5600             }
5601             break;
5602         case 3:  // The sign string immediately precedes the currency symbol.
5603             pat.field[0] = value;
5604             pat.field[3] = symbol;
5605             switch (sep_by_space)
5606             {
5607             case 0:  // No space separates the currency symbol and value.
5608                 pat.field[1] = none;
5609                 pat.field[2] = sign;
5610                 return;
5611             case 1:  // Space between currency-and-sign or currency and value.
5612                 pat.field[1] = space;
5613                 pat.field[2] = sign;
5614                 if (symbol_contains_sep) {
5615                     // Remove the separator from the symbol, since it
5616                     // has already appeared before the sign.
5617                     __curr_symbol_.erase(__curr_symbol_.begin());
5618                 }
5619                 return;
5620             case 2:  // Space between sign and currency or value.
5621                 pat.field[1] = sign;
5622                 pat.field[2] = none;
5623                 if (!symbol_contains_sep) {
5624                     // We insert the space into the symbol instead of
5625                     // setting pat.field[2]=space so that when
5626                     // showbase is not set, the space goes away too.
5627                     __curr_symbol_.insert(0, 1, space_char);
5628                 }
5629                 return;
5630             default:
5631                 break;
5632             }
5633             break;
5634         case 4:  // The sign string immediately succeeds the currency symbol.
5635             pat.field[0] = value;
5636             pat.field[3] = sign;
5637             switch (sep_by_space)
5638             {
5639             case 0:  // No space separates the currency symbol and value.
5640                 pat.field[1] = none;
5641                 pat.field[2] = symbol;
5642                 return;
5643             case 1:  // Space between currency-and-sign or currency and value.
5644                 pat.field[1] = none;
5645                 pat.field[2] = symbol;
5646                 if (!symbol_contains_sep) {
5647                     // We insert the space into the symbol instead of
5648                     // setting pat.field[1]=space so that when
5649                     // showbase is not set, the space goes away too.
5650                     __curr_symbol_.insert(0, 1, space_char);
5651                 }
5652                 return;
5653             case 2:  // Space between sign and currency or value.
5654                 pat.field[1] = symbol;
5655                 pat.field[2] = space;
5656                 if (symbol_contains_sep) {
5657                     // Remove the separator from the symbol, since it
5658                     // should not disappear when showbase is absent.
5659                     __curr_symbol_.erase(__curr_symbol_.begin());
5660                 }
5661                 return;
5662             default:
5663                 break;
5664             }
5665             break;
5666         default:
5667             break;
5668         }
5669         break;
5670     case 1:  // curr_symbol before value
5671         switch (sign_posn)
5672         {
5673         case 0:  // Parentheses surround the quantity and currency symbol.
5674             pat.field[0] = sign;
5675             pat.field[1] = symbol;
5676             pat.field[2] = none;  // Any space appears in the symbol.
5677             pat.field[3] = value;
5678             switch (sep_by_space)
5679             {
5680             case 0:  // No space separates the currency symbol and value.
5681                 // This case may have changed between C99 and C11;
5682                 // assume the currency symbol matches the intention.
5683             case 2:  // Space between sign and currency or value.
5684                 // The "sign" is two parentheses, so no space here either.
5685                 return;
5686             case 1:  // Space between currency-and-sign or currency and value.
5687                 if (!symbol_contains_sep) {
5688                     // We insert the space into the symbol instead of
5689                     // setting pat.field[2]=space so that when
5690                     // showbase is not set, the space goes away too.
5691                     __curr_symbol_.insert(0, 1, space_char);
5692                 }
5693                 return;
5694             default:
5695                 break;
5696             }
5697             break;
5698         case 1:  // The sign string precedes the quantity and currency symbol.
5699             pat.field[0] = sign;
5700             pat.field[3] = value;
5701             switch (sep_by_space)
5702             {
5703             case 0:  // No space separates the currency symbol and value.
5704                 pat.field[1] = symbol;
5705                 pat.field[2] = none;
5706                 return;
5707             case 1:  // Space between currency-and-sign or currency and value.
5708                 pat.field[1] = symbol;
5709                 pat.field[2] = none;
5710                 if (!symbol_contains_sep) {
5711                     // We insert the space into the symbol instead of
5712                     // setting pat.field[2]=space so that when
5713                     // showbase is not set, the space goes away too.
5714                     __curr_symbol_.push_back(space_char);
5715                 }
5716                 return;
5717             case 2:  // Space between sign and currency or value.
5718                 pat.field[1] = space;
5719                 pat.field[2] = symbol;
5720                 if (symbol_contains_sep) {
5721                     // Remove the separator from the symbol, since it
5722                     // has already appeared after the sign.
5723                     __curr_symbol_.pop_back();
5724                 }
5725                 return;
5726             default:
5727                 break;
5728             }
5729             break;
5730         case 2:  // The sign string succeeds the quantity and currency symbol.
5731             pat.field[0] = symbol;
5732             pat.field[3] = sign;
5733             switch (sep_by_space)
5734             {
5735             case 0:  // No space separates the currency symbol and value.
5736                 pat.field[1] = none;
5737                 pat.field[2] = value;
5738                 return;
5739             case 1:  // Space between currency-and-sign or currency and value.
5740                 pat.field[1] = none;
5741                 pat.field[2] = value;
5742                 if (!symbol_contains_sep) {
5743                     // We insert the space into the symbol instead of
5744                     // setting pat.field[1]=space so that when
5745                     // showbase is not set, the space goes away too.
5746                     __curr_symbol_.push_back(space_char);
5747                 }
5748                 return;
5749             case 2:  // Space between sign and currency or value.
5750                 pat.field[1] = value;
5751                 pat.field[2] = space;
5752                 if (symbol_contains_sep) {
5753                     // Remove the separator from the symbol, since it
5754                     // will appear before the sign.
5755                     __curr_symbol_.pop_back();
5756                 }
5757                 return;
5758             default:
5759                 break;
5760             }
5761             break;
5762         case 3:  // The sign string immediately precedes the currency symbol.
5763             pat.field[0] = sign;
5764             pat.field[3] = value;
5765             switch (sep_by_space)
5766             {
5767             case 0:  // No space separates the currency symbol and value.
5768                 pat.field[1] = symbol;
5769                 pat.field[2] = none;
5770                 return;
5771             case 1:  // Space between currency-and-sign or currency and value.
5772                 pat.field[1] = symbol;
5773                 pat.field[2] = none;
5774                 if (!symbol_contains_sep) {
5775                     // We insert the space into the symbol instead of
5776                     // setting pat.field[2]=space so that when
5777                     // showbase is not set, the space goes away too.
5778                     __curr_symbol_.push_back(space_char);
5779                 }
5780                 return;
5781             case 2:  // Space between sign and currency or value.
5782                 pat.field[1] = space;
5783                 pat.field[2] = symbol;
5784                 if (symbol_contains_sep) {
5785                     // Remove the separator from the symbol, since it
5786                     // has already appeared after the sign.
5787                     __curr_symbol_.pop_back();
5788                 }
5789                 return;
5790             default:
5791                 break;
5792             }
5793             break;
5794         case 4:  // The sign string immediately succeeds the currency symbol.
5795             pat.field[0] = symbol;
5796             pat.field[3] = value;
5797             switch (sep_by_space)
5798             {
5799             case 0:  // No space separates the currency symbol and value.
5800                 pat.field[1] = sign;
5801                 pat.field[2] = none;
5802                 return;
5803             case 1:  // Space between currency-and-sign or currency and value.
5804                 pat.field[1] = sign;
5805                 pat.field[2] = space;
5806                 if (symbol_contains_sep) {
5807                     // Remove the separator from the symbol, since it
5808                     // should not disappear when showbase is absent.
5809                     __curr_symbol_.pop_back();
5810                 }
5811                 return;
5812             case 2:  // Space between sign and currency or value.
5813                 pat.field[1] = none;
5814                 pat.field[2] = sign;
5815                 if (!symbol_contains_sep) {
5816                     // We insert the space into the symbol instead of
5817                     // setting pat.field[1]=space so that when
5818                     // showbase is not set, the space goes away too.
5819                     __curr_symbol_.push_back(space_char);
5820                 }
5821                 return;
5822            default:
5823                 break;
5824             }
5825             break;
5826         default:
5827             break;
5828         }
5829         break;
5830     default:
5831         break;
5832     }
5833     pat.field[0] = symbol;
5834     pat.field[1] = sign;
5835     pat.field[2] = none;
5836     pat.field[3] = value;
5837 }
5838 
5839 template<>
5840 void
init(const char * nm)5841 moneypunct_byname<char, false>::init(const char* nm)
5842 {
5843     typedef moneypunct<char, false> base;
5844     __libcpp_unique_locale loc(nm);
5845     if (!loc)
5846         __throw_runtime_error("moneypunct_byname"
5847                             " failed to construct for " + string(nm));
5848 
5849     lconv* lc = __libcpp_localeconv_l(loc.get());
5850     if (!checked_string_to_char_convert(__decimal_point_,
5851                                         lc->mon_decimal_point,
5852                                         loc.get()))
5853       __decimal_point_ = base::do_decimal_point();
5854     if (!checked_string_to_char_convert(__thousands_sep_,
5855                                         lc->mon_thousands_sep,
5856                                         loc.get()))
5857       __thousands_sep_ = base::do_thousands_sep();
5858 
5859     __grouping_ = lc->mon_grouping;
5860     __curr_symbol_ = lc->currency_symbol;
5861     if (lc->frac_digits != CHAR_MAX)
5862         __frac_digits_ = lc->frac_digits;
5863     else
5864         __frac_digits_ = base::do_frac_digits();
5865     if (lc->p_sign_posn == 0)
5866         __positive_sign_ = "()";
5867     else
5868         __positive_sign_ = lc->positive_sign;
5869     if (lc->n_sign_posn == 0)
5870         __negative_sign_ = "()";
5871     else
5872         __negative_sign_ = lc->negative_sign;
5873     // Assume the positive and negative formats will want spaces in
5874     // the same places in curr_symbol since there's no way to
5875     // represent anything else.
5876     string_type __dummy_curr_symbol = __curr_symbol_;
5877     __init_pat(__pos_format_, __dummy_curr_symbol, false,
5878                lc->p_cs_precedes, lc->p_sep_by_space, lc->p_sign_posn, ' ');
5879     __init_pat(__neg_format_, __curr_symbol_, false,
5880                lc->n_cs_precedes, lc->n_sep_by_space, lc->n_sign_posn, ' ');
5881 }
5882 
5883 template<>
5884 void
init(const char * nm)5885 moneypunct_byname<char, true>::init(const char* nm)
5886 {
5887     typedef moneypunct<char, true> base;
5888     __libcpp_unique_locale loc(nm);
5889     if (!loc)
5890         __throw_runtime_error("moneypunct_byname"
5891                             " failed to construct for " + string(nm));
5892 
5893     lconv* lc = __libcpp_localeconv_l(loc.get());
5894     if (!checked_string_to_char_convert(__decimal_point_,
5895                                         lc->mon_decimal_point,
5896                                         loc.get()))
5897       __decimal_point_ = base::do_decimal_point();
5898     if (!checked_string_to_char_convert(__thousands_sep_,
5899                                         lc->mon_thousands_sep,
5900                                         loc.get()))
5901       __thousands_sep_ = base::do_thousands_sep();
5902     __grouping_ = lc->mon_grouping;
5903     __curr_symbol_ = lc->int_curr_symbol;
5904     if (lc->int_frac_digits != CHAR_MAX)
5905         __frac_digits_ = lc->int_frac_digits;
5906     else
5907         __frac_digits_ = base::do_frac_digits();
5908 #if defined(_LIBCPP_MSVCRT) || defined(__MINGW32__)
5909     if (lc->p_sign_posn == 0)
5910 #else // _LIBCPP_MSVCRT
5911     if (lc->int_p_sign_posn == 0)
5912 #endif // !_LIBCPP_MSVCRT
5913         __positive_sign_ = "()";
5914     else
5915         __positive_sign_ = lc->positive_sign;
5916 #if defined(_LIBCPP_MSVCRT) || defined(__MINGW32__)
5917     if(lc->n_sign_posn == 0)
5918 #else // _LIBCPP_MSVCRT
5919     if (lc->int_n_sign_posn == 0)
5920 #endif // !_LIBCPP_MSVCRT
5921         __negative_sign_ = "()";
5922     else
5923         __negative_sign_ = lc->negative_sign;
5924     // Assume the positive and negative formats will want spaces in
5925     // the same places in curr_symbol since there's no way to
5926     // represent anything else.
5927     string_type __dummy_curr_symbol = __curr_symbol_;
5928 #if defined(_LIBCPP_MSVCRT) || defined(__MINGW32__)
5929     __init_pat(__pos_format_, __dummy_curr_symbol, true,
5930                lc->p_cs_precedes, lc->p_sep_by_space, lc->p_sign_posn, ' ');
5931     __init_pat(__neg_format_, __curr_symbol_, true,
5932                lc->n_cs_precedes, lc->n_sep_by_space, lc->n_sign_posn, ' ');
5933 #else // _LIBCPP_MSVCRT
5934     __init_pat(__pos_format_, __dummy_curr_symbol, true,
5935                lc->int_p_cs_precedes, lc->int_p_sep_by_space,
5936                lc->int_p_sign_posn, ' ');
5937     __init_pat(__neg_format_, __curr_symbol_, true,
5938                lc->int_n_cs_precedes, lc->int_n_sep_by_space,
5939                lc->int_n_sign_posn, ' ');
5940 #endif // !_LIBCPP_MSVCRT
5941 }
5942 
5943 template<>
5944 void
init(const char * nm)5945 moneypunct_byname<wchar_t, false>::init(const char* nm)
5946 {
5947     typedef moneypunct<wchar_t, false> base;
5948     __libcpp_unique_locale loc(nm);
5949     if (!loc)
5950         __throw_runtime_error("moneypunct_byname"
5951                             " failed to construct for " + string(nm));
5952     lconv* lc = __libcpp_localeconv_l(loc.get());
5953     if (!checked_string_to_wchar_convert(__decimal_point_,
5954                                          lc->mon_decimal_point,
5955                                          loc.get()))
5956       __decimal_point_ = base::do_decimal_point();
5957     if (!checked_string_to_wchar_convert(__thousands_sep_,
5958                                          lc->mon_thousands_sep,
5959                                          loc.get()))
5960       __thousands_sep_ = base::do_thousands_sep();
5961     __grouping_ = lc->mon_grouping;
5962     wchar_t wbuf[100];
5963     mbstate_t mb = {0};
5964     const char* bb = lc->currency_symbol;
5965     size_t j = __libcpp_mbsrtowcs_l(wbuf, &bb, countof(wbuf), &mb, loc.get());
5966     if (j == size_t(-1))
5967         __throw_runtime_error("locale not supported");
5968     wchar_t* wbe = wbuf + j;
5969     __curr_symbol_.assign(wbuf, wbe);
5970     if (lc->frac_digits != CHAR_MAX)
5971         __frac_digits_ = lc->frac_digits;
5972     else
5973         __frac_digits_ = base::do_frac_digits();
5974     if (lc->p_sign_posn == 0)
5975         __positive_sign_ = L"()";
5976     else
5977     {
5978         mb = mbstate_t();
5979         bb = lc->positive_sign;
5980         j = __libcpp_mbsrtowcs_l(wbuf, &bb, countof(wbuf), &mb, loc.get());
5981         if (j == size_t(-1))
5982             __throw_runtime_error("locale not supported");
5983         wbe = wbuf + j;
5984         __positive_sign_.assign(wbuf, wbe);
5985     }
5986     if (lc->n_sign_posn == 0)
5987         __negative_sign_ = L"()";
5988     else
5989     {
5990         mb = mbstate_t();
5991         bb = lc->negative_sign;
5992         j = __libcpp_mbsrtowcs_l(wbuf, &bb, countof(wbuf), &mb, loc.get());
5993         if (j == size_t(-1))
5994             __throw_runtime_error("locale not supported");
5995         wbe = wbuf + j;
5996         __negative_sign_.assign(wbuf, wbe);
5997     }
5998     // Assume the positive and negative formats will want spaces in
5999     // the same places in curr_symbol since there's no way to
6000     // represent anything else.
6001     string_type __dummy_curr_symbol = __curr_symbol_;
6002     __init_pat(__pos_format_, __dummy_curr_symbol, false,
6003                lc->p_cs_precedes, lc->p_sep_by_space, lc->p_sign_posn, L' ');
6004     __init_pat(__neg_format_, __curr_symbol_, false,
6005                lc->n_cs_precedes, lc->n_sep_by_space, lc->n_sign_posn, L' ');
6006 }
6007 
6008 template<>
6009 void
init(const char * nm)6010 moneypunct_byname<wchar_t, true>::init(const char* nm)
6011 {
6012     typedef moneypunct<wchar_t, true> base;
6013     __libcpp_unique_locale loc(nm);
6014     if (!loc)
6015         __throw_runtime_error("moneypunct_byname"
6016                             " failed to construct for " + string(nm));
6017 
6018     lconv* lc = __libcpp_localeconv_l(loc.get());
6019     if (!checked_string_to_wchar_convert(__decimal_point_,
6020                                          lc->mon_decimal_point,
6021                                          loc.get()))
6022       __decimal_point_ = base::do_decimal_point();
6023     if (!checked_string_to_wchar_convert(__thousands_sep_,
6024                                          lc->mon_thousands_sep,
6025                                          loc.get()))
6026       __thousands_sep_ = base::do_thousands_sep();
6027     __grouping_ = lc->mon_grouping;
6028     wchar_t wbuf[100];
6029     mbstate_t mb = {0};
6030     const char* bb = lc->int_curr_symbol;
6031     size_t j = __libcpp_mbsrtowcs_l(wbuf, &bb, countof(wbuf), &mb, loc.get());
6032     if (j == size_t(-1))
6033         __throw_runtime_error("locale not supported");
6034     wchar_t* wbe = wbuf + j;
6035     __curr_symbol_.assign(wbuf, wbe);
6036     if (lc->int_frac_digits != CHAR_MAX)
6037         __frac_digits_ = lc->int_frac_digits;
6038     else
6039         __frac_digits_ = base::do_frac_digits();
6040 #if defined(_LIBCPP_MSVCRT) || defined(__MINGW32__)
6041     if (lc->p_sign_posn == 0)
6042 #else // _LIBCPP_MSVCRT
6043     if (lc->int_p_sign_posn == 0)
6044 #endif // !_LIBCPP_MSVCRT
6045         __positive_sign_ = L"()";
6046     else
6047     {
6048         mb = mbstate_t();
6049         bb = lc->positive_sign;
6050         j = __libcpp_mbsrtowcs_l(wbuf, &bb, countof(wbuf), &mb, loc.get());
6051         if (j == size_t(-1))
6052             __throw_runtime_error("locale not supported");
6053         wbe = wbuf + j;
6054         __positive_sign_.assign(wbuf, wbe);
6055     }
6056 #if defined(_LIBCPP_MSVCRT) || defined(__MINGW32__)
6057     if (lc->n_sign_posn == 0)
6058 #else // _LIBCPP_MSVCRT
6059     if (lc->int_n_sign_posn == 0)
6060 #endif // !_LIBCPP_MSVCRT
6061         __negative_sign_ = L"()";
6062     else
6063     {
6064         mb = mbstate_t();
6065         bb = lc->negative_sign;
6066         j = __libcpp_mbsrtowcs_l(wbuf, &bb, countof(wbuf), &mb, loc.get());
6067         if (j == size_t(-1))
6068             __throw_runtime_error("locale not supported");
6069         wbe = wbuf + j;
6070         __negative_sign_.assign(wbuf, wbe);
6071     }
6072     // Assume the positive and negative formats will want spaces in
6073     // the same places in curr_symbol since there's no way to
6074     // represent anything else.
6075     string_type __dummy_curr_symbol = __curr_symbol_;
6076 #if defined(_LIBCPP_MSVCRT) || defined(__MINGW32__)
6077     __init_pat(__pos_format_, __dummy_curr_symbol, true,
6078                lc->p_cs_precedes, lc->p_sep_by_space, lc->p_sign_posn, L' ');
6079     __init_pat(__neg_format_, __curr_symbol_, true,
6080                lc->n_cs_precedes, lc->n_sep_by_space, lc->n_sign_posn, L' ');
6081 #else // _LIBCPP_MSVCRT
6082     __init_pat(__pos_format_, __dummy_curr_symbol, true,
6083                lc->int_p_cs_precedes, lc->int_p_sep_by_space,
6084                lc->int_p_sign_posn, L' ');
6085     __init_pat(__neg_format_, __curr_symbol_, true,
6086                lc->int_n_cs_precedes, lc->int_n_sep_by_space,
6087                lc->int_n_sign_posn, L' ');
6088 #endif // !_LIBCPP_MSVCRT
6089 }
6090 
__do_nothing(void *)6091 void __do_nothing(void*) {}
6092 
__throw_runtime_error(const char * msg)6093 void __throw_runtime_error(const char* msg)
6094 {
6095 #ifndef _LIBCPP_NO_EXCEPTIONS
6096     throw runtime_error(msg);
6097 #else
6098     (void)msg;
6099     _VSTD::abort();
6100 #endif
6101 }
6102 
6103 template class _LIBCPP_CLASS_TEMPLATE_INSTANTIATION_VIS collate<char>;
6104 template class _LIBCPP_CLASS_TEMPLATE_INSTANTIATION_VIS collate<wchar_t>;
6105 
6106 template class _LIBCPP_CLASS_TEMPLATE_INSTANTIATION_VIS num_get<char>;
6107 template class _LIBCPP_CLASS_TEMPLATE_INSTANTIATION_VIS num_get<wchar_t>;
6108 
6109 template struct _LIBCPP_CLASS_TEMPLATE_INSTANTIATION_VIS __num_get<char>;
6110 template struct _LIBCPP_CLASS_TEMPLATE_INSTANTIATION_VIS __num_get<wchar_t>;
6111 
6112 template class _LIBCPP_CLASS_TEMPLATE_INSTANTIATION_VIS num_put<char>;
6113 template class _LIBCPP_CLASS_TEMPLATE_INSTANTIATION_VIS num_put<wchar_t>;
6114 
6115 template struct _LIBCPP_CLASS_TEMPLATE_INSTANTIATION_VIS __num_put<char>;
6116 template struct _LIBCPP_CLASS_TEMPLATE_INSTANTIATION_VIS __num_put<wchar_t>;
6117 
6118 template class _LIBCPP_CLASS_TEMPLATE_INSTANTIATION_VIS time_get<char>;
6119 template class _LIBCPP_CLASS_TEMPLATE_INSTANTIATION_VIS time_get<wchar_t>;
6120 
6121 template class _LIBCPP_CLASS_TEMPLATE_INSTANTIATION_VIS time_get_byname<char>;
6122 template class _LIBCPP_CLASS_TEMPLATE_INSTANTIATION_VIS time_get_byname<wchar_t>;
6123 
6124 template class _LIBCPP_CLASS_TEMPLATE_INSTANTIATION_VIS time_put<char>;
6125 template class _LIBCPP_CLASS_TEMPLATE_INSTANTIATION_VIS time_put<wchar_t>;
6126 
6127 template class _LIBCPP_CLASS_TEMPLATE_INSTANTIATION_VIS time_put_byname<char>;
6128 template class _LIBCPP_CLASS_TEMPLATE_INSTANTIATION_VIS time_put_byname<wchar_t>;
6129 
6130 template class _LIBCPP_CLASS_TEMPLATE_INSTANTIATION_VIS moneypunct<char, false>;
6131 template class _LIBCPP_CLASS_TEMPLATE_INSTANTIATION_VIS moneypunct<char, true>;
6132 template class _LIBCPP_CLASS_TEMPLATE_INSTANTIATION_VIS moneypunct<wchar_t, false>;
6133 template class _LIBCPP_CLASS_TEMPLATE_INSTANTIATION_VIS moneypunct<wchar_t, true>;
6134 
6135 template class _LIBCPP_CLASS_TEMPLATE_INSTANTIATION_VIS moneypunct_byname<char, false>;
6136 template class _LIBCPP_CLASS_TEMPLATE_INSTANTIATION_VIS moneypunct_byname<char, true>;
6137 template class _LIBCPP_CLASS_TEMPLATE_INSTANTIATION_VIS moneypunct_byname<wchar_t, false>;
6138 template class _LIBCPP_CLASS_TEMPLATE_INSTANTIATION_VIS moneypunct_byname<wchar_t, true>;
6139 
6140 template class _LIBCPP_CLASS_TEMPLATE_INSTANTIATION_VIS money_get<char>;
6141 template class _LIBCPP_CLASS_TEMPLATE_INSTANTIATION_VIS money_get<wchar_t>;
6142 
6143 template class _LIBCPP_CLASS_TEMPLATE_INSTANTIATION_VIS __money_get<char>;
6144 template class _LIBCPP_CLASS_TEMPLATE_INSTANTIATION_VIS __money_get<wchar_t>;
6145 
6146 template class _LIBCPP_CLASS_TEMPLATE_INSTANTIATION_VIS money_put<char>;
6147 template class _LIBCPP_CLASS_TEMPLATE_INSTANTIATION_VIS money_put<wchar_t>;
6148 
6149 template class _LIBCPP_CLASS_TEMPLATE_INSTANTIATION_VIS __money_put<char>;
6150 template class _LIBCPP_CLASS_TEMPLATE_INSTANTIATION_VIS __money_put<wchar_t>;
6151 
6152 template class _LIBCPP_CLASS_TEMPLATE_INSTANTIATION_VIS messages<char>;
6153 template class _LIBCPP_CLASS_TEMPLATE_INSTANTIATION_VIS messages<wchar_t>;
6154 
6155 template class _LIBCPP_CLASS_TEMPLATE_INSTANTIATION_VIS messages_byname<char>;
6156 template class _LIBCPP_CLASS_TEMPLATE_INSTANTIATION_VIS messages_byname<wchar_t>;
6157 
6158 template class _LIBCPP_CLASS_TEMPLATE_INSTANTIATION_VIS codecvt_byname<char, char, mbstate_t>;
6159 template class _LIBCPP_CLASS_TEMPLATE_INSTANTIATION_VIS codecvt_byname<wchar_t, char, mbstate_t>;
6160 template class _LIBCPP_CLASS_TEMPLATE_INSTANTIATION_VIS codecvt_byname<char16_t, char, mbstate_t>;
6161 template class _LIBCPP_CLASS_TEMPLATE_INSTANTIATION_VIS codecvt_byname<char32_t, char, mbstate_t>;
6162 
6163 _LIBCPP_END_NAMESPACE_STD
6164