Home | History | Annotate | Download | only in include
      1 // -*- C++ -*-
      2 //===-------------------------- codecvt -----------------------------------===//
      3 //
      4 //                     The LLVM Compiler Infrastructure
      5 //
      6 // This file is dual licensed under the MIT and the University of Illinois Open
      7 // Source Licenses. See LICENSE.TXT for details.
      8 //
      9 //===----------------------------------------------------------------------===//
     10 
     11 #ifndef _LIBCPP_CODECVT
     12 #define _LIBCPP_CODECVT
     13 
     14 /*
     15     codecvt synopsis
     16 
     17 namespace std
     18 {
     19 
     20 enum codecvt_mode
     21 {
     22     consume_header = 4,
     23     generate_header = 2,
     24     little_endian = 1
     25 };
     26 
     27 template <class Elem, unsigned long Maxcode = 0x10ffff,
     28           codecvt_mode Mode = (codecvt_mode)0>
     29 class codecvt_utf8
     30     : public codecvt<Elem, char, mbstate_t>
     31 {
     32     // unspecified
     33 };
     34 
     35 template <class Elem, unsigned long Maxcode = 0x10ffff,
     36           codecvt_mode Mode = (codecvt_mode)0>
     37 class codecvt_utf16
     38     : public codecvt<Elem, char, mbstate_t>
     39 {
     40     // unspecified
     41 };
     42 
     43 template <class Elem, unsigned long Maxcode = 0x10ffff,
     44           codecvt_mode Mode = (codecvt_mode)0>
     45 class codecvt_utf8_utf16
     46     : public codecvt<Elem, char, mbstate_t>
     47 {
     48     // unspecified
     49 };
     50 
     51 }  // std
     52 
     53 */
     54 
     55 #include <__config>
     56 #include <__locale>
     57 
     58 #if !defined(_LIBCPP_HAS_NO_PRAGMA_SYSTEM_HEADER)
     59 #pragma GCC system_header
     60 #endif
     61 
     62 _LIBCPP_BEGIN_NAMESPACE_STD
     63 
     64 enum codecvt_mode
     65 {
     66     consume_header = 4,
     67     generate_header = 2,
     68     little_endian = 1
     69 };
     70 
     71 // codecvt_utf8
     72 
     73 template <class _Elem> class __codecvt_utf8;
     74 
     75 template <>
     76 class __codecvt_utf8<wchar_t>
     77     : public codecvt<wchar_t, char, mbstate_t>
     78 {
     79     unsigned long _Maxcode_;
     80     codecvt_mode _Mode_;
     81 public:
     82     typedef wchar_t   intern_type;
     83     typedef char      extern_type;
     84     typedef mbstate_t state_type;
     85 
     86     _LIBCPP_ALWAYS_INLINE
     87     explicit __codecvt_utf8(size_t __refs, unsigned long _Maxcode,
     88                             codecvt_mode _Mode)
     89         : codecvt<wchar_t, char, mbstate_t>(__refs), _Maxcode_(_Maxcode),
     90           _Mode_(_Mode) {}
     91 protected:
     92     virtual result
     93         do_out(state_type& __st,
     94                const intern_type* __frm, const intern_type* __frm_end, const intern_type*& __frm_nxt,
     95                extern_type* __to, extern_type* __to_end, extern_type*& __to_nxt) const;
     96     virtual result
     97         do_in(state_type& __st,
     98               const extern_type* __frm, const extern_type* __frm_end, const extern_type*& __frm_nxt,
     99               intern_type* __to, intern_type* __to_end, intern_type*& __to_nxt) const;
    100     virtual result
    101         do_unshift(state_type& __st,
    102                    extern_type* __to, extern_type* __to_end, extern_type*& __to_nxt) const;
    103     virtual int do_encoding() const throw();
    104     virtual bool do_always_noconv() const throw();
    105     virtual int do_length(state_type&, const extern_type* __frm, const extern_type* __end,
    106                           size_t __mx) const;
    107     virtual int do_max_length() const throw();
    108 };
    109 
    110 template <>
    111 class __codecvt_utf8<char16_t>
    112     : public codecvt<char16_t, char, mbstate_t>
    113 {
    114     unsigned long _Maxcode_;
    115     codecvt_mode _Mode_;
    116 public:
    117     typedef char16_t  intern_type;
    118     typedef char      extern_type;
    119     typedef mbstate_t state_type;
    120 
    121     _LIBCPP_ALWAYS_INLINE
    122     explicit __codecvt_utf8(size_t __refs, unsigned long _Maxcode,
    123                             codecvt_mode _Mode)
    124         : codecvt<char16_t, char, mbstate_t>(__refs), _Maxcode_(_Maxcode),
    125           _Mode_(_Mode) {}
    126 protected:
    127     virtual result
    128         do_out(state_type& __st,
    129                const intern_type* __frm, const intern_type* __frm_end, const intern_type*& __frm_nxt,
    130                extern_type* __to, extern_type* __to_end, extern_type*& __to_nxt) const;
    131     virtual result
    132         do_in(state_type& __st,
    133               const extern_type* __frm, const extern_type* __frm_end, const extern_type*& __frm_nxt,
    134               intern_type* __to, intern_type* __to_end, intern_type*& __to_nxt) const;
    135     virtual result
    136         do_unshift(state_type& __st,
    137                    extern_type* __to, extern_type* __to_end, extern_type*& __to_nxt) const;
    138     virtual int do_encoding() const throw();
    139     virtual bool do_always_noconv() const throw();
    140     virtual int do_length(state_type&, const extern_type* __frm, const extern_type* __end,
    141                           size_t __mx) const;
    142     virtual int do_max_length() const throw();
    143 };
    144 
    145 template <>
    146 class __codecvt_utf8<char32_t>
    147     : public codecvt<char32_t, char, mbstate_t>
    148 {
    149     unsigned long _Maxcode_;
    150     codecvt_mode _Mode_;
    151 public:
    152     typedef char32_t  intern_type;
    153     typedef char      extern_type;
    154     typedef mbstate_t state_type;
    155 
    156     _LIBCPP_ALWAYS_INLINE
    157     explicit __codecvt_utf8(size_t __refs, unsigned long _Maxcode,
    158                             codecvt_mode _Mode)
    159         : codecvt<char32_t, char, mbstate_t>(__refs), _Maxcode_(_Maxcode),
    160           _Mode_(_Mode) {}
    161 protected:
    162     virtual result
    163         do_out(state_type& __st,
    164                const intern_type* __frm, const intern_type* __frm_end, const intern_type*& __frm_nxt,
    165                extern_type* __to, extern_type* __to_end, extern_type*& __to_nxt) const;
    166     virtual result
    167         do_in(state_type& __st,
    168               const extern_type* __frm, const extern_type* __frm_end, const extern_type*& __frm_nxt,
    169               intern_type* __to, intern_type* __to_end, intern_type*& __to_nxt) const;
    170     virtual result
    171         do_unshift(state_type& __st,
    172                    extern_type* __to, extern_type* __to_end, extern_type*& __to_nxt) const;
    173     virtual int do_encoding() const throw();
    174     virtual bool do_always_noconv() const throw();
    175     virtual int do_length(state_type&, const extern_type* __frm, const extern_type* __end,
    176                           size_t __mx) const;
    177     virtual int do_max_length() const throw();
    178 };
    179 
    180 template <class _Elem, unsigned long _Maxcode = 0x10ffff,
    181           codecvt_mode _Mode = (codecvt_mode)0>
    182 class _LIBCPP_TYPE_VIS codecvt_utf8
    183     : public __codecvt_utf8<_Elem>
    184 {
    185 public:
    186     _LIBCPP_ALWAYS_INLINE
    187     explicit codecvt_utf8(size_t __refs = 0)
    188         : __codecvt_utf8<_Elem>(__refs, _Maxcode, _Mode) {}
    189 
    190     _LIBCPP_ALWAYS_INLINE
    191     ~codecvt_utf8() {}
    192 };
    193 
    194 // codecvt_utf16
    195 
    196 template <class _Elem, bool _LittleEndian> class __codecvt_utf16;
    197 
    198 template <>
    199 class __codecvt_utf16<wchar_t, false>
    200     : public codecvt<wchar_t, char, mbstate_t>
    201 {
    202     unsigned long _Maxcode_;
    203     codecvt_mode _Mode_;
    204 public:
    205     typedef wchar_t   intern_type;
    206     typedef char      extern_type;
    207     typedef mbstate_t state_type;
    208 
    209     _LIBCPP_ALWAYS_INLINE
    210     explicit __codecvt_utf16(size_t __refs, unsigned long _Maxcode,
    211                             codecvt_mode _Mode)
    212         : codecvt<wchar_t, char, mbstate_t>(__refs), _Maxcode_(_Maxcode),
    213           _Mode_(_Mode) {}
    214 protected:
    215     virtual result
    216         do_out(state_type& __st,
    217                const intern_type* __frm, const intern_type* __frm_end, const intern_type*& __frm_nxt,
    218                extern_type* __to, extern_type* __to_end, extern_type*& __to_nxt) const;
    219     virtual result
    220         do_in(state_type& __st,
    221               const extern_type* __frm, const extern_type* __frm_end, const extern_type*& __frm_nxt,
    222               intern_type* __to, intern_type* __to_end, intern_type*& __to_nxt) const;
    223     virtual result
    224         do_unshift(state_type& __st,
    225                    extern_type* __to, extern_type* __to_end, extern_type*& __to_nxt) const;
    226     virtual int do_encoding() const throw();
    227     virtual bool do_always_noconv() const throw();
    228     virtual int do_length(state_type&, const extern_type* __frm, const extern_type* __end,
    229                           size_t __mx) const;
    230     virtual int do_max_length() const throw();
    231 };
    232 
    233 template <>
    234 class __codecvt_utf16<wchar_t, true>
    235     : public codecvt<wchar_t, char, mbstate_t>
    236 {
    237     unsigned long _Maxcode_;
    238     codecvt_mode _Mode_;
    239 public:
    240     typedef wchar_t   intern_type;
    241     typedef char      extern_type;
    242     typedef mbstate_t state_type;
    243 
    244     _LIBCPP_ALWAYS_INLINE
    245     explicit __codecvt_utf16(size_t __refs, unsigned long _Maxcode,
    246                             codecvt_mode _Mode)
    247         : codecvt<wchar_t, char, mbstate_t>(__refs), _Maxcode_(_Maxcode),
    248           _Mode_(_Mode) {}
    249 protected:
    250     virtual result
    251         do_out(state_type& __st,
    252                const intern_type* __frm, const intern_type* __frm_end, const intern_type*& __frm_nxt,
    253                extern_type* __to, extern_type* __to_end, extern_type*& __to_nxt) const;
    254     virtual result
    255         do_in(state_type& __st,
    256               const extern_type* __frm, const extern_type* __frm_end, const extern_type*& __frm_nxt,
    257               intern_type* __to, intern_type* __to_end, intern_type*& __to_nxt) const;
    258     virtual result
    259         do_unshift(state_type& __st,
    260                    extern_type* __to, extern_type* __to_end, extern_type*& __to_nxt) const;
    261     virtual int do_encoding() const throw();
    262     virtual bool do_always_noconv() const throw();
    263     virtual int do_length(state_type&, const extern_type* __frm, const extern_type* __end,
    264                           size_t __mx) const;
    265     virtual int do_max_length() const throw();
    266 };
    267 
    268 template <>
    269 class __codecvt_utf16<char16_t, false>
    270     : public codecvt<char16_t, char, mbstate_t>
    271 {
    272     unsigned long _Maxcode_;
    273     codecvt_mode _Mode_;
    274 public:
    275     typedef char16_t  intern_type;
    276     typedef char      extern_type;
    277     typedef mbstate_t state_type;
    278 
    279     _LIBCPP_ALWAYS_INLINE
    280     explicit __codecvt_utf16(size_t __refs, unsigned long _Maxcode,
    281                             codecvt_mode _Mode)
    282         : codecvt<char16_t, char, mbstate_t>(__refs), _Maxcode_(_Maxcode),
    283           _Mode_(_Mode) {}
    284 protected:
    285     virtual result
    286         do_out(state_type& __st,
    287                const intern_type* __frm, const intern_type* __frm_end, const intern_type*& __frm_nxt,
    288                extern_type* __to, extern_type* __to_end, extern_type*& __to_nxt) const;
    289     virtual result
    290         do_in(state_type& __st,
    291               const extern_type* __frm, const extern_type* __frm_end, const extern_type*& __frm_nxt,
    292               intern_type* __to, intern_type* __to_end, intern_type*& __to_nxt) const;
    293     virtual result
    294         do_unshift(state_type& __st,
    295                    extern_type* __to, extern_type* __to_end, extern_type*& __to_nxt) const;
    296     virtual int do_encoding() const throw();
    297     virtual bool do_always_noconv() const throw();
    298     virtual int do_length(state_type&, const extern_type* __frm, const extern_type* __end,
    299                           size_t __mx) const;
    300     virtual int do_max_length() const throw();
    301 };
    302 
    303 template <>
    304 class __codecvt_utf16<char16_t, true>
    305     : public codecvt<char16_t, char, mbstate_t>
    306 {
    307     unsigned long _Maxcode_;
    308     codecvt_mode _Mode_;
    309 public:
    310     typedef char16_t  intern_type;
    311     typedef char      extern_type;
    312     typedef mbstate_t state_type;
    313 
    314     _LIBCPP_ALWAYS_INLINE
    315     explicit __codecvt_utf16(size_t __refs, unsigned long _Maxcode,
    316                             codecvt_mode _Mode)
    317         : codecvt<char16_t, char, mbstate_t>(__refs), _Maxcode_(_Maxcode),
    318           _Mode_(_Mode) {}
    319 protected:
    320     virtual result
    321         do_out(state_type& __st,
    322                const intern_type* __frm, const intern_type* __frm_end, const intern_type*& __frm_nxt,
    323                extern_type* __to, extern_type* __to_end, extern_type*& __to_nxt) const;
    324     virtual result
    325         do_in(state_type& __st,
    326               const extern_type* __frm, const extern_type* __frm_end, const extern_type*& __frm_nxt,
    327               intern_type* __to, intern_type* __to_end, intern_type*& __to_nxt) const;
    328     virtual result
    329         do_unshift(state_type& __st,
    330                    extern_type* __to, extern_type* __to_end, extern_type*& __to_nxt) const;
    331     virtual int do_encoding() const throw();
    332     virtual bool do_always_noconv() const throw();
    333     virtual int do_length(state_type&, const extern_type* __frm, const extern_type* __end,
    334                           size_t __mx) const;
    335     virtual int do_max_length() const throw();
    336 };
    337 
    338 template <>
    339 class __codecvt_utf16<char32_t, false>
    340     : public codecvt<char32_t, char, mbstate_t>
    341 {
    342     unsigned long _Maxcode_;
    343     codecvt_mode _Mode_;
    344 public:
    345     typedef char32_t  intern_type;
    346     typedef char      extern_type;
    347     typedef mbstate_t state_type;
    348 
    349     _LIBCPP_ALWAYS_INLINE
    350     explicit __codecvt_utf16(size_t __refs, unsigned long _Maxcode,
    351                             codecvt_mode _Mode)
    352         : codecvt<char32_t, char, mbstate_t>(__refs), _Maxcode_(_Maxcode),
    353           _Mode_(_Mode) {}
    354 protected:
    355     virtual result
    356         do_out(state_type& __st,
    357                const intern_type* __frm, const intern_type* __frm_end, const intern_type*& __frm_nxt,
    358                extern_type* __to, extern_type* __to_end, extern_type*& __to_nxt) const;
    359     virtual result
    360         do_in(state_type& __st,
    361               const extern_type* __frm, const extern_type* __frm_end, const extern_type*& __frm_nxt,
    362               intern_type* __to, intern_type* __to_end, intern_type*& __to_nxt) const;
    363     virtual result
    364         do_unshift(state_type& __st,
    365                    extern_type* __to, extern_type* __to_end, extern_type*& __to_nxt) const;
    366     virtual int do_encoding() const throw();
    367     virtual bool do_always_noconv() const throw();
    368     virtual int do_length(state_type&, const extern_type* __frm, const extern_type* __end,
    369                           size_t __mx) const;
    370     virtual int do_max_length() const throw();
    371 };
    372 
    373 template <>
    374 class __codecvt_utf16<char32_t, true>
    375     : public codecvt<char32_t, char, mbstate_t>
    376 {
    377     unsigned long _Maxcode_;
    378     codecvt_mode _Mode_;
    379 public:
    380     typedef char32_t  intern_type;
    381     typedef char      extern_type;
    382     typedef mbstate_t state_type;
    383 
    384     _LIBCPP_ALWAYS_INLINE
    385     explicit __codecvt_utf16(size_t __refs, unsigned long _Maxcode,
    386                             codecvt_mode _Mode)
    387         : codecvt<char32_t, char, mbstate_t>(__refs), _Maxcode_(_Maxcode),
    388           _Mode_(_Mode) {}
    389 protected:
    390     virtual result
    391         do_out(state_type& __st,
    392                const intern_type* __frm, const intern_type* __frm_end, const intern_type*& __frm_nxt,
    393                extern_type* __to, extern_type* __to_end, extern_type*& __to_nxt) const;
    394     virtual result
    395         do_in(state_type& __st,
    396               const extern_type* __frm, const extern_type* __frm_end, const extern_type*& __frm_nxt,
    397               intern_type* __to, intern_type* __to_end, intern_type*& __to_nxt) const;
    398     virtual result
    399         do_unshift(state_type& __st,
    400                    extern_type* __to, extern_type* __to_end, extern_type*& __to_nxt) const;
    401     virtual int do_encoding() const throw();
    402     virtual bool do_always_noconv() const throw();
    403     virtual int do_length(state_type&, const extern_type* __frm, const extern_type* __end,
    404                           size_t __mx) const;
    405     virtual int do_max_length() const throw();
    406 };
    407 
    408 template <class _Elem, unsigned long _Maxcode = 0x10ffff,
    409           codecvt_mode _Mode = (codecvt_mode)0>
    410 class _LIBCPP_TYPE_VIS codecvt_utf16
    411     : public __codecvt_utf16<_Elem, _Mode & little_endian>
    412 {
    413 public:
    414     _LIBCPP_ALWAYS_INLINE
    415     explicit codecvt_utf16(size_t __refs = 0)
    416         : __codecvt_utf16<_Elem, _Mode & little_endian>(__refs, _Maxcode, _Mode) {}
    417 
    418     _LIBCPP_ALWAYS_INLINE
    419     ~codecvt_utf16() {}
    420 };
    421 
    422 // codecvt_utf8_utf16
    423 
    424 template <class _Elem> class __codecvt_utf8_utf16;
    425 
    426 template <>
    427 class __codecvt_utf8_utf16<wchar_t>
    428     : public codecvt<wchar_t, char, mbstate_t>
    429 {
    430     unsigned long _Maxcode_;
    431     codecvt_mode _Mode_;
    432 public:
    433     typedef wchar_t   intern_type;
    434     typedef char      extern_type;
    435     typedef mbstate_t state_type;
    436 
    437     _LIBCPP_ALWAYS_INLINE
    438     explicit __codecvt_utf8_utf16(size_t __refs, unsigned long _Maxcode,
    439                             codecvt_mode _Mode)
    440         : codecvt<wchar_t, char, mbstate_t>(__refs), _Maxcode_(_Maxcode),
    441           _Mode_(_Mode) {}
    442 protected:
    443     virtual result
    444         do_out(state_type& __st,
    445                const intern_type* __frm, const intern_type* __frm_end, const intern_type*& __frm_nxt,
    446                extern_type* __to, extern_type* __to_end, extern_type*& __to_nxt) const;
    447     virtual result
    448         do_in(state_type& __st,
    449               const extern_type* __frm, const extern_type* __frm_end, const extern_type*& __frm_nxt,
    450               intern_type* __to, intern_type* __to_end, intern_type*& __to_nxt) const;
    451     virtual result
    452         do_unshift(state_type& __st,
    453                    extern_type* __to, extern_type* __to_end, extern_type*& __to_nxt) const;
    454     virtual int do_encoding() const throw();
    455     virtual bool do_always_noconv() const throw();
    456     virtual int do_length(state_type&, const extern_type* __frm, const extern_type* __end,
    457                           size_t __mx) const;
    458     virtual int do_max_length() const throw();
    459 };
    460 
    461 template <>
    462 class __codecvt_utf8_utf16<char32_t>
    463     : public codecvt<char32_t, char, mbstate_t>
    464 {
    465     unsigned long _Maxcode_;
    466     codecvt_mode _Mode_;
    467 public:
    468     typedef char32_t  intern_type;
    469     typedef char      extern_type;
    470     typedef mbstate_t state_type;
    471 
    472     _LIBCPP_ALWAYS_INLINE
    473     explicit __codecvt_utf8_utf16(size_t __refs, unsigned long _Maxcode,
    474                             codecvt_mode _Mode)
    475         : codecvt<char32_t, char, mbstate_t>(__refs), _Maxcode_(_Maxcode),
    476           _Mode_(_Mode) {}
    477 protected:
    478     virtual result
    479         do_out(state_type& __st,
    480                const intern_type* __frm, const intern_type* __frm_end, const intern_type*& __frm_nxt,
    481                extern_type* __to, extern_type* __to_end, extern_type*& __to_nxt) const;
    482     virtual result
    483         do_in(state_type& __st,
    484               const extern_type* __frm, const extern_type* __frm_end, const extern_type*& __frm_nxt,
    485               intern_type* __to, intern_type* __to_end, intern_type*& __to_nxt) const;
    486     virtual result
    487         do_unshift(state_type& __st,
    488                    extern_type* __to, extern_type* __to_end, extern_type*& __to_nxt) const;
    489     virtual int do_encoding() const throw();
    490     virtual bool do_always_noconv() const throw();
    491     virtual int do_length(state_type&, const extern_type* __frm, const extern_type* __end,
    492                           size_t __mx) const;
    493     virtual int do_max_length() const throw();
    494 };
    495 
    496 template <>
    497 class __codecvt_utf8_utf16<char16_t>
    498     : public codecvt<char16_t, char, mbstate_t>
    499 {
    500     unsigned long _Maxcode_;
    501     codecvt_mode _Mode_;
    502 public:
    503     typedef char16_t  intern_type;
    504     typedef char      extern_type;
    505     typedef mbstate_t state_type;
    506 
    507     _LIBCPP_ALWAYS_INLINE
    508     explicit __codecvt_utf8_utf16(size_t __refs, unsigned long _Maxcode,
    509                             codecvt_mode _Mode)
    510         : codecvt<char16_t, char, mbstate_t>(__refs), _Maxcode_(_Maxcode),
    511           _Mode_(_Mode) {}
    512 protected:
    513     virtual result
    514         do_out(state_type& __st,
    515                const intern_type* __frm, const intern_type* __frm_end, const intern_type*& __frm_nxt,
    516                extern_type* __to, extern_type* __to_end, extern_type*& __to_nxt) const;
    517     virtual result
    518         do_in(state_type& __st,
    519               const extern_type* __frm, const extern_type* __frm_end, const extern_type*& __frm_nxt,
    520               intern_type* __to, intern_type* __to_end, intern_type*& __to_nxt) const;
    521     virtual result
    522         do_unshift(state_type& __st,
    523                    extern_type* __to, extern_type* __to_end, extern_type*& __to_nxt) const;
    524     virtual int do_encoding() const throw();
    525     virtual bool do_always_noconv() const throw();
    526     virtual int do_length(state_type&, const extern_type* __frm, const extern_type* __end,
    527                           size_t __mx) const;
    528     virtual int do_max_length() const throw();
    529 };
    530 
    531 template <class _Elem, unsigned long _Maxcode = 0x10ffff,
    532           codecvt_mode _Mode = (codecvt_mode)0>
    533 class _LIBCPP_TYPE_VIS codecvt_utf8_utf16
    534     : public __codecvt_utf8_utf16<_Elem>
    535 {
    536 public:
    537     _LIBCPP_ALWAYS_INLINE
    538     explicit codecvt_utf8_utf16(size_t __refs = 0)
    539         : __codecvt_utf8_utf16<_Elem>(__refs, _Maxcode, _Mode) {}
    540 
    541     _LIBCPP_ALWAYS_INLINE
    542     ~codecvt_utf8_utf16() {}
    543 };
    544 
    545 _LIBCPP_END_NAMESPACE_STD
    546 
    547 #endif  // _LIBCPP_CODECVT
    548