STL/stl/inc/xlocale

3367 строки
126 KiB
C++

// xlocale internal header
// Copyright (c) Microsoft Corporation.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
#ifndef _XLOCALE_
#define _XLOCALE_
#include <yvals_core.h>
#if _STL_COMPILER_PREPROCESSOR
#include <climits>
#include <cstring>
#include <memory>
#include <typeinfo>
#include <xfacet>
#include <xlocinfo>
#pragma pack(push, _CRT_PACKING)
#pragma warning(push, _STL_WARNING_LEVEL)
#pragma warning(disable : _STL_DISABLED_WARNINGS)
_STL_DISABLE_CLANG_WARNINGS
#pragma push_macro("new")
#undef new
_STD_BEGIN
template <class _Dummy>
class _Locbase {}; // TRANSITION, ABI, affects sizeof(locale)
_EXPORT_STD template <class _Elem>
class collate;
extern "C++" struct _CRTIMP2_PURE_IMPORT _Crt_new_delete { // base class for marking allocations as CRT blocks
#ifdef _DEBUG
void* __CLRCALL_OR_CDECL operator new(size_t _Size) { // replace operator new
void* _Ptr = operator new(_Size, nothrow);
if (!_Ptr) {
_Xbad_alloc();
}
return _Ptr;
}
void* __CLRCALL_OR_CDECL operator new(size_t _Size, const nothrow_t&) noexcept { // replace nothrow operator new
return _malloc_dbg(_Size > 0 ? _Size : 1, _CRT_BLOCK, __FILE__, __LINE__);
}
void __CLRCALL_OR_CDECL operator delete(void* _Ptr) noexcept { // replace operator delete
_CSTD free(_Ptr);
}
void __CLRCALL_OR_CDECL operator delete(void* _Ptr, const nothrow_t&) noexcept { // replace nothrow operator delete
operator delete(_Ptr);
}
void* __CLRCALL_OR_CDECL operator new(size_t, void* _Ptr) noexcept { // imitate True Placement New
return _Ptr;
}
void __CLRCALL_OR_CDECL operator delete(void*, void*) noexcept {} // imitate True Placement Delete
#endif // _DEBUG
};
_EXPORT_STD extern "C++" class locale : public _Locbase<int>, public _Crt_new_delete {
public:
using category = int;
static constexpr category collate = _M_COLLATE;
static constexpr category ctype = _M_CTYPE;
static constexpr category monetary = _M_MONETARY;
static constexpr category numeric = _M_NUMERIC;
static constexpr category time = _M_TIME;
static constexpr category messages = _M_MESSAGES;
static constexpr category all = _M_ALL;
static constexpr category none = 0;
class _CRTIMP2_PURE_IMPORT id { // identifier stamp, unique for each distinct kind of facet
public:
#ifdef _CRTBLD // TRANSITION, ABI: preserved for binary compatibility
__CLR_OR_THIS_CALL id(size_t _Val = 0) : _Id(_Val) {}
#else // ^^^ defined(_CRTBLD) / !defined(_CRTBLD) vvv
template <int = 0> // TRANSITION, ABI
id() noexcept /* strengthened */ {}
#endif // ^^^ !defined(_CRTBLD) ^^^
id(const id&) = delete;
id& operator=(const id&) = delete;
template <int = 0> // TRANSITION, ABI
size_t _Get_index() { // get stamp, with lazy allocation
if (_Id == 0) { // still zero, allocate stamp
_BEGIN_LOCK(_LOCK_LOCALE)
if (_Id == 0) {
_Id = static_cast<size_t>(++_Id_cnt);
}
_END_LOCK()
}
return _Id;
}
#ifdef _CRTBLD // TRANSITION, ABI: preserved for binary compatibility
__CLR_OR_THIS_CALL operator size_t() {
return _Get_index();
}
#endif // defined(_CRTBLD)
private:
size_t _Id = 0; // the identifier stamp
__PURE_APPDOMAIN_GLOBAL static int _Id_cnt;
};
struct _Facet_guard;
class _CRTIMP2_PURE_IMPORT facet : public _Facet_base, public _Crt_new_delete {
// base class for all locale facets, performs reference counting
private:
friend _Facet_guard;
public:
static size_t __CLRCALL_OR_CDECL _Getcat(const facet** = nullptr, const locale* = nullptr) {
// get category value, or -1 if no corresponding C category
return static_cast<size_t>(-1);
}
void __CLR_OR_THIS_CALL _Incref() noexcept override { // increment use count
_MT_INCR(_Myrefs);
}
_Facet_base* __CLR_OR_THIS_CALL _Decref() noexcept override { // decrement use count
if (_MT_DECR(_Myrefs) == 0) {
return this;
}
return nullptr;
}
private:
_Atomic_counter_t _Myrefs; // the reference count
protected:
explicit __CLR_OR_THIS_CALL facet(size_t _Initrefs = 0) noexcept // strengthened
: _Myrefs(static_cast<_Atomic_counter_t>(_Initrefs)) // non-atomic initialization
{}
__CLR_OR_THIS_CALL ~facet() noexcept override {}
public:
__CLR_OR_THIS_CALL facet(const facet&) = delete;
facet& __CLR_OR_THIS_CALL operator=(const facet&) = delete;
};
struct _NODISCARD _Facet_guard {
facet* _Target;
~_Facet_guard() {
if (_Target) {
delete _Target->_Decref();
}
}
};
class _CRTIMP2_PURE_IMPORT _Locimp : public facet { // reference-counted actual implementation of a locale
protected:
__CLR_OR_THIS_CALL ~_Locimp() noexcept {
_Locimp_dtor(this);
}
private:
static _Locimp* __CLRCALL_PURE_OR_CDECL _New_Locimp(bool _Transparent = false);
static _Locimp* __CLRCALL_PURE_OR_CDECL _New_Locimp(const _Locimp& _Right);
static void __CLRCALL_PURE_OR_CDECL _Locimp_dtor(_Locimp*);
static void __CLRCALL_PURE_OR_CDECL _Locimp_Addfac(_Locimp*, facet*, size_t); // add a facet
static void __CLRCALL_PURE_OR_CDECL _Locimp_ctor(_Locimp*, const _Locimp&);
friend locale;
__CLR_OR_THIS_CALL _Locimp(bool _Transparent)
: locale::facet(1), _Facetvec(nullptr), _Facetcount(0), _Catmask(none), _Xparent(_Transparent), _Name("*") {
}
__CLR_OR_THIS_CALL _Locimp(const _Locimp& _Right)
: locale::facet(1), _Facetvec(nullptr), _Facetcount(_Right._Facetcount), _Catmask(_Right._Catmask),
_Xparent(_Right._Xparent), _Name(_Right._Name.c_str()) {
_Locimp_ctor(this, _Right);
}
void __CLR_OR_THIS_CALL _Addfac(facet* _Pfacet, size_t _Id) { // add a facet
_Locimp_Addfac(this, _Pfacet, _Id);
}
static _Locimp* __CLRCALL_OR_CDECL _Makeloc(
const _Locinfo&, category, _Locimp*, const locale*); // make essential facets
static void __CLRCALL_OR_CDECL _Makewloc(
const _Locinfo&, category, _Locimp*, const locale*); // make wchar_t facets
#if defined(_NATIVE_WCHAR_T_DEFINED) && !_ENFORCE_FACET_SPECIALIZATIONS
static void __CLRCALL_OR_CDECL _Makeushloc(
const _Locinfo&, category, _Locimp*, const locale*); // make ushort facets
#endif // defined(_NATIVE_WCHAR_T_DEFINED) && !_ENFORCE_FACET_SPECIALIZATIONS
static void __CLRCALL_OR_CDECL _Makexloc(
const _Locinfo&, category, _Locimp*, const locale*); // make remaining facets
facet** _Facetvec; // pointer to vector of facets
size_t _Facetcount; // size of vector of facets
category _Catmask; // mask describing implemented categories
bool _Xparent; // true if locale is transparent
_Yarn<char> _Name; // locale name, or "*" if not known
__PURE_APPDOMAIN_GLOBAL static _Locimp* _Clocptr;
public:
_Locimp& __CLR_OR_THIS_CALL operator=(const _Locimp&) = delete;
};
template <class _Elem, class _Traits, class _Alloc>
bool operator()(
const basic_string<_Elem, _Traits, _Alloc>& _Left, const basic_string<_Elem, _Traits, _Alloc>& _Right) const {
// compare _Left and _Right strings using collate facet in locale
const auto& _Coll_fac = _STD use_facet<_STD collate<_Elem>>(*this);
const _Elem* const _Left_data = _Left.data();
const _Elem* const _Right_data = _Right.data();
return _Coll_fac.compare(_Left_data, _Left_data + _Left.size(), _Right_data, _Right_data + _Right.size()) < 0;
}
template <class _Facet>
locale combine(const locale& _Loc) const { // combine two locales
_Facet* _Facptr;
_TRY_BEGIN
_Facptr = const_cast<_Facet*>(_STD addressof(_STD use_facet<_Facet>(_Loc)));
_CATCH_ALL
_Xruntime_error("locale::combine facet missing");
_CATCH_END
_Locimp* _Newimp = _Locimp::_New_Locimp(*_Ptr);
_Newimp->_Addfac(_Facptr, _Facet::id._Get_index());
_Newimp->_Catmask = none;
_Newimp->_Name = "*";
return locale{_Secret_locale_construct_tag{}, _Newimp};
}
template <class _Facet>
locale(const locale& _Loc, const _Facet* _Facptr) : _Ptr(_Locimp::_New_Locimp(*_Loc._Ptr)) {
if (_Facptr) { // replace facet
_Ptr->_Addfac(const_cast<_Facet*>(_Facptr), _Facet::id._Get_index());
_Ptr->_Catmask = none;
_Ptr->_Name = "*";
}
}
#pragma warning(push)
#pragma warning(disable : 26495) // Variable 'std::locale::_Ptr' is uninitialized.
// Always initialize a member variable (type.6).
// We must not explicitly initialize _Ptr here; we rely on it maintaining the value
// previously created in its storage. To be precise:
// In locale0.cpp, locale::_Init() uses True Placement New at classic_locale's address,
// and classic_locale is constructed from the _Noinit enumerator of type _Uninitialized.
// The sequencing is highly unusual; the True Placement New happens before the _Uninitialized construction,
// so while _Ptr here formally has indeterminate value, we expect it to actually keep the previous value.
locale(_Uninitialized) {} // defer construction
#pragma warning(pop)
locale(const locale& _Right) noexcept : _Ptr(_Right._Ptr) {
_Ptr->_Incref();
}
locale() noexcept : _Ptr(_Init(true)) {}
#if !defined(MRTDLL) || !defined(_CRTBLD)
locale(const locale& _Loc, const locale& _Other, category _Cat) : _Ptr(_Locimp::_New_Locimp(*_Loc._Ptr)) {
// construct a locale by copying named facets
if (_Cat != none) { // worth adding, do it
_STL_ASSERT((_Cat & all) == _Cat, "the bitmask value specifying category must be valid");
_Facet_guard _Guard{_Ptr};
_BEGIN_LOCINFO(_Lobj)
_Locimp::_Makeloc(_Lobj, _Cat, _Ptr, &_Other);
_Lobj._Addcats(_Loc._Ptr->_Catmask, _Loc.name().c_str());
_Lobj._Addcats(_Other._Ptr->_Catmask, _Other.name().c_str());
_Ptr->_Catmask = _Loc._Ptr->_Catmask | _Other._Ptr->_Catmask;
_Ptr->_Name = _Lobj._Getname();
_END_LOCINFO()
_Guard._Target = nullptr;
}
}
private:
void _Construct(const string& _Str, category _Cat) {
_STL_ASSERT((_Cat & all) == _Cat, "the bitmask value specifying category must be valid");
// construct a locale with named facets
bool _Bad = false;
_Init();
if (_Cat != none) { // worth adding, do it
_Facet_guard _Guard{_Ptr};
_BEGIN_LOCINFO(_Lobj(_Cat, _Str.c_str()))
if (_Badname(_Lobj)) {
_Bad = true;
} else { // name okay, build the locale
_Locimp::_Makeloc(_Lobj, _Cat, _Ptr, nullptr);
_Ptr->_Catmask = _Cat;
_Ptr->_Name = _Str.c_str();
}
_END_LOCINFO()
_Guard._Target = nullptr;
}
if (_Bad) { // Don't throw within _BEGIN_LOCINFO if we can avoid it
delete _Ptr->_Decref();
_Xruntime_error("bad locale name");
}
}
public:
explicit locale(const char* _Locname, category _Cat = all) : _Ptr(_Locimp::_New_Locimp()) {
// construct a locale with named facets
// _Locname might have been returned from setlocale().
// Therefore, _Construct() takes const string&.
if (_Locname) {
_Construct(_Locname, _Cat);
return;
}
_Xruntime_error("bad locale name");
}
locale(const locale& _Loc, const char* _Locname, category _Cat) : _Ptr(_Locimp::_New_Locimp(*_Loc._Ptr)) {
// construct a locale by copying, replacing named facets
// _Locname might have been returned from setlocale().
// Therefore, _Construct() takes const string&.
if (_Locname) {
_Construct(_Locname, _Cat);
return;
}
_Xruntime_error("bad locale name");
}
explicit locale(const string& _Str, category _Cat = all) : _Ptr(_Locimp::_New_Locimp()) {
// construct a locale with named facets
_Construct(_Str, _Cat);
}
locale(const locale& _Loc, const string& _Str, category _Cat) : _Ptr(_Locimp::_New_Locimp(*_Loc._Ptr)) {
// construct a locale by copying, replacing named facets
_Construct(_Str, _Cat);
}
#endif // !MRTDLL || !_CRTBLD
~locale() noexcept {
if (_Ptr) {
delete _Ptr->_Decref();
}
}
const locale& operator=(const locale& _Right) noexcept {
if (_Ptr != _Right._Ptr) { // different implementation, point at new one
delete _Ptr->_Decref();
_Ptr = _Right._Ptr;
_Ptr->_Incref();
}
return *this;
}
string name() const {
return _Ptr ? _Ptr->_Name.c_str() : string{};
}
_Ret_z_ const char* _C_str() const noexcept {
return _Ptr ? _Ptr->_Name.c_str() : "";
}
const facet* _Getfacet(size_t _Id) const { // look up a facet in locale object
const facet* _Facptr = _Id < _Ptr->_Facetcount ? _Ptr->_Facetvec[_Id] : nullptr; // null if id off end
if (_Facptr || !_Ptr->_Xparent) {
return _Facptr; // found facet or not transparent
}
// look in current locale
locale::_Locimp* _Ptr0 = _Getgloballocale();
if (_Id < _Ptr0->_Facetcount) {
return _Ptr0->_Facetvec[_Id]; // get from current locale
}
return nullptr; // no entry in current locale
}
_NODISCARD bool operator==(const locale& _Loc) const noexcept /* strengthened */ { // compare locales for equality
return _Ptr == _Loc._Ptr || (_CSTD strcmp(_C_str(), "*") != 0 && _CSTD strcmp(_C_str(), _Loc._C_str()) == 0);
}
#if !_HAS_CXX20
_NODISCARD bool operator!=(const locale& _Right) const noexcept /* strengthened */ {
return !(*this == _Right);
}
#endif // !_HAS_CXX20
static _MRTIMP2_PURE const locale& __CLRCALL_PURE_OR_CDECL classic(); // classic "C" locale
static _MRTIMP2_PURE locale __CLRCALL_PURE_OR_CDECL global(const locale&); // current locale
static _MRTIMP2_PURE locale __CLRCALL_PURE_OR_CDECL empty(); // empty (transparent) locale
private:
struct _Secret_locale_construct_tag {
explicit _Secret_locale_construct_tag() = default;
};
explicit locale(_Secret_locale_construct_tag, _Locimp* _Ptrimp) : _Ptr(_Ptrimp) {}
static _MRTIMP2_PURE _Locimp* __CLRCALL_PURE_OR_CDECL _Init(bool _Do_incref = false); // initialize locale
static _MRTIMP2_PURE _Locimp* __CLRCALL_PURE_OR_CDECL _Getgloballocale();
static _MRTIMP2_PURE void __CLRCALL_PURE_OR_CDECL _Setgloballocale(void*);
bool _Badname(const _Locinfo& _Lobj) { // test if name is "*"
return _CSTD strcmp(_Lobj._Getname(), "*") == 0;
}
_Locimp* _Ptr; // pointer to locale implementation object
};
template <class _Facet>
struct _Facetptr { // store pointer to lazy facet for use_facet
__PURE_APPDOMAIN_GLOBAL static const locale::facet* _Psave;
};
template <class _Facet>
__PURE_APPDOMAIN_GLOBAL const locale::facet* _Facetptr<_Facet>::_Psave = nullptr;
_EXPORT_STD template <class _Facet>
const _Facet& __CRTDECL use_facet(const locale& _Loc) { // get facet reference from locale
_BEGIN_LOCK(_LOCK_LOCALE) // the thread lock, make get atomic
const locale::facet* _Psave = _Facetptr<_Facet>::_Psave; // static pointer to lazy facet
const size_t _Id = _Facet::id._Get_index();
const locale::facet* _Pf = _Loc._Getfacet(_Id);
if (!_Pf) {
if (_Psave) {
_Pf = _Psave; // lazy facet already allocated
} else if (_Facet::_Getcat(&_Psave, &_Loc) == static_cast<size_t>(-1)) {
#if _HAS_EXCEPTIONS
_Throw_bad_cast(); // lazy disallowed
#else
_CSTD abort(); // lazy disallowed
#endif
} else { // queue up lazy facet for destruction
auto _Pfmod = const_cast<locale::facet*>(_Psave);
unique_ptr<_Facet_base> _Psave_guard(static_cast<_Facet_base*>(_Pfmod));
#if defined(_M_CEE)
_Facet_Register_m(_Pfmod);
#else // ^^^ defined(_M_CEE) / !defined(_M_CEE) vvv
_Facet_Register(_Pfmod);
#endif // ^^^ !defined(_M_CEE) ^^^
_Pfmod->_Incref();
_Facetptr<_Facet>::_Psave = _Psave;
_Pf = _Psave;
(void) _Psave_guard.release();
}
}
return static_cast<const _Facet&>(*_Pf); // should be dynamic_cast
_END_LOCK()
} // end of use_facet body
template <class _Elem>
char __CRTDECL _Maklocbyte(_Elem _Char, const _Locinfo::_Cvtvec&) {
// convert _Elem to char using _Cvtvec
return static_cast<char>(static_cast<unsigned char>(_Char));
}
template <>
inline char __CRTDECL _Maklocbyte(wchar_t _Char, const _Locinfo::_Cvtvec& _Cvt) {
// convert wchar_t to char using _Cvtvec
char _Byte = '\0';
mbstate_t _Mbst1 = {};
_Wcrtomb(&_Byte, _Char, &_Mbst1, &_Cvt);
return _Byte;
}
#if defined(_NATIVE_WCHAR_T_DEFINED) && !_ENFORCE_FACET_SPECIALIZATIONS
template <>
inline char __CRTDECL _Maklocbyte(unsigned short _Char, const _Locinfo::_Cvtvec& _Cvt) {
// convert unsigned short to char using _Cvtvec
char _Byte = '\0';
mbstate_t _Mbst1 = {};
_Wcrtomb(&_Byte, static_cast<wchar_t>(_Char), &_Mbst1, &_Cvt);
return _Byte;
}
#endif // defined(_NATIVE_WCHAR_T_DEFINED) && !_ENFORCE_FACET_SPECIALIZATIONS
template <class _Elem>
_Elem __CRTDECL _Maklocchr(char _Byte, _Elem*, const _Locinfo::_Cvtvec&) {
// convert char to _Elem using _Cvtvec
return static_cast<_Elem>(static_cast<unsigned char>(_Byte));
}
template <>
inline wchar_t __CRTDECL _Maklocchr(char _Byte, wchar_t*, const _Locinfo::_Cvtvec& _Cvt) {
// convert char to wchar_t using _Cvtvec
wchar_t _Wc = L'\0';
mbstate_t _Mbst1 = {};
_Mbrtowc(&_Wc, &_Byte, 1, &_Mbst1, &_Cvt);
return _Wc;
}
#if defined(_NATIVE_WCHAR_T_DEFINED) && !_ENFORCE_FACET_SPECIALIZATIONS
template <>
inline unsigned short __CRTDECL _Maklocchr(char _Byte, unsigned short*, const _Locinfo::_Cvtvec& _Cvt) {
// convert char to unsigned short using _Cvtvec
unsigned short _Wc = 0;
mbstate_t _Mbst1 = {};
_Mbrtowc(reinterpret_cast<wchar_t*>(&_Wc), &_Byte, 1, &_Mbst1, &_Cvt);
return _Wc;
}
#endif // defined(_NATIVE_WCHAR_T_DEFINED) && !_ENFORCE_FACET_SPECIALIZATIONS
template <class _Elem>
_Elem* __CRTDECL _Maklocstr(const char* _Ptr, _Elem*, const _Locinfo::_Cvtvec&) {
// convert C string to _Elem sequence using _Cvtvec
size_t _Count = _CSTD strlen(_Ptr) + 1;
_Elem* _Ptrdest = static_cast<_Elem*>(_calloc_dbg(_Count, sizeof(_Elem), _CRT_BLOCK, __FILE__, __LINE__));
if (!_Ptrdest) {
_Xbad_alloc();
}
for (_Elem* _Ptrnext = _Ptrdest; 0 < _Count; --_Count, ++_Ptrnext, ++_Ptr) {
*_Ptrnext = static_cast<_Elem>(static_cast<unsigned char>(*_Ptr));
}
return _Ptrdest;
}
template <>
inline wchar_t* __CRTDECL _Maklocstr(const char* _Ptr, wchar_t*, const _Locinfo::_Cvtvec& _Cvt) {
// convert C string to wchar_t sequence using _Cvtvec
size_t _Count;
size_t _Count1;
size_t _Wchars;
const char* _Ptr1;
int _Bytes;
wchar_t _Wc;
mbstate_t _Mbst1 = {};
_Count1 = _CSTD strlen(_Ptr) + 1;
for (_Count = _Count1, _Wchars = 0, _Ptr1 = _Ptr; 0 < _Count; _Count -= _Bytes, _Ptr1 += _Bytes, ++_Wchars) {
if ((_Bytes = _Mbrtowc(&_Wc, _Ptr1, _Count, &_Mbst1, &_Cvt)) <= 0) {
break;
}
}
++_Wchars; // count terminating nul
wchar_t* _Ptrdest = static_cast<wchar_t*>(_calloc_dbg(_Wchars, sizeof(wchar_t), _CRT_BLOCK, __FILE__, __LINE__));
if (!_Ptrdest) {
_Xbad_alloc();
}
wchar_t* _Ptrnext = _Ptrdest;
mbstate_t _Mbst2 = {};
for (; 0 < _Wchars; _Count -= _Bytes, _Ptr += _Bytes, --_Wchars, ++_Ptrnext) {
if ((_Bytes = _Mbrtowc(_Ptrnext, _Ptr, _Count1, &_Mbst2, &_Cvt)) <= 0) {
break;
}
}
*_Ptrnext = L'\0';
return _Ptrdest;
}
#if defined(_NATIVE_WCHAR_T_DEFINED) && !_ENFORCE_FACET_SPECIALIZATIONS
template <>
inline unsigned short* __CRTDECL _Maklocstr(const char* _Ptr, unsigned short*, const _Locinfo::_Cvtvec& _Cvt) {
// convert C string to unsigned short sequence using _Cvtvec
size_t _Count;
size_t _Count1;
size_t _Wchars;
const char* _Ptr1;
int _Bytes;
unsigned short _Wc;
mbstate_t _Mbst1 = {};
_Count1 = _CSTD strlen(_Ptr) + 1;
for (_Count = _Count1, _Wchars = 0, _Ptr1 = _Ptr; 0 < _Count; _Count -= _Bytes, _Ptr1 += _Bytes, ++_Wchars) {
if ((_Bytes = _Mbrtowc(reinterpret_cast<wchar_t*>(&_Wc), _Ptr1, _Count, &_Mbst1, &_Cvt)) <= 0) {
break;
}
}
++_Wchars; // count terminating nul
wchar_t* _Ptrdest = static_cast<wchar_t*>(_calloc_dbg(_Wchars, sizeof(wchar_t), _CRT_BLOCK, __FILE__, __LINE__));
if (!_Ptrdest) {
_Xbad_alloc();
}
wchar_t* _Ptrnext = _Ptrdest;
mbstate_t _Mbst2 = {};
for (; 0 < _Wchars; _Count -= _Bytes, _Ptr += _Bytes, --_Wchars, ++_Ptrnext) {
if ((_Bytes = _Mbrtowc(_Ptrnext, _Ptr, _Count1, &_Mbst2, &_Cvt)) <= 0) {
break;
}
}
*_Ptrnext = L'\0';
return reinterpret_cast<unsigned short*>(_Ptrdest);
}
#endif // defined(_NATIVE_WCHAR_T_DEFINED) && !_ENFORCE_FACET_SPECIALIZATIONS
_EXPORT_STD extern "C++" class _CRTIMP2_PURE_IMPORT codecvt_base // base class for codecvt
: public locale::facet // TRANSITION, ABI, shouldn't be derived from locale::facet
{
public:
enum { // constants for different parse states
ok,
partial,
error,
noconv
};
using result = int;
__CLR_OR_THIS_CALL codecvt_base(size_t _Refs = 0) noexcept // strengthened
: locale::facet(_Refs) {}
bool __CLR_OR_THIS_CALL always_noconv() const noexcept {
// return true if conversions never change input (from codecvt)
return do_always_noconv();
}
int __CLR_OR_THIS_CALL max_length() const noexcept {
// return maximum length required for a conversion (from codecvt)
return do_max_length();
}
int __CLR_OR_THIS_CALL encoding() const noexcept {
return do_encoding();
}
__CLR_OR_THIS_CALL ~codecvt_base() noexcept {}
protected:
virtual bool __CLR_OR_THIS_CALL do_always_noconv() const noexcept {
// return true if conversions never change input (from codecvt)
return false;
}
virtual int __CLR_OR_THIS_CALL do_max_length() const noexcept {
// return maximum length required for a conversion (from codecvt)
return 1;
}
virtual int __CLR_OR_THIS_CALL do_encoding() const noexcept {
return 1; // -1 ==> state dependent, 0 ==> varying length
}
};
template <class _Ty>
constexpr bool _Is_one_byte_char_like_v = _Is_any_of_v<remove_cv_t<_Ty>, signed char, unsigned char,
#ifdef __cpp_lib_byte
byte,
#endif // defined(__cpp_lib_byte)
#ifdef __cpp_char8_t
char8_t,
#endif // defined(__cpp_char8_t)
char>;
template <class _Elem, class _Byte>
constexpr bool _Is_codecvt_do_always_noconv_v =
is_same_v<_Byte, _Elem> || (_Is_one_byte_char_like_v<_Byte> && _Is_one_byte_char_like_v<_Elem>);
_EXPORT_STD extern "C++" template <class _Elem, class _Byte, class _Statype>
class codecvt : public codecvt_base { // facet for converting between _Elem and _Byte sequences
public:
// Explicitly specialized below:
// codecvt<wchar_t, char, mbstate_t>
// codecvt<unsigned short, char, mbstate_t> (extension)
// codecvt<char16_t, char, mbstate_t>
// codecvt<char32_t, char, mbstate_t>
// codecvt<char16_t, char8_t, mbstate_t>
// codecvt<char32_t, char8_t, mbstate_t>
static_assert(!_ENFORCE_FACET_SPECIALIZATIONS || is_same_v<codecvt, codecvt<char, char, mbstate_t>>,
_FACET_SPECIALIZATION_MESSAGE);
using intern_type = _Elem;
using extern_type = _Byte;
using state_type = _Statype;
result __CLR_OR_THIS_CALL in(_Statype& _State, const _Byte* _First1, const _Byte* _Last1, const _Byte*& _Mid1,
_Elem* _First2, _Elem* _Last2, _Elem*& _Mid2) const { // convert bytes [_First1, _Last1) to [_First2, _Last2)
return do_in(_State, _First1, _Last1, _Mid1, _First2, _Last2, _Mid2);
}
result __CLR_OR_THIS_CALL out(_Statype& _State, const _Elem* _First1, const _Elem* _Last1, const _Elem*& _Mid1,
_Byte* _First2, _Byte* _Last2, _Byte*& _Mid2) const { // convert [_First1, _Last1) to bytes [_First2, _Last2)
return do_out(_State, _First1, _Last1, _Mid1, _First2, _Last2, _Mid2);
}
result __CLR_OR_THIS_CALL unshift(_Statype& _State, _Byte* _First2, _Byte* _Last2, _Byte*& _Mid2) const {
// generate bytes to return to default shift state
return do_unshift(_State, _First2, _Last2, _Mid2);
}
int __CLR_OR_THIS_CALL length(_Statype& _State, const _Byte* _First1, const _Byte* _Last1, size_t _Count) const {
// return p - _First1, for the largest value p in [_First1, _Last1] such that [_First1, p) successfully
// converts to at most _Count _Elems
return do_length(_State, _First1, _Last1, _Count);
}
__PURE_APPDOMAIN_GLOBAL static locale::id id; // unique facet id
explicit __CLR_OR_THIS_CALL codecvt(size_t _Refs = 0) : codecvt_base(_Refs) {
_Init(_Locinfo());
}
explicit __CLR_OR_THIS_CALL codecvt(const _Locinfo& _Lobj, size_t _Refs = 0) : codecvt_base(_Refs) {
_Init(_Lobj);
}
static size_t __CLRCALL_OR_CDECL _Getcat(const locale::facet** _Ppf = nullptr, const locale* _Ploc = nullptr) {
// return locale category mask and construct standard facet
if (_Ppf && !*_Ppf) {
*_Ppf = new codecvt(_Locinfo(_Ploc->_C_str()));
}
return _X_CTYPE;
}
protected:
__CLR_OR_THIS_CALL ~codecvt() noexcept override {}
void __CLR_OR_THIS_CALL _Init(const _Locinfo&) {} // initialize from _Locinfo object
bool __CLR_OR_THIS_CALL do_always_noconv() const noexcept override {
// return true if conversions never change input (from codecvt)
return _Is_codecvt_do_always_noconv_v<_Elem, _Byte>;
}
virtual result __CLR_OR_THIS_CALL do_in(_Statype&, const _Byte* _First1, const _Byte* _Last1, const _Byte*& _Mid1,
_Elem* _First2, _Elem* _Last2, _Elem*& _Mid2) const { // convert bytes [_First1, _Last1) to [_First2, _Last2)
_Mid1 = _First1;
_Mid2 = _First2;
if constexpr (_Is_codecvt_do_always_noconv_v<_Elem, _Byte>) {
return noconv; // convert nothing
} else {
// types differ, copy one for one
for (; _Mid1 != _Last1; ++_Mid1, ++_Mid2) {
if (_Mid2 == _Last2) {
return partial;
}
*_Mid2 = static_cast<_Elem>(*_Mid1);
}
return ok;
}
}
virtual result __CLR_OR_THIS_CALL do_out(_Statype&, const _Elem* _First1, const _Elem* _Last1, const _Elem*& _Mid1,
_Byte* _First2, _Byte* _Last2, _Byte*& _Mid2) const { // convert [_First1, _Last1) to bytes [_First2, _Last2)
_Mid1 = _First1;
_Mid2 = _First2;
if constexpr (_Is_codecvt_do_always_noconv_v<_Elem, _Byte>) {
return noconv; // convert nothing
} else {
// types differ, copy one for one
for (; _Mid1 != _Last1; ++_Mid1, ++_Mid2) {
if (_Mid2 == _Last2) {
return partial;
}
*_Mid2 = static_cast<_Byte>(*_Mid1);
}
return ok;
}
}
virtual result __CLR_OR_THIS_CALL do_unshift(_Statype&, _Byte* _First2, _Byte*, _Byte*& _Mid2) const {
// generate bytes to return to default shift state
_Mid2 = _First2;
return noconv; // no termination required
}
virtual int __CLR_OR_THIS_CALL do_length(
_Statype&, const _Byte* _First1, const _Byte* _Last1, size_t _Count) const {
// return p - _First1, for the largest value p in [_First1, _Last1] such that [_First1, p) successfully
// converts to at most _Count _Elems
// assumes 1:1 conversion
const auto _Dist = static_cast<size_t>((_STD min)(_Last1 - _First1, ptrdiff_t{INT_MAX}));
return static_cast<int>((_STD min)(_Count, _Dist));
}
};
#ifdef __clang__
#pragma clang diagnostic push
#pragma clang diagnostic ignored "-Wdllimport-static-field-def"
#endif // defined(__clang__)
template <class _Elem, class _Byte, class _Statype>
__PURE_APPDOMAIN_GLOBAL locale::id codecvt<_Elem, _Byte, _Statype>::id;
#ifdef __clang__
#pragma clang diagnostic pop
#endif // defined(__clang__)
template <class _CvtTy, class _Byte, class _Statype>
_NODISCARD int _Codecvt_do_length(
const _CvtTy& _Cvt, _Statype& _State, const _Byte* _First1, const _Byte* _Last1, size_t _Count) {
// return p - _First1, for the largest value p in [_First1, _Last1] such that _Cvt will successfully convert
// [_First1, p) to at most _Count wide characters
_STL_DISABLE_DEPRECATED_WARNING
using _Elem = typename _CvtTy::intern_type;
_STL_RESTORE_DEPRECATED_WARNING
_Adl_verify_range(_First1, _Last1);
const auto _Old_first1 = _First1;
while (_Count > 0 && _First1 != _Last1) { // convert another wide character
const _Byte* _Mid1;
_Elem* _Mid2;
_Elem _Ch;
// test result of single wide-char conversion
_STL_DISABLE_DEPRECATED_WARNING
const auto _Result = _Cvt._CvtTy::do_in(_State, _First1, _Last1, _Mid1, &_Ch, &_Ch + 1, _Mid2);
_STL_RESTORE_DEPRECATED_WARNING
if (_Result != codecvt_base::ok) {
if (_Result == codecvt_base::noconv) {
_First1 += (_STD min)(static_cast<size_t>(_Last1 - _First1), _Count);
}
break; // error, noconv, or partial
}
if (_Mid2 == &_Ch + 1) {
--_Count; // do_in converted an output character
}
_First1 = _Mid1;
}
return static_cast<int>((_STD min)(_First1 - _Old_first1, ptrdiff_t{INT_MAX}));
}
enum _Codecvt_mode { _Consume_header = 4, _Generate_header = 2 };
extern "C++" template <>
class _CRTIMP2_PURE_IMPORT_UNLESS_CODECVT_ID_SATELLITE _CXX20_DEPRECATE_CODECVT_FACETS
codecvt<char16_t, char, mbstate_t> : public codecvt_base {
// facet for converting between char16_t and UTF-8 byte sequences
public:
using intern_type = char16_t;
using extern_type = char;
using state_type = mbstate_t;
result __CLR_OR_THIS_CALL in(mbstate_t& _State, const char* _First1, const char* _Last1, const char*& _Mid1,
char16_t* _First2, char16_t* _Last2, char16_t*& _Mid2) const {
// convert bytes [_First1, _Last1) to [_First2, _Last2)
return do_in(_State, _First1, _Last1, _Mid1, _First2, _Last2, _Mid2);
}
result __CLR_OR_THIS_CALL out(mbstate_t& _State, const char16_t* _First1, const char16_t* _Last1,
const char16_t*& _Mid1, char* _First2, char* _Last2, char*& _Mid2) const {
// convert [_First1, _Last1) to bytes [_First2, _Last2)
return do_out(_State, _First1, _Last1, _Mid1, _First2, _Last2, _Mid2);
}
result __CLR_OR_THIS_CALL unshift(mbstate_t& _State, char* _First2, char* _Last2, char*& _Mid2) const {
// generate bytes to return to default shift state
return do_unshift(_State, _First2, _Last2, _Mid2);
}
int __CLR_OR_THIS_CALL length(mbstate_t& _State, const char* _First1, const char* _Last1, size_t _Count) const {
// return p - _First1, for the largest value p in [_First1, _Last1] such that [_First1, p) successfully
// converts to at most _Count UTF-16 code units
return do_length(_State, _First1, _Last1, _Count);
}
_CRT_SATELLITE_CODECVT_IDS_NOIMPORT static locale::id id;
explicit __CLR_OR_THIS_CALL codecvt(size_t _Refs = 0)
: codecvt_base(_Refs), _Maxcode(0x10ffff), _Mode(_Consume_header) {
_BEGIN_LOCINFO(_Lobj)
_Init(_Lobj);
_END_LOCINFO()
}
explicit __CLR_OR_THIS_CALL codecvt(const _Locinfo& _Lobj, size_t _Refs = 0)
: codecvt_base(_Refs), _Maxcode(0x10ffff), _Mode(_Consume_header) {
_Init(_Lobj);
}
__CLR_OR_THIS_CALL codecvt(
const _Locinfo& _Lobj, unsigned long _Maxcode_arg, _Codecvt_mode _Mode_arg, size_t _Refs = 0)
: codecvt_base(_Refs), _Maxcode(_Maxcode_arg), _Mode(_Mode_arg) {
_Init(_Lobj);
}
static size_t __CLRCALL_OR_CDECL _Getcat(const locale::facet** _Ppf = nullptr, const locale* _Ploc = nullptr) {
// return locale category mask and construct standard facet
if (_Ppf && !*_Ppf) {
_STL_DISABLE_DEPRECATED_WARNING
*_Ppf = new codecvt(_Locinfo(_Ploc->_C_str()));
_STL_RESTORE_DEPRECATED_WARNING
}
return _X_CTYPE;
}
protected:
__CLR_OR_THIS_CALL ~codecvt() noexcept override {}
void __CLR_OR_THIS_CALL _Init(const _Locinfo&) {} // initialize
virtual result __CLR_OR_THIS_CALL do_in(mbstate_t& _State, const char* _First1, const char* _Last1,
const char*& _Mid1, char16_t* _First2, char16_t* _Last2, char16_t*& _Mid2) const {
// convert bytes [_First1, _Last1) to [_First2, _Last2)
unsigned short* _Pstate = reinterpret_cast<unsigned short*>(&_State);
_Mid1 = _First1;
_Mid2 = _First2;
while (_Mid1 != _Last1 && _Mid2 != _Last2) { // convert a multibyte sequence
unsigned char _By = static_cast<unsigned char>(*_Mid1);
unsigned long _Ch;
int _Nextra;
int _Nskip;
if (*_Pstate > 1) {
if (_By < 0x80 || 0xc0 <= _By) {
return codecvt::error; // not continuation byte
}
// deliver second half of two-word value
++_Mid1;
*_Mid2++ = static_cast<char16_t>(*_Pstate | (_By & 0x3f));
*_Pstate = 1;
continue;
}
if (_By < 0x80u) {
_Ch = _By;
_Nextra = 0;
} else if (_By < 0xc0u) { // 0x80-0xbf not first byte
++_Mid1;
return codecvt::error;
} else if (_By < 0xe0u) {
_Ch = static_cast<unsigned long>(_By & 0x1f);
_Nextra = 1;
} else if (_By < 0xf0u) {
_Ch = static_cast<unsigned long>(_By & 0x0f);
_Nextra = 2;
} else if (_By < 0xf8u) {
_Ch = static_cast<unsigned long>(_By & 0x07);
_Nextra = 3;
} else {
_Ch = static_cast<unsigned long>(_By & 0x03);
_Nextra = _By < 0xfc ? 4 : 5;
}
_Nskip = _Nextra < 3 ? 0 : 1; // leave a byte for 2nd word
_First1 = _Mid1; // roll back point
if (_Nextra == 0) {
++_Mid1;
} else if (_Last1 - _Mid1 < _Nextra + 1 - _Nskip) {
break; // not enough input
} else {
for (++_Mid1; _Nskip < _Nextra; --_Nextra, ++_Mid1) {
if ((_By = static_cast<unsigned char>(*_Mid1)) < 0x80u || 0xc0u <= _By) {
return codecvt::error; // not continuation byte
} else {
_Ch = _Ch << 6 | (_By & 0x3f);
}
}
}
if (0 < _Nskip) {
_Ch <<= 6; // get last byte on next call
}
if ((_Maxcode < 0x10ffffu ? _Maxcode : 0x10ffffu) < _Ch) {
return codecvt::error; // value too large
}
if (0xffffu < _Ch) { // deliver first half of two-word value, save second word
unsigned short _Ch0 = static_cast<unsigned short>(0xd800 | (_Ch >> 10) - 0x0040);
*_Mid2++ = static_cast<char16_t>(_Ch0);
*_Pstate = static_cast<unsigned short>(0xdc00 | (_Ch & 0x03ff));
continue;
}
if (_Nskip != 0) {
if (_Mid1 == _Last1) { // not enough bytes, noncanonical value
_Mid1 = _First1;
break;
}
if ((_By = static_cast<unsigned char>(*_Mid1++)) < 0x80u || 0xc0u <= _By) {
return codecvt::error; // not continuation byte
}
_Ch |= _By & 0x3f; // complete noncanonical value
}
if (*_Pstate == 0u) { // first time, maybe look for and consume header
*_Pstate = 1;
if ((_Mode & _Consume_header) != 0 && _Ch == 0xfeffu) { // drop header and retry
const result _Ans = do_in(_State, _Mid1, _Last1, _Mid1, _First2, _Last2, _Mid2);
if (_Ans == codecvt::partial) { // roll back header determination
*_Pstate = 0;
_Mid1 = _First1;
}
return _Ans;
}
}
*_Mid2++ = static_cast<char16_t>(_Ch);
}
return _First1 == _Mid1 ? codecvt::partial : codecvt::ok;
}
virtual result __CLR_OR_THIS_CALL do_out(mbstate_t& _State, const char16_t* _First1, const char16_t* _Last1,
const char16_t*& _Mid1, char* _First2, char* _Last2, char*& _Mid2) const {
// convert [_First1, _Last1) to bytes [_First2, _Last2)
unsigned short* _Pstate = reinterpret_cast<unsigned short*>(&_State);
_Mid1 = _First1;
_Mid2 = _First2;
while (_Mid1 != _Last1 && _Mid2 != _Last2) { // convert and put a wide char
unsigned long _Ch;
const unsigned short _Ch1 = static_cast<unsigned short>(*_Mid1);
bool _Save = false;
if (1 < *_Pstate) { // get saved MS 11 bits from *_Pstate
if (_Ch1 < 0xdc00u || 0xe000u <= _Ch1) {
return codecvt::error; // bad second word
}
_Ch = static_cast<unsigned long>((*_Pstate << 10) | (_Ch1 - 0xdc00));
} else if (0xd800u <= _Ch1 && _Ch1 < 0xdc00u) { // get new first word
_Ch = static_cast<unsigned long>((_Ch1 - 0xd800 + 0x0040) << 10);
_Save = true; // put only first byte, rest with second word
} else {
_Ch = _Ch1; // not first word, just put it
}
char _By;
int _Nextra;
if (_Ch < 0x0080u) {
_By = static_cast<char>(_Ch);
_Nextra = 0;
} else if (_Ch < 0x0800u) {
_By = static_cast<char>(0xc0 | _Ch >> 6);
_Nextra = 1;
} else if (_Ch < 0x10000u) {
_By = static_cast<char>(0xe0 | _Ch >> 12);
_Nextra = 2;
} else {
_By = static_cast<char>(0xf0 | _Ch >> 18);
_Nextra = 3;
}
int _Nput = _Nextra < 3 ? _Nextra + 1 : _Save ? 1 : 3;
if (_Last2 - _Mid2 < _Nput) {
break; // not enough room, even without header
}
if (*_Pstate == 0u && (_Mode & _Generate_header) != 0) {
if (_Last2 - _Mid2 < 3 + _Nput) {
break; // not enough room for header + output
}
// prepend header
*_Mid2++ = '\xef';
*_Mid2++ = '\xbb';
*_Mid2++ = '\xbf';
}
++_Mid1;
if (_Save || _Nextra < 3) { // put first byte of sequence, if not already put
*_Mid2++ = _By;
--_Nput;
}
for (; 0 < _Nput; --_Nput) {
*_Mid2++ = static_cast<char>((_Ch >> 6 * --_Nextra & 0x3f) | 0x80);
}
*_Pstate = static_cast<unsigned short>(_Save ? _Ch >> 10 : 1);
}
return _First1 == _Mid1 ? codecvt::partial : codecvt::ok;
}
virtual result __CLR_OR_THIS_CALL do_unshift(mbstate_t& _State, char* _First2, char*, char*& _Mid2) const {
// generate bytes to return to default shift state
unsigned short* _Pstate = reinterpret_cast<unsigned short*>(&_State);
_Mid2 = _First2;
return 1u < *_Pstate ? codecvt::error : codecvt::ok; // fail if trailing first word
}
friend int _Codecvt_do_length<>(const codecvt&, mbstate_t&, const char*, const char*, size_t);
virtual int __CLR_OR_THIS_CALL do_length(
mbstate_t& _State, const char* _First1, const char* _Last1, size_t _Count) const {
return _Codecvt_do_length(*this, _State, _First1, _Last1, _Count);
}
bool __CLR_OR_THIS_CALL do_always_noconv() const noexcept override {
// return true if conversions never change input
return false;
}
int __CLR_OR_THIS_CALL do_max_length() const noexcept override {
// return maximum length required for a conversion
if ((_Mode & _Consume_header) != 0) {
return 9; // header + max input
}
if ((_Mode & _Generate_header) != 0) {
return 7; // header + max output
}
return 6; // 6-byte max input sequence, no 3-byte header
}
int do_encoding() const noexcept override {
return 0; // 0 => varying length
}
private:
unsigned long _Maxcode; // default: 0x10ffff
_Codecvt_mode _Mode; // default: _Consume_header
};
extern "C++" template <>
class _CRTIMP2_PURE_IMPORT_UNLESS_CODECVT_ID_SATELLITE _CXX20_DEPRECATE_CODECVT_FACETS
codecvt<char32_t, char, mbstate_t> : public codecvt_base {
// facet for converting between char32_t and UTF-8 byte sequences
public:
using intern_type = char32_t;
using extern_type = char;
using state_type = mbstate_t;
result __CLR_OR_THIS_CALL in(mbstate_t& _State, const char* _First1, const char* _Last1, const char*& _Mid1,
char32_t* _First2, char32_t* _Last2, char32_t*& _Mid2) const {
// convert bytes [_First1, _Last1) to [_First2, _Last2)
return do_in(_State, _First1, _Last1, _Mid1, _First2, _Last2, _Mid2);
}
result __CLR_OR_THIS_CALL out(mbstate_t& _State, const char32_t* _First1, const char32_t* _Last1,
const char32_t*& _Mid1, char* _First2, char* _Last2, char*& _Mid2) const {
// convert [_First1, _Last1) to bytes [_First2, _Last2)
return do_out(_State, _First1, _Last1, _Mid1, _First2, _Last2, _Mid2);
}
result __CLR_OR_THIS_CALL unshift(mbstate_t& _State, char* _First2, char* _Last2, char*& _Mid2) const {
// generate bytes to return to default shift state
return do_unshift(_State, _First2, _Last2, _Mid2);
}
int __CLR_OR_THIS_CALL length(mbstate_t& _State, const char* _First1, const char* _Last1, size_t _Count) const {
// return p - _First1, for the largest value p in [_First1, _Last1] such that [_First1, p) successfully
// converts to at most _Count UTF-32 code units
return do_length(_State, _First1, _Last1, _Count);
}
_CRT_SATELLITE_CODECVT_IDS_NOIMPORT static locale::id id;
explicit __CLR_OR_THIS_CALL codecvt(size_t _Refs = 0)
: codecvt_base(_Refs), _Maxcode(0xffffffff), _Mode(_Consume_header) {
_BEGIN_LOCINFO(_Lobj)
_Init(_Lobj);
_END_LOCINFO()
}
explicit __CLR_OR_THIS_CALL codecvt(const _Locinfo& _Lobj, size_t _Refs = 0)
: codecvt_base(_Refs), _Maxcode(0xffffffff), _Mode(_Consume_header) {
_Init(_Lobj);
}
__CLR_OR_THIS_CALL codecvt(
const _Locinfo& _Lobj, unsigned long _Maxcode_arg, _Codecvt_mode _Mode_arg, size_t _Refs = 0)
: codecvt_base(_Refs), _Maxcode(_Maxcode_arg), _Mode(_Mode_arg) {
_Init(_Lobj);
}
static size_t __CLRCALL_OR_CDECL _Getcat(const locale::facet** _Ppf = nullptr, const locale* _Ploc = nullptr) {
// return locale category mask and construct standard facet
if (_Ppf && !*_Ppf) {
_STL_DISABLE_DEPRECATED_WARNING
*_Ppf = new codecvt(_Locinfo(_Ploc->_C_str()));
_STL_RESTORE_DEPRECATED_WARNING
}
return _X_CTYPE;
}
protected:
__CLR_OR_THIS_CALL ~codecvt() noexcept override {}
void __CLR_OR_THIS_CALL _Init(const _Locinfo&) {} // initialize
virtual result __CLR_OR_THIS_CALL do_in(mbstate_t& _State, const char* _First1, const char* _Last1,
const char*& _Mid1, char32_t* _First2, char32_t* _Last2, char32_t*& _Mid2) const {
// convert bytes [_First1, _Last1) to [_First2, _Last2)
char* _Pstate = reinterpret_cast<char*>(&_State);
_Mid1 = _First1;
_Mid2 = _First2;
while (_Mid1 != _Last1 && _Mid2 != _Last2) { // convert a multibyte sequence
unsigned char _By = static_cast<unsigned char>(*_Mid1);
unsigned long _Ch;
int _Nextra;
if (_By < 0x80u) {
_Ch = _By;
_Nextra = 0;
} else if (_By < 0xc0u) { // 0x80-0xbf not first byte
++_Mid1;
return codecvt::error;
} else if (_By < 0xe0u) {
_Ch = static_cast<unsigned long>(_By & 0x1f);
_Nextra = 1;
} else if (_By < 0xf0u) {
_Ch = static_cast<unsigned long>(_By & 0x0f);
_Nextra = 2;
} else if (_By < 0xf8u) {
_Ch = static_cast<unsigned long>(_By & 0x07);
_Nextra = 3;
} else {
_Ch = static_cast<unsigned long>(_By & 0x03);
_Nextra = _By < 0xfc ? 4 : 5;
}
if (_Nextra == 0) {
++_Mid1;
} else if (_Last1 - _Mid1 < _Nextra + 1) {
break; // not enough input
} else {
for (++_Mid1; 0 < _Nextra; --_Nextra, ++_Mid1) {
if ((_By = static_cast<unsigned char>(*_Mid1)) < 0x80u || 0xc0u <= _By) {
return codecvt::error; // not continuation byte
} else {
_Ch = _Ch << 6 | (_By & 0x3f);
}
}
}
if (*_Pstate == 0) { // first time, maybe look for and consume header
*_Pstate = 1;
if ((_Mode & _Consume_header) != 0 && _Ch == 0xfeffu) { // drop header and retry
const result _Ans = do_in(_State, _Mid1, _Last1, _Mid1, _First2, _Last2, _Mid2);
if (_Ans == codecvt::partial) { // roll back header determination
*_Pstate = 0;
_Mid1 = _First1;
}
return _Ans;
}
}
if (_Maxcode < _Ch) {
return codecvt::error; // code too large
}
*_Mid2++ = static_cast<char32_t>(_Ch);
}
return _First1 == _Mid1 ? codecvt::partial : codecvt::ok;
}
virtual result __CLR_OR_THIS_CALL do_out(mbstate_t& _State, const char32_t* _First1, const char32_t* _Last1,
const char32_t*& _Mid1, char* _First2, char* _Last2, char*& _Mid2) const {
// convert [_First1, _Last1) to bytes [_First2, _Last2)
char* _Pstate = reinterpret_cast<char*>(&_State);
_Mid1 = _First1;
_Mid2 = _First2;
while (_Mid1 != _Last1 && _Mid2 != _Last2) { // convert and put a wide char
char _By;
int _Nextra;
unsigned long _Ch = static_cast<unsigned long>(*_Mid1);
if (_Maxcode < _Ch) {
return codecvt::error;
}
if (_Ch < 0x0080u) {
_By = static_cast<char>(_Ch);
_Nextra = 0;
} else if (_Ch < 0x0800u) {
_By = static_cast<char>(0xc0 | _Ch >> 6);
_Nextra = 1;
} else if (_Ch < 0x00010000u) {
_By = static_cast<char>(0xe0 | _Ch >> 12);
_Nextra = 2;
} else if (_Ch < 0x00200000u) {
_By = static_cast<char>(0xf0 | _Ch >> 18);
_Nextra = 3;
} else if (_Ch < 0x04000000u) {
_By = static_cast<char>(0xf8 | _Ch >> 24);
_Nextra = 4;
} else {
_By = static_cast<char>(0xfc | (_Ch >> 30 & 0x03));
_Nextra = 5;
}
if (*_Pstate == 0) { // first time, maybe generate header
*_Pstate = 1;
if ((_Mode & _Generate_header) != 0) {
if (_Last2 - _Mid2 < 3 + 1 + _Nextra) {
return codecvt::partial; // not enough room for both
}
// prepend header
*_Mid2++ = '\xef';
*_Mid2++ = '\xbb';
*_Mid2++ = '\xbf';
}
}
if (_Last2 - _Mid2 < 1 + _Nextra) {
break; // not enough room for output
}
++_Mid1;
for (*_Mid2++ = _By; 0 < _Nextra;) {
*_Mid2++ = static_cast<char>((_Ch >> 6 * --_Nextra & 0x3f) | 0x80);
}
}
return _First1 == _Mid1 ? codecvt::partial : codecvt::ok;
}
virtual result __CLR_OR_THIS_CALL do_unshift(mbstate_t&, char* _First2, char*, char*& _Mid2) const {
// generate bytes to return to default shift state
_Mid2 = _First2;
return codecvt::noconv;
}
friend int _Codecvt_do_length<>(const codecvt&, mbstate_t&, const char*, const char*, size_t);
virtual int __CLR_OR_THIS_CALL do_length(
mbstate_t& _State, const char* _First1, const char* _Last1, size_t _Count) const {
return _Codecvt_do_length(*this, _State, _First1, _Last1, _Count);
}
bool __CLR_OR_THIS_CALL do_always_noconv() const noexcept override {
// return true if conversions never change input
return false;
}
int __CLR_OR_THIS_CALL do_max_length() const noexcept override {
// return maximum length required for a conversion
return (_Mode & (_Consume_header | _Generate_header)) != 0 ? 9 : 6;
}
int __CLR_OR_THIS_CALL do_encoding() const noexcept override {
// return length of code sequence (from codecvt)
return (_Mode & (_Consume_header | _Generate_header)) != 0 ? -1
: 0; // -1 => state dependent, 0 => varying length
}
private:
unsigned long _Maxcode; // default: 0xffffffff
_Codecvt_mode _Mode; // default: _Consume_header
};
#if defined(__cpp_char8_t) && !defined(_M_CEE_PURE)
template <class _From, class _To>
struct _NODISCARD _Codecvt_guard {
const _From* const& _First1;
const _From*& _Mid1;
_To* const& _First2;
_To*& _Mid2;
_Codecvt_guard(const _From* const& _First1_, const _From*& _Mid1_, _To* const& _First2_, _To*& _Mid2_)
: _First1{_First1_}, _Mid1{_Mid1_}, _First2{_First2_}, _Mid2{_Mid2_} {}
_Codecvt_guard(const _Codecvt_guard&) = delete;
_Codecvt_guard& operator=(const _Codecvt_guard&) = delete;
~_Codecvt_guard() {
_Mid1 = _First1;
_Mid2 = _First2;
}
};
extern "C++" template <>
class _CXX20_DEPRECATE_CODECVT_CHAR8_T_FACETS codecvt<char16_t, char8_t, mbstate_t> : public codecvt_base {
// facet for converting between UTF-16 and UTF-8 sequences
public:
using intern_type = char16_t;
using extern_type = char8_t;
using state_type = mbstate_t;
result in(mbstate_t& _State, const char8_t* _First1, const char8_t* _Last1, const char8_t*& _Mid1,
char16_t* _First2, char16_t* _Last2, char16_t*& _Mid2) const {
// convert UTF-8 [_First1, _Last1) to UTF-16 [_First2, _Last2)
return do_in(_State, _First1, _Last1, _Mid1, _First2, _Last2, _Mid2);
}
result out(mbstate_t& _State, const char16_t* _First1, const char16_t* _Last1, const char16_t*& _Mid1,
char8_t* _First2, char8_t* _Last2, char8_t*& _Mid2) const {
// convert UTF-16 [_First1, _Last1) to UTF-8 [_First2, _Last2)
return do_out(_State, _First1, _Last1, _Mid1, _First2, _Last2, _Mid2);
}
result unshift(mbstate_t& _State, char8_t* _First2, char8_t* _Last2, char8_t*& _Mid2) const {
// generate bytes to return to default shift state
return do_unshift(_State, _First2, _Last2, _Mid2);
}
int length(mbstate_t& _State, const char8_t* _First1, const char8_t* _Last1, size_t _Count) const {
// return p - _First1, for the largest value p in [_First1, _Last1] such that [_First1, p) successfully
// converts to at most _Count UTF-16 code units
return do_length(_State, _First1, _Last1, _Count);
}
_CRT_SATELLITE_CODECVT_IDS static locale::id id;
explicit codecvt(size_t _Refs = 0) : codecvt_base(_Refs) {} // construct "from current locale"
explicit codecvt(const _Locinfo&, size_t _Refs = 0) : codecvt_base(_Refs) {} // construct "from specified locale"
static size_t _Getcat(const locale::facet** _Ppf = nullptr, const locale* = nullptr) {
// return locale category mask and construct standard facet
if (_Ppf && !*_Ppf) {
*_Ppf = new codecvt;
}
return _X_CTYPE;
}
protected:
__CLR_OR_THIS_CALL ~codecvt() noexcept override = default;
virtual result __CLR_OR_THIS_CALL do_in(mbstate_t&, const char8_t* _First1, const char8_t* _Last1,
const char8_t*& _Mid1, char16_t* _First2, char16_t* _Last2, char16_t*& _Mid2) const {
// convert UTF-8 [_First1, _Last1) to UTF-16 [_First2, _Last2)
_Adl_verify_range(_First1, _Last1);
_Adl_verify_range(_First2, _Last2);
_Codecvt_guard<char8_t, char16_t> _Guard{_First1, _Mid1, _First2, _Mid2};
for (; _First1 != _Last1; ++_First1, ++_First2) {
if (_First2 == _Last2) {
return partial;
}
char8_t _Lead_byte = *_First1;
if (_Lead_byte < 0b1000'0000u) { // single-byte sequence
*_First2 = static_cast<char16_t>(_Lead_byte);
continue;
}
int _Trailing_count = 1;
if (_Lead_byte < 0b1110'0000u) {
if (_Lead_byte < 0b1100'0000u) { // out-of-sequence trailing byte
return error;
}
// lead byte of 2-byte sequence
_Lead_byte &= 0b0001'1111u;
} else if (_Lead_byte < 0b1111'0000u) { // lead byte of 3-byte sequence
_Lead_byte &= 0b0000'1111u;
_Trailing_count = 2;
} else if (_Lead_byte < 0b1111'1000u) { // lead byte of 4-byte sequence
if (_Last2 - _First2 < 2) { // not enough output for a surrogate pair
return partial;
}
_Lead_byte &= 0b0000'0111u;
_Trailing_count = 3;
} else { // Invalid UTF-8 code unit
return error;
}
if (_Last1 - _First1 < _Trailing_count + 1) { // not enough input
return partial;
}
const char8_t* _Peek = _First1;
char32_t _Code_point = _Lead_byte;
do {
const char8_t _By = *++_Peek;
if ((_By & 0b1100'0000u) != 0b1000'0000u) { // out-of-sequence lead byte
return error;
}
_Code_point = (_Code_point << 6) | (_By & 0b11'1111u);
} while (--_Trailing_count != 0);
if (_Code_point < 0x10000u) {
if (_Code_point >= 0xd800u && _Code_point < 0xe000u) { // invalid code point (surrogate)
return error;
}
// Output single code unit
*_First2 = static_cast<char16_t>(_Code_point);
} else if (_Code_point >= 0x110000u) { // Invalid code point (out of range)
return error;
} else {
// Output surrogate pair
_Code_point -= 0x10000u;
// High surrogate: 0xd800 | <upper ten bits>
*_First2 = static_cast<char16_t>(0xd800u | (_Code_point >> 10));
// Low surrogate: 0xdc00 | <lower ten bits>
*++_First2 = static_cast<char16_t>(0xdc00u | (_Code_point & 0b11'1111'1111u));
}
_First1 = _Peek;
}
return ok;
}
virtual result __CLR_OR_THIS_CALL do_out(mbstate_t&, const char16_t* _First1, const char16_t* _Last1,
const char16_t*& _Mid1, char8_t* _First2, char8_t* _Last2, char8_t*& _Mid2) const {
// convert UTF-16 [_First1, _Last1) to UTF-8 [_First2, _Last2)
_Adl_verify_range(_First1, _Last1);
_Adl_verify_range(_First2, _Last2);
_Codecvt_guard<char16_t, char8_t> _Guard{_First1, _Mid1, _First2, _Mid2};
for (; _First1 != _Last1; ++_First1, ++_First2) {
if (_First2 == _Last2) { // no more output
return partial;
}
char32_t _Code_point = *_First1;
if (_Code_point < 0x80u) { // encode 1-byte sequence
*_First2 = static_cast<char8_t>(_Code_point);
continue;
}
int _Trailing_count = 1;
if (_Code_point < 0x800u) { // encode 2-byte sequence
*_First2 = static_cast<char8_t>(0b1100'0000u | (_Code_point >> 6));
} else if (_Code_point < 0xd800u || _Code_point >= 0xe000u) { // encode 3-byte sequence
*_First2 = static_cast<char8_t>(0b1110'0000u | (_Code_point >> 12));
_Trailing_count = 2;
} else if (_Code_point < 0xdc00u) { // high surrogate; parse the low surrogate
if (_Last1 - _First1 < 2) { // not enough input
return partial;
}
const char16_t _Low_surrogate = *++_First1;
if (_Low_surrogate < 0xdc00u || _Low_surrogate >= 0xe000u) { // invalid low surrogate
--_First1;
return error;
}
_Code_point = 0x10000u + (((_Code_point & 0b11'1111'1111u) << 10) | (_Low_surrogate & 0b11'1111'1111u));
// encode 4-byte sequence
*_First2 = static_cast<char8_t>(0b1111'0000u | (_Code_point >> 18));
_Trailing_count = 3;
} else { // out-of-sequence low surrogate
return error;
}
if (_Last2 - _First2 < _Trailing_count + 1) { // not enough output
if (_Trailing_count > 2) { // input was a surrogate pair; revert
--_First1;
}
return partial;
}
do {
--_Trailing_count;
*++_First2 = static_cast<char8_t>(0b1000'0000u | ((_Code_point >> (6 * _Trailing_count)) & 0b11'1111u));
} while (_Trailing_count != 0);
}
return ok;
}
virtual result __CLR_OR_THIS_CALL do_unshift(mbstate_t&, char8_t* _First2, char8_t*, char8_t*& _Mid2) const {
// terminate encoding sequence
_Mid2 = _First2;
return noconv; // no termination necessary
}
virtual int __CLR_OR_THIS_CALL do_length(
mbstate_t&, const char8_t* _First1, const char8_t* _Last1, size_t _Count) const {
// return p - _First1, for the largest value p in [_First1, _Last1] such that [_First1, p) successfully
// converts to at most _Count UTF-16 code units
_Adl_verify_range(_First1, _Last1);
const auto _Old_first1 = _First1;
for (; _First1 != _Last1 && _Count > 0u; ++_First1, --_Count) {
char32_t _Code_point = *_First1;
if (_Code_point < 0b1000'0000u) { // single-byte sequence
continue;
}
int _Trailing_count = 1;
if (_Code_point < 0b1110'0000u) {
if (_Code_point < 0b1100'0000u) { // out-of-sequence trailing byte
break;
}
// lead byte of 2-byte sequence
_Code_point &= 0b0001'1111u;
} else if (_Code_point < 0b1111'0000u) { // lead byte of 3-byte sequence
_Code_point &= 0b0000'1111u;
_Trailing_count = 2;
} else if (_Code_point < 0b1111'1000u) { // lead byte of 4-byte sequence
if (_Count < 2u) { // not enough output
break;
}
_Code_point &= 0b0000'0111u;
_Trailing_count = 3;
} else { // Invalid UTF-8 code unit
break;
}
if (_Last1 - _First1 < _Trailing_count + 1) { // not enough input
break;
}
const char8_t* _Peek = _First1;
bool _Done = false;
do {
const char8_t _By = *++_Peek;
if ((_By & 0b1100'0000u) != 0b1000'0000u) { // out-of-sequence lead byte
_Done = true;
break;
}
_Code_point = (_Code_point << 6) | (_By & 0b11'1111u);
} while (--_Trailing_count != 0);
if (_Done) {
break;
}
if (_Code_point < 0x10000u) { // Output single code unit
if (_Code_point >= 0xd800u && _Code_point < 0xe0000u) { // invalid code point (surrogate)
break;
}
} else if (_Code_point < 0x110000u) { // Output surrogate pair
--_Count;
} else { // Invalid code point (out of range)
break;
}
_First1 = _Peek;
}
return static_cast<int>((_STD min)(_First1 - _Old_first1, ptrdiff_t{INT_MAX}));
}
bool __CLR_OR_THIS_CALL do_always_noconv() const noexcept override {
// return true if conversions never change input
return false;
}
int __CLR_OR_THIS_CALL do_max_length() const noexcept override {
// return maximum length required for a conversion
return 4; // 4-byte max input sequence
}
int __CLR_OR_THIS_CALL do_encoding() const noexcept override {
// return length of code sequence (from codecvt)
return 0; // 0 => varying length
}
};
extern "C++" template <>
class _CXX20_DEPRECATE_CODECVT_CHAR8_T_FACETS codecvt<char32_t, char8_t, mbstate_t> : public codecvt_base {
// facet for converting between UTF-32 and UTF-8 sequences
public:
using intern_type = char32_t;
using extern_type = char8_t;
using state_type = mbstate_t;
result in(mbstate_t& _State, const char8_t* _First1, const char8_t* _Last1, const char8_t*& _Mid1,
char32_t* _First2, char32_t* _Last2, char32_t*& _Mid2) const {
// convert UTF-8 [_First1, _Last1) to UTF-32 [_First2, _Last2)
return do_in(_State, _First1, _Last1, _Mid1, _First2, _Last2, _Mid2);
}
result out(mbstate_t& _State, const char32_t* _First1, const char32_t* _Last1, const char32_t*& _Mid1,
char8_t* _First2, char8_t* _Last2, char8_t*& _Mid2) const {
// convert UTF-32 [_First1, _Last1) to UTF-8 [_First2, _Last2)
return do_out(_State, _First1, _Last1, _Mid1, _First2, _Last2, _Mid2);
}
result unshift(mbstate_t& _State, char8_t* _First2, char8_t* _Last2, char8_t*& _Mid2) const {
// generate bytes to return to default shift state
return do_unshift(_State, _First2, _Last2, _Mid2);
}
int length(mbstate_t& _State, const char8_t* _First1, const char8_t* _Last1, size_t _Count) const {
// return p - _First1, for the largest value p in [_First1, _Last1] such that [_First1, p) successfully
// converts to at most _Count UTF-32 code units
return do_length(_State, _First1, _Last1, _Count);
}
_CRT_SATELLITE_CODECVT_IDS static locale::id id;
explicit codecvt(size_t _Refs = 0) : codecvt_base(_Refs) {} // construct "from current locale"
explicit codecvt(const _Locinfo&, size_t _Refs = 0) : codecvt_base(_Refs) {} // construct "from specified locale"
static size_t __CLRCALL_OR_CDECL _Getcat(const locale::facet** _Ppf = nullptr, const locale* = nullptr) {
// return locale category mask and construct standard facet
if (_Ppf && !*_Ppf) {
*_Ppf = new codecvt;
}
return _X_CTYPE;
}
protected:
__CLR_OR_THIS_CALL ~codecvt() noexcept override = default;
virtual result __CLR_OR_THIS_CALL do_in(mbstate_t&, const char8_t* _First1, const char8_t* _Last1,
const char8_t*& _Mid1, char32_t* _First2, char32_t* _Last2, char32_t*& _Mid2) const {
// convert UTF-8 [_First1, _Last1) to UTF-32 [_First2, _Last2)
_Adl_verify_range(_First1, _Last1);
_Adl_verify_range(_First2, _Last2);
_Codecvt_guard<char8_t, char32_t> _Guard{_First1, _Mid1, _First2, _Mid2};
for (; _First1 != _Last1; ++_First1, ++_First2) {
if (_First2 == _Last2) {
return partial;
}
char8_t _Lead_byte = *_First1;
if (_Lead_byte < 0b1000'0000u) { // single-byte sequence
*_First2 = _Lead_byte;
continue;
}
int _Trailing_count = 1;
if (_Lead_byte < 0b1110'0000u) {
if (_Lead_byte < 0b1100'0000u) { // out-of-sequence trailing byte
return partial;
}
// lead byte of 2-byte sequence
_Lead_byte &= 0b0001'1111u;
} else if (_Lead_byte < 0b1111'0000u) { // lead byte of 3-byte sequence
_Lead_byte &= 0b0000'1111u;
_Trailing_count = 2;
} else if (_Lead_byte < 0b1111'1000u) { // lead byte of 4-byte sequence
_Lead_byte &= 0b0000'0111u;
_Trailing_count = 3;
} else { // invalid UTF-8 code unit
return error;
}
if (_Last1 - _First1 < _Trailing_count + 1) { // not enough input
return partial;
}
const char8_t* _Peek = _First1;
char32_t _Code_point = _Lead_byte;
do {
const char8_t _By = *++_Peek;
if ((_By & 0b1100'0000u) != 0b1000'0000u) { // out-of-sequence lead byte
return error;
}
_Code_point = (_Code_point << 6) | (_By & 0b11'1111u);
} while (--_Trailing_count != 0);
if (_Code_point >= 0xd800u && (_Code_point < 0xe000u || _Code_point >= 0x110000u)) {
// invalid code point (surrogate or out of range)
return error;
}
_First1 = _Peek;
*_First2 = _Code_point;
}
return ok;
}
virtual result __CLR_OR_THIS_CALL do_out(mbstate_t&, const char32_t* _First1, const char32_t* _Last1,
const char32_t*& _Mid1, char8_t* _First2, char8_t* _Last2, char8_t*& _Mid2) const {
// convert UTF-32 [_First1, _Last1) to UTF-8 [_First2, _Last2)
_Adl_verify_range(_First1, _Last1);
_Adl_verify_range(_First2, _Last2);
_Codecvt_guard<char32_t, char8_t> _Guard{_First1, _Mid1, _First2, _Mid2};
for (; _First1 != _Last1; ++_First1, ++_First2) {
if (_First2 == _Last2) { // no more output
return partial;
}
const char32_t _Code_point = *_First1;
if (_Code_point < 0x80u) { // encode 1-byte sequence
*_First2 = static_cast<char8_t>(_Code_point);
continue;
}
int _Trailing_count = 1;
if (_Code_point < 0x800u) { // encode 2-byte sequence
*_First2 = static_cast<char8_t>(0b1100'0000u | (_Code_point >> 6));
} else if (_Code_point < 0x10000u) { // encode 3-byte sequence
if (_Code_point >= 0xd800u && _Code_point < 0xe000u) { // invalid code point (surrogate)
return error;
}
*_First2 = static_cast<char8_t>(0b1110'0000u | (_Code_point >> 12));
_Trailing_count = 2;
} else if (_Code_point < 0x110000u) { // encode 4-byte sequence
*_First2 = static_cast<char8_t>(0b1111'0000u | (_Code_point >> 18));
_Trailing_count = 3;
} else { // Invalid code point (out of range)
return error;
}
if (_Last2 - _First2 < _Trailing_count + 1) { // not enough output
return partial;
}
do {
--_Trailing_count;
*++_First2 = static_cast<char8_t>(0b1000'0000u | ((_Code_point >> (6 * _Trailing_count)) & 0b11'1111u));
} while (_Trailing_count != 0);
}
return ok;
}
virtual result __CLR_OR_THIS_CALL do_unshift(mbstate_t&, char8_t* _First2, char8_t*, char8_t*& _Mid2) const {
// terminate encoding sequence
_Mid2 = _First2;
return noconv; // no termination necessary
}
virtual int __CLR_OR_THIS_CALL do_length(
mbstate_t&, const char8_t* _First1, const char8_t* _Last1, size_t _Count) const {
// return p - _First1, for the largest value p in [_First1, _Last1] such that [_First1, p) successfully
// converts to at most _Count UTF-32 code units
_Adl_verify_range(_First1, _Last1);
const auto _Old_first1 = _First1;
for (; _First1 != _Last1 && _Count > 0u; ++_First1, --_Count) {
char32_t _Code_point = *_First1;
if (_Code_point < 0b1000'0000u) { // single-byte sequence
continue;
}
int _Trailing_count = 1;
if (_Code_point < 0b1110'0000u) {
if (_Code_point < 0b1100'0000u) { // out-of-sequence trailing byte
break;
}
// lead byte of 2-byte sequence
_Code_point &= 0b0001'1111u;
} else if (_Code_point < 0b1111'0000u) { // lead byte of 3-byte sequence
_Code_point &= 0b0000'1111u;
_Trailing_count = 2;
} else if (_Code_point < 0b1111'1000u) { // lead byte of 4-byte sequence
_Code_point &= 0b0000'0111u;
_Trailing_count = 3;
} else { // invalid UTF-8 code unit
break;
}
if (_Last1 - _First1 < _Trailing_count + 1) { // not enough input
break;
}
const char8_t* _Peek = _First1;
bool _Done = false;
do {
const char8_t _By = *++_Peek;
if ((_By & 0b1100'0000u) != 0b1000'0000u) { // out-of-sequence lead byte
_Done = true;
break;
}
_Code_point = (_Code_point << 6) | (_By & 0b11'1111u);
} while (--_Trailing_count != 0);
if (_Done || (_Code_point >= 0xd800u && (_Code_point < 0xe000u || _Code_point >= 0x110000u))) {
// invalid code point (surrogate or out of range)
break;
}
_First1 = _Peek;
}
return static_cast<int>((_STD min)(_First1 - _Old_first1, ptrdiff_t{INT_MAX}));
}
bool __CLR_OR_THIS_CALL do_always_noconv() const noexcept override {
// return true if conversions never change input
return false;
}
int __CLR_OR_THIS_CALL do_max_length() const noexcept override {
// return maximum length required for a conversion
return 4;
}
int __CLR_OR_THIS_CALL do_encoding() const noexcept override {
// return length of code sequence (from codecvt)
return 0; // varying length
}
};
#endif // defined(__cpp_char8_t) && !defined(_M_CEE_PURE)
extern "C++" template <>
class _CRTIMP2_PURE_IMPORT codecvt<wchar_t, char, mbstate_t> : public codecvt_base {
// facet for converting between wchar_t and char (_Byte) sequences
public:
using intern_type = wchar_t;
using extern_type = char;
using state_type = mbstate_t;
result __CLR_OR_THIS_CALL in(mbstate_t& _State, const char* _First1, const char* _Last1, const char*& _Mid1,
wchar_t* _First2, wchar_t* _Last2, wchar_t*& _Mid2) const {
// convert bytes [_First1, _Last1) to [_First2, _Last2)
return do_in(_State, _First1, _Last1, _Mid1, _First2, _Last2, _Mid2);
}
result __CLR_OR_THIS_CALL out(mbstate_t& _State, const wchar_t* _First1, const wchar_t* _Last1,
const wchar_t*& _Mid1, char* _First2, char* _Last2, char*& _Mid2) const {
// convert [_First1, _Last1) to bytes [_First2, _Last2)
return do_out(_State, _First1, _Last1, _Mid1, _First2, _Last2, _Mid2);
}
result __CLR_OR_THIS_CALL unshift(mbstate_t& _State, char* _First2, char* _Last2, char*& _Mid2) const {
// generate bytes to return to default shift state
return do_unshift(_State, _First2, _Last2, _Mid2);
}
int __CLR_OR_THIS_CALL length(mbstate_t& _State, const char* _First1, const char* _Last1, size_t _Count) const {
// return p - _First1, for the largest value p in [_First1, _Last1] such that [_First1, p) successfully
// converts to at most _Count wide characters
return do_length(_State, _First1, _Last1, _Count);
}
__PURE_APPDOMAIN_GLOBAL static locale::id id;
explicit __CLR_OR_THIS_CALL codecvt(size_t _Refs = 0) : codecvt_base(_Refs) {
_BEGIN_LOCINFO(_Lobj)
_Init(_Lobj);
_END_LOCINFO()
}
explicit __CLR_OR_THIS_CALL codecvt(const _Locinfo& _Lobj, size_t _Refs = 0) : codecvt_base(_Refs) {
_Init(_Lobj);
}
static size_t __CLRCALL_OR_CDECL _Getcat(const locale::facet** _Ppf = nullptr, const locale* _Ploc = nullptr) {
// return locale category mask and construct standard facet
if (_Ppf && !*_Ppf) {
*_Ppf = new codecvt(_Locinfo(_Ploc->_C_str()));
}
return _X_CTYPE;
}
protected:
__CLR_OR_THIS_CALL ~codecvt() noexcept override {}
void __CLR_OR_THIS_CALL _Init(const _Locinfo& _Lobj) { // initialize from _Lobj
_Cvt = _Lobj._Getcvt();
}
virtual result __CLR_OR_THIS_CALL do_in(mbstate_t&, const char* _First1, const char* _Last1, const char*& _Mid1,
wchar_t* _First2, wchar_t* _Last2, wchar_t*& _Mid2) const {
// convert bytes [_First1, _Last1) to [_First2, _Last2)
mbstate_t _Mystate{};
_Adl_verify_range(_First1, _Last1);
_Adl_verify_range(_First2, _Last2);
_Mid1 = _First1;
_Mid2 = _First2;
for (;;) {
if (_Mid1 == _Last1) {
return ok;
}
if (_Mid2 == _Last2) {
return partial;
}
int _Bytes = _Mbrtowc(_Mid2, _Mid1, static_cast<size_t>(_Last1 - _Mid1), &_Mystate, &_Cvt);
switch (_Bytes) {
case -2: // partial conversion
return partial;
case -1: // failed conversion
return error;
case 0: // converted NULL character, TRANSITION, VSO-654347
_Bytes = 1;
_FALLTHROUGH;
default: // converted some other character
_Mid1 += _Bytes;
++_Mid2;
break;
}
}
}
virtual result __CLR_OR_THIS_CALL do_out(mbstate_t& _State, const wchar_t* _First1, const wchar_t* _Last1,
const wchar_t*& _Mid1, char* _First2, char* _Last2, char*& _Mid2) const {
// convert [_First1, _Last1) to bytes [_First2, _Last2)
_Adl_verify_range(_First1, _Last1);
_Adl_verify_range(_First2, _Last2);
_Mid1 = _First1;
_Mid2 = _First2;
int _Bytes;
while (_Mid1 != _Last1 && _Mid2 != _Last2) {
if (MB_LEN_MAX <= _Last2 - _Mid2) {
if ((_Bytes = _Wcrtomb(_Mid2, *_Mid1, &_State, &_Cvt)) < 0) {
return error; // locale-specific wcrtomb failed
} else {
++_Mid1;
_Mid2 += _Bytes;
}
} else { // destination too small, convert into buffer
char _Buf[MB_LEN_MAX];
mbstate_t _Stsave = _State;
if ((_Bytes = _Wcrtomb(_Buf, *_Mid1, &_State, &_Cvt)) < 0) {
return error; // locale-specific wcrtomb failed
} else if (_Last2 - _Mid2 < _Bytes) { // converted too many, roll back and return previous
_State = _Stsave;
break;
} else { // copy converted bytes from buffer
_CSTD memcpy(_Mid2, _Buf, static_cast<size_t>(_Bytes));
++_Mid1;
_Mid2 += _Bytes;
}
}
}
return _Mid1 == _Last1 ? ok : partial;
}
virtual result __CLR_OR_THIS_CALL do_unshift(mbstate_t& _State, char* _First2, char* _Last2, char*& _Mid2) const {
// generate bytes to return to default shift state
_Adl_verify_range(_First2, _Last2);
_Mid2 = _First2;
result _Ans = ok;
int _Bytes;
char _Buf[MB_LEN_MAX];
mbstate_t _Stsave = _State;
if ((_Bytes = _Wcrtomb(_Buf, L'\0', &_State, &_Cvt)) <= 0) {
_Ans = error; // locale-specific wcrtomb failed
} else if (_Last2 - _Mid2 < --_Bytes) { // converted too many, roll back and return
_State = _Stsave;
_Ans = partial;
} else if (0 < _Bytes) { // copy converted bytes from buffer
_CSTD memcpy(_Mid2, _Buf, static_cast<size_t>(_Bytes));
_Mid2 += _Bytes;
}
return _Ans;
}
virtual int __CLR_OR_THIS_CALL do_length(
mbstate_t& _State, const char* _First1, const char* _Last1, size_t _Count) const {
// return p - _First1, for the largest value p in [_First1, _Last1] such that [_First1, p) successfully
// converts to at most _Count wide characters
_Adl_verify_range(_First1, _Last1);
const auto _Old_first1 = _First1;
for (; _Count > 0u && _First1 != _Last1; --_Count) {
wchar_t _Ch;
int _Bytes = _Mbrtowc(&_Ch, _First1, static_cast<size_t>(_Last1 - _First1), &_State, &_Cvt);
if (_Bytes < 0) { // partial or failed conversion
break;
}
if (_Bytes == 0) { // converted NULL character, TRANSITION, VSO-654347
_Bytes = 1;
}
// converted _Bytes bytes to a wide character
_First1 += _Bytes;
}
return static_cast<int>((_STD min)(_First1 - _Old_first1, ptrdiff_t{INT_MAX}));
}
bool __CLR_OR_THIS_CALL do_always_noconv() const noexcept override {
// return true if conversions never change input
return false;
}
int __CLR_OR_THIS_CALL do_max_length() const noexcept override {
// return maximum length required for a conversion (from codecvt)
return static_cast<int>(_Cvt._Mbcurmax);
}
int __CLR_OR_THIS_CALL do_encoding() const noexcept override {
// return length of code sequence (from codecvt)
return _Cvt._Mbcurmax == 1; // 0 => varying length, 1 => fixed length
}
private:
_Locinfo::_Cvtvec _Cvt; // locale info passed to _Mbrtowc, _Wcrtomb
};
#if defined(_NATIVE_WCHAR_T_DEFINED) && !_ENFORCE_FACET_SPECIALIZATIONS
extern "C++" template <>
class _CRTIMP2_PURE_IMPORT codecvt<unsigned short, char, mbstate_t> : public codecvt_base {
// facet for converting between unsigned short and char sequences
public:
using intern_type = unsigned short;
using extern_type = char;
using state_type = mbstate_t;
result __CLR_OR_THIS_CALL in(mbstate_t& _State, const char* _First1, const char* _Last1, const char*& _Mid1,
unsigned short* _First2, unsigned short* _Last2, unsigned short*& _Mid2) const {
// convert bytes [_First1, _Last1) to [_First2, _Last2)
return do_in(_State, _First1, _Last1, _Mid1, _First2, _Last2, _Mid2);
}
result __CLR_OR_THIS_CALL out(mbstate_t& _State, const unsigned short* _First1, const unsigned short* _Last1,
const unsigned short*& _Mid1, char* _First2, char* _Last2, char*& _Mid2) const {
// convert [_First1, _Last1) to bytes [_First2, _Last2)
return do_out(_State, _First1, _Last1, _Mid1, _First2, _Last2, _Mid2);
}
result __CLR_OR_THIS_CALL unshift(mbstate_t& _State, char* _First2, char* _Last2, char*& _Mid2) const {
// generate bytes to return to default shift state
return do_unshift(_State, _First2, _Last2, _Mid2);
}
int __CLR_OR_THIS_CALL length(mbstate_t& _State, const char* _First1, const char* _Last1, size_t _Count) const {
// return p - _First1, for the largest value p in [_First1, _Last1] such that [_First1, p) successfully
// converts to at most _Count _Elems
return do_length(_State, _First1, _Last1, _Count);
}
__PURE_APPDOMAIN_GLOBAL static locale::id id;
explicit __CLR_OR_THIS_CALL codecvt(size_t _Refs = 0) : codecvt_base(_Refs) {
_BEGIN_LOCINFO(_Lobj)
_Init(_Lobj);
_END_LOCINFO()
}
explicit __CLR_OR_THIS_CALL codecvt(const _Locinfo& _Lobj, size_t _Refs = 0) : codecvt_base(_Refs) {
_Init(_Lobj);
}
static size_t __CLRCALL_OR_CDECL _Getcat(const locale::facet** _Ppf = nullptr, const locale* _Ploc = nullptr) {
// return locale category mask and construct standard facet
if (_Ppf && !*_Ppf) {
*_Ppf = new codecvt(_Locinfo(_Ploc->_C_str()));
}
return _X_CTYPE;
}
protected:
__CLR_OR_THIS_CALL ~codecvt() noexcept override {}
void __CLR_OR_THIS_CALL _Init(const _Locinfo& _Lobj) { // initialize from _Lobj
_Cvt = _Lobj._Getcvt();
}
virtual result __CLR_OR_THIS_CALL do_in(mbstate_t&, const char* _First1, const char* _Last1, const char*& _Mid1,
unsigned short* _First2, unsigned short* _Last2, unsigned short*& _Mid2) const {
// convert bytes [_First1, _Last1) to [_First2, _Last2)
mbstate_t _Mystate{};
_Adl_verify_range(_First1, _Last1);
_Adl_verify_range(_First2, _Last2);
_Mid1 = _First1;
_Mid2 = _First2;
for (;;) {
if (_Mid1 == _Last1) {
return ok;
}
if (_Mid2 == _Last2) {
return partial;
}
int _Bytes = _Mbrtowc(
reinterpret_cast<wchar_t*>(_Mid2), _Mid1, static_cast<size_t>(_Last1 - _Mid1), &_Mystate, &_Cvt);
switch (_Bytes) {
case -2: // partial conversion
return partial;
case -1: // failed conversion
return error;
case 0: // converted NULL character, TRANSITION, VSO-654347
_Bytes = 1;
_FALLTHROUGH;
default: // converted some other character
_Mid1 += _Bytes;
++_Mid2;
break;
}
}
}
virtual result __CLR_OR_THIS_CALL do_out(mbstate_t& _State, const unsigned short* _First1,
const unsigned short* _Last1, const unsigned short*& _Mid1, char* _First2, char* _Last2, char*& _Mid2) const {
// convert [_First1, _Last1) to bytes [_First2, _Last2)
_Adl_verify_range(_First1, _Last1);
_Adl_verify_range(_First2, _Last2);
_Mid1 = _First1;
_Mid2 = _First2;
int _Bytes;
while (_Mid1 != _Last1 && _Mid2 != _Last2) {
if (MB_LEN_MAX <= _Last2 - _Mid2) {
if ((_Bytes = _Wcrtomb(_Mid2, *_Mid1, &_State, &_Cvt)) < 0) {
return error; // locale-specific wcrtomb failed
} else {
++_Mid1;
_Mid2 += _Bytes;
}
} else { // destination too small, convert into buffer
char _Buf[MB_LEN_MAX];
mbstate_t _Stsave = _State;
if ((_Bytes = _Wcrtomb(_Buf, *_Mid1, &_State, &_Cvt)) < 0) {
return error; // locale-specific wcrtomb failed
} else if (_Last2 - _Mid2 < _Bytes) { // converted too many, roll back and return previous
_State = _Stsave;
break;
} else { // copy converted bytes from buffer
_CSTD memcpy(_Mid2, _Buf, static_cast<size_t>(_Bytes));
++_Mid1;
_Mid2 += _Bytes;
}
}
}
return _Mid1 == _Last1 ? ok : partial;
}
virtual result __CLR_OR_THIS_CALL do_unshift(mbstate_t& _State, char* _First2, char* _Last2, char*& _Mid2) const {
// generate bytes to return to default shift state
_Adl_verify_range(_First2, _Last2);
_Mid2 = _First2;
result _Ans = ok;
int _Bytes;
char _Buf[MB_LEN_MAX];
mbstate_t _Stsave = _State;
if ((_Bytes = _Wcrtomb(_Buf, L'\0', &_State, &_Cvt)) <= 0) {
_Ans = error; // locale-specific wcrtomb failed
} else if (_Last2 - _Mid2 < --_Bytes) { // converted too many, roll back and return
_State = _Stsave;
_Ans = partial;
} else if (0 < _Bytes) { // copy converted bytes from buffer
_CSTD memcpy(_Mid2, _Buf, static_cast<size_t>(_Bytes));
_Mid2 += _Bytes;
}
return _Ans;
}
virtual int __CLR_OR_THIS_CALL do_length(
mbstate_t& _State, const char* _First1, const char* _Last1, size_t _Count) const {
// return p - _First1, for the largest value p in [_First1, _Last1] such that [_First1, p) successfully
// converts to at most _Count wide characters
_Adl_verify_range(_First1, _Last1);
const auto _Old_first1 = _First1;
for (; _Count > 0u && _First1 != _Last1; --_Count) {
wchar_t _Ch;
int _Bytes = _Mbrtowc(&_Ch, _First1, static_cast<size_t>(_Last1 - _First1), &_State, &_Cvt);
if (_Bytes < 0) { // partial or failed conversion
break;
}
if (_Bytes == 0) { // converted NULL character, TRANSITION, VSO-654347
_Bytes = 1;
}
// converted _Bytes bytes to a wide character
_First1 += _Bytes;
}
return static_cast<int>((_STD min)(_First1 - _Old_first1, ptrdiff_t{INT_MAX}));
}
bool __CLR_OR_THIS_CALL do_always_noconv() const noexcept override {
// return true if conversions never change input
return false;
}
int __CLR_OR_THIS_CALL do_max_length() const noexcept override {
// return maximum length required for a conversion (from codecvt)
return static_cast<int>(_Cvt._Mbcurmax);
}
int __CLR_OR_THIS_CALL do_encoding() const noexcept override {
// return length of code sequence (from codecvt)
return _Cvt._Mbcurmax == 1u; // 0 => varying length, 1 => fixed length
}
private:
_Locinfo::_Cvtvec _Cvt; // locale info passed to _Mbrtowc, _Wcrtomb
};
#endif // defined(_NATIVE_WCHAR_T_DEFINED) && !_ENFORCE_FACET_SPECIALIZATIONS
_EXPORT_STD template <class _Elem, class _Byte, class _Statype>
class codecvt_byname : public codecvt<_Elem, _Byte, _Statype> {
public:
static_assert(!_ENFORCE_FACET_SPECIALIZATIONS
|| _Is_any_of_v<codecvt_byname, codecvt_byname<char, char, mbstate_t>,
codecvt_byname<wchar_t, char, mbstate_t>>,
_FACET_SPECIALIZATION_MESSAGE);
explicit __CLR_OR_THIS_CALL codecvt_byname(const char* _Locname, size_t _Refs = 0)
: codecvt<_Elem, _Byte, _Statype>(_Locinfo(_Locname), _Refs) {}
explicit __CLR_OR_THIS_CALL codecvt_byname(const string& _Str, size_t _Refs = 0)
: codecvt<_Elem, _Byte, _Statype>(_Locinfo(_Str.c_str()), _Refs) {}
protected:
__CLR_OR_THIS_CALL ~codecvt_byname() noexcept override {}
};
_STL_DISABLE_DEPRECATED_WARNING
template <>
class _CXX20_DEPRECATE_CODECVT_FACETS codecvt_byname<char16_t, char, mbstate_t>
: public codecvt<char16_t, char, mbstate_t> {
public:
explicit __CLR_OR_THIS_CALL codecvt_byname(const char* _Locname, size_t _Refs = 0)
: codecvt(_Locinfo(_Locname), _Refs) {}
explicit __CLR_OR_THIS_CALL codecvt_byname(const string& _Str, size_t _Refs = 0)
: codecvt(_Locinfo(_Str.c_str()), _Refs) {}
protected:
__CLR_OR_THIS_CALL ~codecvt_byname() noexcept override {}
};
template <>
class _CXX20_DEPRECATE_CODECVT_FACETS codecvt_byname<char32_t, char, mbstate_t>
: public codecvt<char32_t, char, mbstate_t> {
public:
explicit __CLR_OR_THIS_CALL codecvt_byname(const char* _Locname, size_t _Refs = 0)
: codecvt(_Locinfo(_Locname), _Refs) {}
explicit __CLR_OR_THIS_CALL codecvt_byname(const string& _Str, size_t _Refs = 0)
: codecvt(_Locinfo(_Str.c_str()), _Refs) {}
protected:
__CLR_OR_THIS_CALL ~codecvt_byname() noexcept override {}
};
#ifdef __cpp_char8_t
template <>
class _CXX20_DEPRECATE_CODECVT_CHAR8_T_FACETS codecvt_byname<char16_t, char8_t, mbstate_t>
: public codecvt<char16_t, char8_t, mbstate_t> {
public:
explicit __CLR_OR_THIS_CALL codecvt_byname(const char* _Locname, size_t _Refs = 0)
: codecvt(_Locinfo(_Locname), _Refs) {}
explicit __CLR_OR_THIS_CALL codecvt_byname(const string& _Str, size_t _Refs = 0)
: codecvt(_Locinfo(_Str.c_str()), _Refs) {}
protected:
__CLR_OR_THIS_CALL ~codecvt_byname() noexcept override {}
};
template <>
class _CXX20_DEPRECATE_CODECVT_CHAR8_T_FACETS codecvt_byname<char32_t, char8_t, mbstate_t>
: public codecvt<char32_t, char8_t, mbstate_t> {
public:
explicit __CLR_OR_THIS_CALL codecvt_byname(const char* _Locname, size_t _Refs = 0)
: codecvt(_Locinfo(_Locname), _Refs) {}
explicit __CLR_OR_THIS_CALL codecvt_byname(const string& _Str, size_t _Refs = 0)
: codecvt(_Locinfo(_Str.c_str()), _Refs) {}
protected:
__CLR_OR_THIS_CALL ~codecvt_byname() noexcept override {}
};
#endif // defined(__cpp_char8_t)
_STL_RESTORE_DEPRECATED_WARNING
#define _XA 0x100 // extra alphabetic
#define _BB _CONTROL // BEL, BS, etc.
#define _CN _SPACE // CR, FF, HT, NL, VT
#define _DI _DIGIT // '0'-'9'
#define _LO _LOWER // 'a'-'z'
#define _PU _PUNCT // punctuation
#define _SP _BLANK // space
#define _UP _UPPER // 'A'-'Z'
#define _XD _HEX // '0'-'9', 'A'-'F', 'a'-'f'
_EXPORT_STD extern "C++" struct _CRTIMP2_PURE_IMPORT ctype_base // base for ctype
: locale::facet // TRANSITION, ABI, shouldn't be derived from locale::facet
{
enum { // constants for character classifications
alnum = _DI | _LO | _UP | _XA,
alpha = _LO | _UP | _XA,
cntrl = _BB,
digit = _DI,
graph = _DI | _LO | _PU | _UP | _XA,
lower = _LO,
print = _DI | _LO | _PU | _SP | _UP | _XA | _XD,
punct = _PU,
space = _CN | _SP,
upper = _UP,
xdigit = _XD,
blank = _CN | _SP
};
using mask = short; // to match <ctype.h>
__CLR_OR_THIS_CALL ctype_base(size_t _Refs = 0) noexcept // strengthened
: locale::facet(_Refs) {}
__CLR_OR_THIS_CALL ~ctype_base() noexcept override {}
};
#undef _XA
#undef _BB
#undef _CN
#undef _DI
#undef _LO
#undef _PU
#undef _SP
#undef _UP
#undef _XD
_EXPORT_STD extern "C++" template <class _Elem>
class ctype : public ctype_base { // facet for classifying elements, converting cases
public:
// ctype<char>, ctype<wchar_t>, and ctype<unsigned short> are explicitly specialized below.
static_assert(!_ENFORCE_FACET_SPECIALIZATIONS || _Always_false<_Elem>, _FACET_SPECIALIZATION_MESSAGE);
using char_type = _Elem;
bool __CLR_OR_THIS_CALL is(mask _Maskval, _Elem _Ch) const { // test if element fits any mask classifications
return do_is(_Maskval, _Ch);
}
const _Elem* __CLR_OR_THIS_CALL is(const _Elem* _First, const _Elem* _Last,
mask* _Dest) const { // get mask sequence for elements in [_First, _Last)
return do_is(_First, _Last, _Dest);
}
const _Elem* __CLR_OR_THIS_CALL scan_is(mask _Maskval, const _Elem* _First,
const _Elem* _Last) const { // find first in [_First, _Last) that fits mask classification
return do_scan_is(_Maskval, _First, _Last);
}
const _Elem* __CLR_OR_THIS_CALL scan_not(mask _Maskval, const _Elem* _First,
const _Elem* _Last) const { // find first in [_First, _Last) not fitting mask classification
return do_scan_not(_Maskval, _First, _Last);
}
_Elem __CLR_OR_THIS_CALL tolower(_Elem _Ch) const { // convert element to lower case
return do_tolower(_Ch);
}
const _Elem* __CLR_OR_THIS_CALL tolower(
_Elem* _First, const _Elem* _Last) const { // convert [_First, _Last) in place to lower case
return do_tolower(_First, _Last);
}
_Elem __CLR_OR_THIS_CALL toupper(_Elem _Ch) const { // convert element to upper case
return do_toupper(_Ch);
}
const _Elem* __CLR_OR_THIS_CALL toupper(
_Elem* _First, const _Elem* _Last) const { // convert [_First, _Last) in place to upper case
return do_toupper(_First, _Last);
}
_Elem __CLR_OR_THIS_CALL widen(char _Byte) const { // widen char
return do_widen(_Byte);
}
const char* __CLR_OR_THIS_CALL widen(const char* _First, const char* _Last,
_Elem* _Dest) const { // widen chars in [_First, _Last)
return do_widen(_First, _Last, _Dest);
}
char __CLR_OR_THIS_CALL narrow(_Elem _Ch, char _Dflt = '\0') const { // narrow element to char
return do_narrow(_Ch, _Dflt);
}
const _Elem* __CLR_OR_THIS_CALL narrow(const _Elem* _First, const _Elem* _Last, char _Dflt,
char* _Dest) const { // narrow elements in [_First, _Last) to chars
return do_narrow(_First, _Last, _Dflt, _Dest);
}
__PURE_APPDOMAIN_GLOBAL static locale::id id;
explicit __CLR_OR_THIS_CALL ctype(size_t _Refs = 0) : ctype_base(_Refs) {
_BEGIN_LOCINFO(_Lobj)
_Init(_Lobj);
_END_LOCINFO()
}
__CLR_OR_THIS_CALL ctype(const _Locinfo& _Lobj, size_t _Refs = 0) : ctype_base(_Refs) {
_Init(_Lobj);
}
static size_t __CLRCALL_OR_CDECL _Getcat(const locale::facet** _Ppf = nullptr, const locale* _Ploc = nullptr) {
if (_Ppf && !*_Ppf) {
*_Ppf = new ctype<_Elem>(_Locinfo(_Ploc->_C_str()));
}
return _X_CTYPE;
}
protected:
__CLR_OR_THIS_CALL ~ctype() noexcept override {
if (_Ctype._Delfl) {
_CSTD free(const_cast<short*>(_Ctype._Table));
}
_CSTD free(_Ctype._LocaleName);
}
void __CLR_OR_THIS_CALL _Init(const _Locinfo& _Lobj) { // initialize from _Lobj
_Ctype = _Lobj._Getctype();
_Cvt = _Lobj._Getcvt();
}
virtual bool __CLR_OR_THIS_CALL do_is(
mask _Maskval, _Elem _Ch) const { // test if element fits any mask classifications
return (_Ctype._Table[static_cast<unsigned char>(narrow(_Ch))] & _Maskval) != 0;
}
virtual const _Elem* __CLR_OR_THIS_CALL do_is(const _Elem* _First, const _Elem* _Last,
mask* _Dest) const { // get mask sequence for elements in [_First, _Last)
_Adl_verify_range(_First, _Last);
for (; _First != _Last; ++_First, ++_Dest) {
*_Dest = _Ctype._Table[static_cast<unsigned char>(narrow(*_First))];
}
return _First;
}
virtual const _Elem* __CLR_OR_THIS_CALL do_scan_is(mask _Maskval, const _Elem* _First,
const _Elem* _Last) const { // find first in [_First, _Last) that fits mask classification
_Adl_verify_range(_First, _Last);
while (_First != _Last && !is(_Maskval, *_First)) {
++_First;
}
return _First;
}
virtual const _Elem* __CLR_OR_THIS_CALL do_scan_not(mask _Maskval, const _Elem* _First,
const _Elem* _Last) const { // find first in [_First, _Last) not fitting mask classification
_Adl_verify_range(_First, _Last);
while (_First != _Last && is(_Maskval, *_First)) {
++_First;
}
return _First;
}
virtual _Elem __CLR_OR_THIS_CALL do_tolower(_Elem _Ch) const { // convert element to lower case
unsigned char _Byte = static_cast<unsigned char>(narrow(_Ch, '\0'));
if (_Byte == '\0') {
return _Ch;
}
return widen(static_cast<char>(_Tolower(_Byte, &_Ctype)));
}
virtual const _Elem* __CLR_OR_THIS_CALL do_tolower(_Elem* _First,
const _Elem* _Last) const { // convert [_First, _Last) in place to lower case
_Adl_verify_range(_First, _Last);
for (; _First != _Last; ++_First) { // convert *_First to lower case
unsigned char _Byte = static_cast<unsigned char>(narrow(*_First, '\0'));
if (_Byte != '\0') {
*_First = (widen(static_cast<char>(_Tolower(_Byte, &_Ctype))));
}
}
return _First;
}
virtual _Elem __CLR_OR_THIS_CALL do_toupper(_Elem _Ch) const { // convert element to upper case
unsigned char _Byte = static_cast<unsigned char>(narrow(_Ch, '\0'));
if (_Byte == '\0') {
return _Ch;
}
return widen(static_cast<char>(_Toupper(_Byte, &_Ctype)));
}
virtual const _Elem* __CLR_OR_THIS_CALL do_toupper(_Elem* _First,
const _Elem* _Last) const { // convert [_First, _Last) in place to upper case
_Adl_verify_range(_First, _Last);
for (; _First != _Last; ++_First) { // convert *_First to upper case
unsigned char _Byte = static_cast<unsigned char>(narrow(*_First, '\0'));
if (_Byte != '\0') {
*_First = (widen(static_cast<char>(_Toupper(_Byte, &_Ctype))));
}
}
return _First;
}
virtual _Elem __CLR_OR_THIS_CALL do_widen(char _Byte) const { // widen char
return _Maklocchr(_Byte, static_cast<_Elem*>(nullptr), _Cvt);
}
virtual const char* __CLR_OR_THIS_CALL do_widen(
const char* _First, const char* _Last, _Elem* _Dest) const { // widen chars in [_First, _Last)
_Adl_verify_range(_First, _Last);
for (; _First != _Last; ++_First, ++_Dest) {
*_Dest = _Maklocchr(*_First, static_cast<_Elem*>(nullptr), _Cvt);
}
return _First;
}
char __CLR_OR_THIS_CALL _Donarrow(_Elem _Ch, char _Dflt) const { // narrow element to char
char _Byte;
if (_Ch == _Elem{}) {
return '\0';
}
if ((_Byte = _Maklocbyte(_Ch, _Cvt)) == '\0') {
return _Dflt;
}
return _Byte;
}
virtual char __CLR_OR_THIS_CALL do_narrow(_Elem _Ch, char _Dflt) const { // narrow element to char
return _Donarrow(_Ch, _Dflt);
}
virtual const _Elem* __CLR_OR_THIS_CALL do_narrow(const _Elem* _First, const _Elem* _Last, char _Dflt,
char* _Dest) const { // narrow elements in [_First, _Last) to chars
_Adl_verify_range(_First, _Last);
for (; _First != _Last; ++_First, ++_Dest) {
*_Dest = _Donarrow(*_First, _Dflt);
}
return _First;
}
private:
_Locinfo::_Ctypevec _Ctype; // locale info passed to _Tolower, etc.
_Locinfo::_Cvtvec _Cvt; // conversion information
};
#ifdef __clang__
#pragma clang diagnostic push
#pragma clang diagnostic ignored "-Wdllimport-static-field-def"
#endif // defined(__clang__)
template <class _Elem>
locale::id ctype<_Elem>::id;
#ifdef __clang__
#pragma clang diagnostic pop
#endif // defined(__clang__)
extern "C++" template <>
class _CRTIMP2_PURE_IMPORT ctype<char> : public ctype_base { // facet for classifying char elements, converting cases
public:
using _Elem = char;
using char_type = _Elem;
bool __CLR_OR_THIS_CALL is(mask _Maskval, _Elem _Ch) const { // test if element fits any mask classifications
return (_Ctype._Table[static_cast<unsigned char>(_Ch)] & _Maskval) != 0;
}
const _Elem* __CLR_OR_THIS_CALL is(const _Elem* _First, const _Elem* _Last,
mask* _Dest) const { // get mask sequence for elements in [_First, _Last)
_Adl_verify_range(_First, _Last);
for (; _First != _Last; ++_First, ++_Dest) {
*_Dest = _Ctype._Table[static_cast<unsigned char>(*_First)];
}
return _First;
}
const _Elem* __CLR_OR_THIS_CALL scan_is(mask _Maskval, const _Elem* _First,
const _Elem* _Last) const { // find first in [_First, _Last) that fits mask classification
_Adl_verify_range(_First, _Last);
while (_First != _Last && !is(_Maskval, *_First)) {
++_First;
}
return _First;
}
const _Elem* __CLR_OR_THIS_CALL scan_not(mask _Maskval, const _Elem* _First,
const _Elem* _Last) const { // find first in [_First, _Last) not fitting mask classification
_Adl_verify_range(_First, _Last);
while (_First != _Last && is(_Maskval, *_First)) {
++_First;
}
return _First;
}
_Elem __CLR_OR_THIS_CALL tolower(_Elem _Ch) const { // convert element to lower case
return do_tolower(_Ch);
}
const _Elem* __CLR_OR_THIS_CALL tolower(
_Elem* _First, const _Elem* _Last) const { // convert [_First, _Last) in place to lower case
return do_tolower(_First, _Last);
}
_Elem __CLR_OR_THIS_CALL toupper(_Elem _Ch) const { // convert element to upper case
return do_toupper(_Ch);
}
const _Elem* __CLR_OR_THIS_CALL toupper(
_Elem* _First, const _Elem* _Last) const { // convert [_First, _Last) in place to upper case
return do_toupper(_First, _Last);
}
_Elem __CLR_OR_THIS_CALL widen(char _Byte) const { // widen char
return do_widen(_Byte);
}
const _Elem* __CLR_OR_THIS_CALL widen(const char* _First, const char* _Last,
_Elem* _Dest) const { // widen chars in [_First, _Last)
return do_widen(_First, _Last, _Dest);
}
_Elem __CLR_OR_THIS_CALL narrow(_Elem _Ch, char _Dflt = '\0') const { // narrow element to char
return do_narrow(_Ch, _Dflt);
}
const _Elem* __CLR_OR_THIS_CALL narrow(const _Elem* _First, const _Elem* _Last, char _Dflt,
char* _Dest) const { // narrow elements in [_First, _Last) to chars
return do_narrow(_First, _Last, _Dflt, _Dest);
}
__PURE_APPDOMAIN_GLOBAL static locale::id id;
explicit __CLR_OR_THIS_CALL ctype(const mask* _Table = nullptr, bool _Deletetable = false,
size_t _Refs = 0)
: ctype_base(_Refs) { // construct with specified table and delete flag for table
_BEGIN_LOCINFO(_Lobj)
_Init(_Lobj);
_END_LOCINFO()
_Tidy(); // free existing table, as needed
if (_Table) { // replace existing char to mask table
_Ctype._Table = _Table;
_Ctype._Delfl = _Deletetable ? -1 : 0;
} else { // use classic table
_Ctype._Table = classic_table();
_Ctype._Delfl = 0;
}
}
__CLR_OR_THIS_CALL ctype(const _Locinfo& _Lobj, size_t _Refs = 0) : ctype_base(_Refs) {
_Init(_Lobj);
}
static size_t __CLRCALL_OR_CDECL _Getcat(const locale::facet** _Ppf = nullptr, const locale* _Ploc = nullptr) {
if (_Ppf && !*_Ppf) {
*_Ppf = new ctype<_Elem>(_Locinfo(_Ploc->_C_str()));
}
return _X_CTYPE;
}
const mask* __CLR_OR_THIS_CALL table() const noexcept {
return _Ctype._Table;
}
static const mask* __CLRCALL_OR_CDECL classic_table() noexcept {
return _STD use_facet<ctype>(locale::classic()).table();
}
_PGLOBAL static const size_t table_size = 1 << CHAR_BIT; // size of ctype mapping table, typically 256
protected:
__CLR_OR_THIS_CALL ~ctype() noexcept override {
_Tidy();
}
void __CLR_OR_THIS_CALL _Init(const _Locinfo& _Lobj) { // initialize from _Lobj
_Ctype = _Lobj._Getctype();
}
void __CLR_OR_THIS_CALL _Tidy() noexcept { // free any allocated storage
if (0 < _Ctype._Delfl) {
_CSTD free(const_cast<short*>(_Ctype._Table));
} else if (_Ctype._Delfl < 0) {
delete[] _Ctype._Table;
}
_CSTD free(_Ctype._LocaleName);
}
virtual _Elem __CLR_OR_THIS_CALL do_tolower(_Elem _Ch) const { // convert element to lower case
return static_cast<_Elem>(_Tolower(static_cast<unsigned char>(_Ch), &_Ctype));
}
virtual const _Elem* __CLR_OR_THIS_CALL do_tolower(_Elem* _First,
const _Elem* _Last) const { // convert [_First, _Last) in place to lower case
_Adl_verify_range(_First, _Last);
for (; _First != _Last; ++_First) {
*_First = static_cast<_Elem>(_Tolower(static_cast<unsigned char>(*_First), &_Ctype));
}
return _First;
}
virtual _Elem __CLR_OR_THIS_CALL do_toupper(_Elem _Ch) const { // convert element to upper case
return static_cast<_Elem>(_Toupper(static_cast<unsigned char>(_Ch), &_Ctype));
}
virtual const _Elem* __CLR_OR_THIS_CALL do_toupper(_Elem* _First,
const _Elem* _Last) const { // convert [_First, _Last) in place to upper case
_Adl_verify_range(_First, _Last);
for (; _First != _Last; ++_First) {
*_First = static_cast<_Elem>(_Toupper(static_cast<unsigned char>(*_First), &_Ctype));
}
return _First;
}
virtual _Elem __CLR_OR_THIS_CALL do_widen(char _Byte) const { // widen char
return _Byte;
}
virtual const _Elem* __CLR_OR_THIS_CALL do_widen(
const char* _First, const char* _Last, _Elem* _Dest) const { // widen chars in [_First, _Last)
_Adl_verify_range(_First, _Last);
_CSTD memcpy(_Dest, _First, static_cast<size_t>(_Last - _First));
return _Last;
}
virtual _Elem __CLR_OR_THIS_CALL do_narrow(_Elem _Ch, char) const { // narrow char
return _Ch;
}
virtual const _Elem* __CLR_OR_THIS_CALL do_narrow(const _Elem* _First, const _Elem* _Last, char,
char* _Dest) const { // narrow elements in [_First, _Last) to chars
_Adl_verify_range(_First, _Last);
_CSTD memcpy(_Dest, _First, static_cast<size_t>(_Last - _First));
return _Last;
}
private:
_Locinfo::_Ctypevec _Ctype; // information
};
extern "C++" template <>
class _CRTIMP2_PURE_IMPORT ctype<wchar_t>
: public ctype_base { // facet for classifying wchar_t elements, converting cases
public:
using _Elem = wchar_t;
using char_type = _Elem;
bool __CLR_OR_THIS_CALL is(mask _Maskval, _Elem _Ch) const { // test if element fits any mask classifications
return do_is(_Maskval, _Ch);
}
const _Elem* __CLR_OR_THIS_CALL is(const _Elem* _First, const _Elem* _Last,
mask* _Dest) const { // get mask sequence for elements in [_First, _Last)
return do_is(_First, _Last, _Dest);
}
const _Elem* __CLR_OR_THIS_CALL scan_is(mask _Maskval, const _Elem* _First,
const _Elem* _Last) const { // find first in [_First, _Last) that fits mask classification
return do_scan_is(_Maskval, _First, _Last);
}
const _Elem* __CLR_OR_THIS_CALL scan_not(mask _Maskval, const _Elem* _First,
const _Elem* _Last) const { // find first in [_First, _Last) not fitting mask classification
return do_scan_not(_Maskval, _First, _Last);
}
_Elem __CLR_OR_THIS_CALL tolower(_Elem _Ch) const { // convert element to lower case
return do_tolower(_Ch);
}
const _Elem* __CLR_OR_THIS_CALL tolower(
_Elem* _First, const _Elem* _Last) const { // convert [_First, _Last) in place to lower case
return do_tolower(_First, _Last);
}
_Elem __CLR_OR_THIS_CALL toupper(_Elem _Ch) const { // convert element to upper case
return do_toupper(_Ch);
}
const _Elem* __CLR_OR_THIS_CALL toupper(
_Elem* _First, const _Elem* _Last) const { // convert [_First, _Last) in place to upper case
return do_toupper(_First, _Last);
}
_Elem __CLR_OR_THIS_CALL widen(char _Byte) const { // widen char
return do_widen(_Byte);
}
const char* __CLR_OR_THIS_CALL widen(const char* _First, const char* _Last,
_Elem* _Dest) const { // widen chars in [_First, _Last)
return do_widen(_First, _Last, _Dest);
}
char __CLR_OR_THIS_CALL narrow(_Elem _Ch, char _Dflt = '\0') const { // narrow element to char
return do_narrow(_Ch, _Dflt);
}
const _Elem* __CLR_OR_THIS_CALL narrow(const _Elem* _First, const _Elem* _Last, char _Dflt,
char* _Dest) const { // narrow elements in [_First, _Last) to chars
return do_narrow(_First, _Last, _Dflt, _Dest);
}
__PURE_APPDOMAIN_GLOBAL static locale::id id;
explicit __CLR_OR_THIS_CALL ctype(size_t _Refs = 0) : ctype_base(_Refs) {
_BEGIN_LOCINFO(_Lobj)
_Init(_Lobj);
_END_LOCINFO()
}
__CLR_OR_THIS_CALL ctype(const _Locinfo& _Lobj, size_t _Refs = 0) : ctype_base(_Refs) {
_Init(_Lobj);
}
static size_t __CLRCALL_OR_CDECL _Getcat(const locale::facet** _Ppf = nullptr, const locale* _Ploc = nullptr) {
if (_Ppf && !*_Ppf) {
*_Ppf = new ctype<_Elem>(_Locinfo(_Ploc->_C_str()));
}
return _X_CTYPE;
}
protected:
__CLR_OR_THIS_CALL ~ctype() noexcept override {
if (_Ctype._Delfl) {
_CSTD free(const_cast<short*>(_Ctype._Table));
}
_CSTD free(_Ctype._LocaleName);
}
void __CLR_OR_THIS_CALL _Init(const _Locinfo& _Lobj) { // initialize from _Lobj
_Ctype = _Lobj._Getctype();
_Cvt = _Lobj._Getcvt();
}
virtual bool __CLR_OR_THIS_CALL do_is(
mask _Maskval, _Elem _Ch) const { // test if element fits any mask classifications
return (_CSTD _Getwctype(_Ch, &_Ctype) & _Maskval) != 0;
}
virtual const _Elem* __CLR_OR_THIS_CALL do_is(const _Elem* _First, const _Elem* _Last,
mask* _Dest) const { // get mask sequence for elements in [_First, _Last)
_Adl_verify_range(_First, _Last);
return _CSTD _Getwctypes(_First, _Last, _Dest, &_Ctype);
}
virtual const _Elem* __CLR_OR_THIS_CALL do_scan_is(mask _Maskval, const _Elem* _First,
const _Elem* _Last) const { // find first in [_First, _Last) that fits mask classification
_Adl_verify_range(_First, _Last);
while (_First != _Last && !is(_Maskval, *_First)) {
++_First;
}
return _First;
}
virtual const _Elem* __CLR_OR_THIS_CALL do_scan_not(mask _Maskval, const _Elem* _First,
const _Elem* _Last) const { // find first in [_First, _Last) not fitting mask classification
_Adl_verify_range(_First, _Last);
while (_First != _Last && is(_Maskval, *_First)) {
++_First;
}
return _First;
}
virtual _Elem __CLR_OR_THIS_CALL do_tolower(_Elem _Ch) const { // convert element to lower case
return _Towlower(_Ch, &_Ctype);
}
virtual const _Elem* __CLR_OR_THIS_CALL do_tolower(_Elem* _First,
const _Elem* _Last) const { // convert [_First, _Last) in place to lower case
_Adl_verify_range(_First, _Last);
for (; _First != _Last; ++_First) {
*_First = _Towlower(*_First, &_Ctype);
}
return _First;
}
virtual _Elem __CLR_OR_THIS_CALL do_toupper(_Elem _Ch) const { // convert element to upper case
return _Towupper(_Ch, &_Ctype);
}
virtual const _Elem* __CLR_OR_THIS_CALL do_toupper(_Elem* _First,
const _Elem* _Last) const { // convert [_First, _Last) in place to upper case
_Adl_verify_range(_First, _Last);
for (; _First != _Last; ++_First) {
*_First = _Towupper(*_First, &_Ctype);
}
return _First;
}
_Elem __CLR_OR_THIS_CALL _Dowiden(char _Byte) const { // widen char
mbstate_t _Mbst = {};
wchar_t _Wc;
return _Mbrtowc(&_Wc, &_Byte, 1, &_Mbst, &_Cvt) < 0 ? static_cast<wchar_t>(WEOF) : _Wc;
}
virtual _Elem __CLR_OR_THIS_CALL do_widen(char _Byte) const { // widen char
return _Dowiden(_Byte);
}
virtual const char* __CLR_OR_THIS_CALL do_widen(
const char* _First, const char* _Last, _Elem* _Dest) const { // widen chars in [_First, _Last)
_Adl_verify_range(_First, _Last);
for (; _First != _Last; ++_First, ++_Dest) {
*_Dest = _Dowiden(*_First);
}
return _First;
}
char __CLR_OR_THIS_CALL _Donarrow(_Elem _Ch, char _Dflt) const { // narrow element to char
char _Buf[MB_LEN_MAX];
mbstate_t _Mbst = {};
return _Wcrtomb(_Buf, _Ch, &_Mbst, &_Cvt) != 1 ? _Dflt : _Buf[0];
}
virtual char __CLR_OR_THIS_CALL do_narrow(_Elem _Ch, char _Dflt) const { // narrow element to char
return _Donarrow(_Ch, _Dflt);
}
virtual const _Elem* __CLR_OR_THIS_CALL do_narrow(const _Elem* _First, const _Elem* _Last, char _Dflt,
char* _Dest) const { // narrow elements in [_First, _Last) to chars
_Adl_verify_range(_First, _Last);
for (; _First != _Last; ++_First, ++_Dest) {
*_Dest = _Donarrow(*_First, _Dflt);
}
return _First;
}
private:
_Locinfo::_Ctypevec _Ctype; // locale info passed to _Tolower, etc.
_Locinfo::_Cvtvec _Cvt; // conversion information
};
#if defined(_NATIVE_WCHAR_T_DEFINED) && !_ENFORCE_FACET_SPECIALIZATIONS
extern "C++" template <>
class _CRTIMP2_PURE_IMPORT ctype<unsigned short>
: public ctype_base { // facet for classifying unsigned short elements, converting cases
public:
using _Elem = unsigned short;
using char_type = _Elem;
bool __CLR_OR_THIS_CALL is(mask _Maskval, _Elem _Ch) const { // test if element fits any mask classifications
return do_is(_Maskval, _Ch);
}
const _Elem* __CLR_OR_THIS_CALL is(const _Elem* _First, const _Elem* _Last,
mask* _Dest) const { // get mask sequence for elements in [_First, _Last)
return do_is(_First, _Last, _Dest);
}
const _Elem* __CLR_OR_THIS_CALL scan_is(mask _Maskval, const _Elem* _First,
const _Elem* _Last) const { // find first in [_First, _Last) that fits mask classification
return do_scan_is(_Maskval, _First, _Last);
}
const _Elem* __CLR_OR_THIS_CALL scan_not(mask _Maskval, const _Elem* _First,
const _Elem* _Last) const { // find first in [_First, _Last) not fitting mask classification
return do_scan_not(_Maskval, _First, _Last);
}
_Elem __CLR_OR_THIS_CALL tolower(_Elem _Ch) const { // convert element to lower case
return do_tolower(_Ch);
}
const _Elem* __CLR_OR_THIS_CALL tolower(
_Elem* _First, const _Elem* _Last) const { // convert [_First, _Last) in place to lower case
return do_tolower(_First, _Last);
}
_Elem __CLR_OR_THIS_CALL toupper(_Elem _Ch) const { // convert element to upper case
return do_toupper(_Ch);
}
const _Elem* __CLR_OR_THIS_CALL toupper(
_Elem* _First, const _Elem* _Last) const { // convert [_First, _Last) in place to upper case
return do_toupper(_First, _Last);
}
_Elem __CLR_OR_THIS_CALL widen(char _Byte) const { // widen char
return do_widen(_Byte);
}
const char* __CLR_OR_THIS_CALL widen(const char* _First, const char* _Last,
_Elem* _Dest) const { // widen chars in [_First, _Last)
return do_widen(_First, _Last, _Dest);
}
char __CLR_OR_THIS_CALL narrow(_Elem _Ch, char _Dflt = '\0') const { // narrow element to char
return do_narrow(_Ch, _Dflt);
}
const _Elem* __CLR_OR_THIS_CALL narrow(const _Elem* _First, const _Elem* _Last, char _Dflt,
char* _Dest) const { // narrow elements in [_First, _Last) to chars
return do_narrow(_First, _Last, _Dflt, _Dest);
}
__PURE_APPDOMAIN_GLOBAL static locale::id id;
explicit __CLR_OR_THIS_CALL ctype(size_t _Refs = 0) : ctype_base(_Refs) {
_BEGIN_LOCINFO(_Lobj)
_Init(_Lobj);
_END_LOCINFO()
}
__CLR_OR_THIS_CALL ctype(const _Locinfo& _Lobj, size_t _Refs = 0) : ctype_base(_Refs) {
_Init(_Lobj);
}
static size_t __CLRCALL_OR_CDECL _Getcat(const locale::facet** _Ppf = nullptr, const locale* _Ploc = nullptr) {
if (_Ppf && !*_Ppf) {
*_Ppf = new ctype<_Elem>(_Locinfo(_Ploc->_C_str()));
}
return _X_CTYPE;
}
protected:
__CLR_OR_THIS_CALL ~ctype() noexcept override {
if (_Ctype._Delfl) {
_CSTD free(const_cast<short*>(_Ctype._Table));
}
_CSTD free(_Ctype._LocaleName);
}
void __CLR_OR_THIS_CALL _Init(const _Locinfo& _Lobj) { // initialize from _Lobj
_Ctype = _Lobj._Getctype();
_Cvt = _Lobj._Getcvt();
}
virtual bool __CLR_OR_THIS_CALL do_is(
mask _Maskval, _Elem _Ch) const { // test if element fits any mask classifications
return (_CSTD _Getwctype(_Ch, &_Ctype) & _Maskval) != 0;
}
virtual const _Elem* __CLR_OR_THIS_CALL do_is(const _Elem* _First, const _Elem* _Last,
mask* _Dest) const { // get mask sequence for elements in [_First, _Last)
_Adl_verify_range(_First, _Last);
return reinterpret_cast<const _Elem*>(_CSTD _Getwctypes(
reinterpret_cast<const wchar_t*>(_First), reinterpret_cast<const wchar_t*>(_Last), _Dest, &_Ctype));
}
virtual const _Elem* __CLR_OR_THIS_CALL do_scan_is(mask _Maskval, const _Elem* _First,
const _Elem* _Last) const { // find first in [_First, _Last) that fits mask classification
_Adl_verify_range(_First, _Last);
while (_First != _Last && !is(_Maskval, *_First)) {
++_First;
}
return _First;
}
virtual const _Elem* __CLR_OR_THIS_CALL do_scan_not(mask _Maskval, const _Elem* _First,
const _Elem* _Last) const { // find first in [_First, _Last) not fitting mask classification
_Adl_verify_range(_First, _Last);
while (_First != _Last && is(_Maskval, *_First)) {
++_First;
}
return _First;
}
virtual _Elem __CLR_OR_THIS_CALL do_tolower(_Elem _Ch) const { // convert element to lower case
return _Towlower(_Ch, &_Ctype);
}
virtual const _Elem* __CLR_OR_THIS_CALL do_tolower(_Elem* _First,
const _Elem* _Last) const { // convert [_First, _Last) in place to lower case
_Adl_verify_range(_First, _Last);
for (; _First != _Last; ++_First) {
*_First = _Towlower(*_First, &_Ctype);
}
return _First;
}
virtual _Elem __CLR_OR_THIS_CALL do_toupper(_Elem _Ch) const { // convert element to upper case
return _Towupper(_Ch, &_Ctype);
}
virtual const _Elem* __CLR_OR_THIS_CALL do_toupper(_Elem* _First,
const _Elem* _Last) const { // convert [_First, _Last) in place to upper case
_Adl_verify_range(_First, _Last);
for (; _First != _Last; ++_First) {
*_First = _Towupper(*_First, &_Ctype);
}
return _First;
}
_Elem __CLR_OR_THIS_CALL _Dowiden(char _Byte) const { // widen char
mbstate_t _Mbst = {};
unsigned short _Wc;
if (_Mbrtowc(reinterpret_cast<wchar_t*>(&_Wc), &_Byte, 1, &_Mbst, &_Cvt) < 0) {
return static_cast<unsigned short>(WEOF);
}
return _Wc;
}
virtual _Elem __CLR_OR_THIS_CALL do_widen(char _Byte) const { // widen char
return _Dowiden(_Byte);
}
virtual const char* __CLR_OR_THIS_CALL do_widen(
const char* _First, const char* _Last, _Elem* _Dest) const { // widen chars in [_First, _Last)
_Adl_verify_range(_First, _Last);
for (; _First != _Last; ++_First, ++_Dest) {
*_Dest = _Dowiden(*_First);
}
return _First;
}
char __CLR_OR_THIS_CALL _Donarrow(_Elem _Ch, char _Dflt) const { // narrow element to char
char _Buf[MB_LEN_MAX];
mbstate_t _Mbst = {};
return _Wcrtomb(_Buf, _Ch, &_Mbst, &_Cvt) != 1 ? _Dflt : _Buf[0];
}
virtual char __CLR_OR_THIS_CALL do_narrow(_Elem _Ch, char _Dflt) const { // narrow element to char
return _Donarrow(_Ch, _Dflt);
}
virtual const _Elem* __CLR_OR_THIS_CALL do_narrow(const _Elem* _First, const _Elem* _Last, char _Dflt,
char* _Dest) const { // narrow elements in [_First, _Last) to chars
_Adl_verify_range(_First, _Last);
for (; _First != _Last; ++_First, ++_Dest) {
*_Dest = _Donarrow(*_First, _Dflt);
}
return _First;
}
private:
_Locinfo::_Ctypevec _Ctype; // locale info passed to _Tolower, etc.
_Locinfo::_Cvtvec _Cvt; // conversion information
};
#endif // defined(_NATIVE_WCHAR_T_DEFINED) && !_ENFORCE_FACET_SPECIALIZATIONS
_EXPORT_STD template <class _Elem>
class ctype_byname : public ctype<_Elem> { // ctype for named locale
public:
static_assert(!_ENFORCE_FACET_SPECIALIZATIONS || _Is_any_of_v<_Elem, char, wchar_t>, _FACET_SPECIALIZATION_MESSAGE);
explicit __CLR_OR_THIS_CALL ctype_byname(const char* _Locname, size_t _Refs = 0)
: ctype<_Elem>(_Locinfo(_Locname), _Refs) {} // construct for named locale
explicit __CLR_OR_THIS_CALL ctype_byname(const string& _Str, size_t _Refs = 0)
: ctype<_Elem>(_Locinfo(_Str.c_str()), _Refs) {} // construct for named locale
protected:
__CLR_OR_THIS_CALL ~ctype_byname() noexcept override {}
};
enum class _Case_sensitive : bool { _Nope, _Yes };
template <class _InIt, class _Elem>
int __CRTDECL _Getloctxt(
_InIt& _First, _InIt& _Last, size_t _Numfields, const _Elem* _Ptr, const _Case_sensitive _Matching) {
// find field at _Ptr that matches longest in [_First, _Last)
for (size_t _Off = 0; _Ptr[_Off] != _Elem{}; ++_Off) {
if (_Ptr[_Off] == _Ptr[0]) {
++_Numfields; // add fields with leading mark to initial count
}
}
string _Str(_Numfields, '\0'); // one column counter for each field
const ctype<_Elem>& _CType = _STD use_facet<ctype<_Elem>>(locale{});
int _Ans = -2; // no candidates so far
for (size_t _Column = 1;; ++_Column, (void) ++_First, _Ans = -1) { // test each element against all viable fields
bool _Prefix = false; // seen at least one valid prefix
size_t _Off = 0; // offset into fields
size_t _Field = 0; // current field number
for (; _Field < _Numfields; ++_Field) { // test element at _Column in field _Field
while (_Ptr[_Off] != _Elem{} && _Ptr[_Off] != _Ptr[0]) { // find beginning of field
++_Off;
}
if (_Str[_Field] != '\0') {
_Off += _Str[_Field]; // skip tested columns in field
} else if (_Ptr[_Off += _Column] == _Ptr[0]
|| _Ptr[_Off] == _Elem{}) { // matched all of field, save as possible answer
_Str[_Field] = static_cast<char>(_Column < 127 ? _Column : 127); // save skip count if small enough
_Ans = static_cast<int>(_Field); // save answer
} else if (_First == _Last
|| (_Matching == _Case_sensitive::_Yes
? _Ptr[_Off] != *_First
: _CType.tolower(_Ptr[_Off]) != _CType.tolower(static_cast<_Elem>(*_First)))) {
_Str[_Field] = static_cast<char>(_Column < 127 ? _Column : 127); // no match, just save skip count
} else {
_Prefix = true; // still a valid prefix
}
}
if (!_Prefix || _First == _Last) {
break; // no pending prefixes or no input, give up
}
}
return _Ans; // return field number or negative value on failure
}
#if defined(_DLL_CPPLIB)
#if !defined(_CRTBLD) || defined(__FORCE_INSTANCE)
template class _CRTIMP2_PURE_IMPORT codecvt<char, char, mbstate_t>;
#endif // !defined(_CRTBLD) || defined(__FORCE_INSTANCE)
#endif // defined(_DLL_CPPLIB)
_STD_END
#pragma pop_macro("new")
_STL_RESTORE_CLANG_WARNINGS
#pragma warning(pop)
#pragma pack(pop)
#endif // _STL_COMPILER_PREPROCESSOR
#endif // _XLOCALE_