// // wctomb.cpp // // Copyright (c) Microsoft Corporation. All rights reserved. // // Functions to convert a wide character to the equivalent multibyte character, // according to the LC_CTYPE category of the current locale. The return value // (or *return_value, for the _s-suffixed functions) depends on the destination // and destination_count: // * If destination == nullptr && count == 0, number of bytes needed for conversion // * If destination != nullptr: the number of bytes used for the conversion // * If destination == nullptr && count > 0, the state information // (0 for no state dependency, 1 if a state dependent encoding) // // Historically Windows has not supported state-dependent encodings for wctomb, // however UTF-8 can possible require more than one input wchar_t and maintain // state between calls. // // The return_value pointer may be null. // #include #include #include #include #include #include #include extern "C" int __cdecl _wctomb_internal( int* const return_value, char* const destination, size_t const destination_count, wchar_t const wchar, __crt_cached_ptd_host& ptd ) { // Did the caller request if this is a state dependent encoding? if (!destination && destination_count > 0) { // Indicate do not have state-dependent encodings: if (return_value != nullptr) *return_value = 0; return 0; } if (return_value) *return_value = -1; // We need to cast destination_count to int, so we make sure we are not // going to truncate destination_count: _UCRT_VALIDATE_RETURN_ERRCODE(ptd, destination_count <= INT_MAX, EINVAL); _locale_t const locale = ptd.get_locale(); if (locale->locinfo->_public._locale_lc_codepage == CP_UTF8) { // Unlike c16rtomb. wctomb/wcrtomb have no ability to process a partial code point. // So, we could call c16rtomb and check for a lone surrogate or other error, or for simplicity // We can instead just call c32rtomb and check for any error. I choose the latter. mbstate_t state{}; int result = static_cast(__crt_mbstring::__c32rtomb_utf8(destination, static_cast(wchar), &state, ptd)); if (return_value != nullptr) { *return_value = result; } if (result <= 4) { return 0; } else { return ptd.get_errno().value_or(0); } } // Check for C-locale behavior, which merely casts it to char (if in range) // for ASCII-ish behavior. if (!locale->locinfo->locale_name[LC_CTYPE]) { // See if the WCHAR is > ASCII-ish range if (wchar > 255) // Validate high byte { // Too big, can't convert, clear buffer and return error if (destination != nullptr && destination_count > 0) { memset(destination, 0, destination_count); } return ptd.get_errno().set(EILSEQ); } // ASCII-ish, just cast to a (char) if (destination != nullptr) { _UCRT_VALIDATE_RETURN_ERRCODE(ptd, destination_count > 0, ERANGE); *destination = static_cast(wchar); } if (return_value != nullptr) { // casting one WCHAR emits a single char *return_value = 1; } // We're done return 0; } else { BOOL default_used{}; int const size = __acrt_WideCharToMultiByte( locale->locinfo->_public._locale_lc_codepage, 0, &wchar, 1, destination, static_cast(destination_count), nullptr, &default_used); if (size == 0 || default_used) { if (size == 0 && GetLastError() == ERROR_INSUFFICIENT_BUFFER) { if (destination && destination_count > 0) { memset(destination, 0, destination_count); } _UCRT_VALIDATE_RETURN_ERRCODE(ptd, ("Buffer too small", 0), ERANGE); } return ptd.get_errno().set(EILSEQ); } if (return_value) { *return_value = size; } return 0; } // The last thing was an if/else, so we already returned. } extern "C" int __cdecl _wctomb_s_l( int* const return_value, char* const destination, size_t const destination_count, wchar_t const wchar, _locale_t const locale ) { __crt_cached_ptd_host ptd(locale); return _wctomb_internal(return_value, destination, destination_count, wchar, ptd); } extern "C" errno_t __cdecl wctomb_s ( int* const return_value, char* const destination, size_t const destination_count, wchar_t const wchar ) { __crt_cached_ptd_host ptd; return _wctomb_internal(return_value, destination, destination_count, wchar, ptd); } extern "C" int __cdecl _wctomb_l( char* const destination, wchar_t const wchar, _locale_t const locale ) { __crt_cached_ptd_host ptd(locale); int return_value{}; errno_t const e = _wctomb_internal( &return_value, destination, ptd.get_locale()->locinfo->_public._locale_mb_cur_max, wchar, ptd); if (e != 0) { return -1; } return return_value; } // Disable the OACR error that warns that 'MB_CUR_MAX' doesn't properly constrain buffer 'destination'. // wctomb() doesn't take a buffer size, so the function's contract is inherently dangerous. __pragma(warning(push)) __pragma(warning(disable:__WARNING_POTENTIAL_BUFFER_OVERFLOW_HIGH_PRIORITY)) // 26015 extern "C" int __cdecl wctomb( char* const destination, wchar_t const wchar ) { __crt_cached_ptd_host ptd; int return_value{}; errno_t const e = _wctomb_internal(&return_value, destination, MB_CUR_MAX, wchar, ptd); if (e != 0) { return -1; } return return_value; } __pragma(warning(pop))