|  | // Copyright 2012 The Chromium Authors | 
|  | // Use of this source code is governed by a BSD-style license that can be | 
|  | // found in the LICENSE file. | 
|  |  | 
|  | #include "base/strings/sys_string_conversions.h" | 
|  |  | 
|  | #include <stddef.h> | 
|  | #include <string.h> | 
|  | #include <wchar.h> | 
|  |  | 
|  | #include "base/strings/string_piece.h" | 
|  | #include "base/strings/utf_string_conversions.h" | 
|  | #include "build/build_config.h" | 
|  |  | 
|  | namespace gurl_base { | 
|  |  | 
|  | std::string SysWideToUTF8(const std::wstring& wide) { | 
|  | // In theory this should be using the system-provided conversion rather | 
|  | // than our ICU, but this will do for now. | 
|  | return WideToUTF8(wide); | 
|  | } | 
|  | std::wstring SysUTF8ToWide(StringPiece utf8) { | 
|  | // In theory this should be using the system-provided conversion rather | 
|  | // than our ICU, but this will do for now. | 
|  | std::wstring out; | 
|  | UTF8ToWide(utf8.data(), utf8.size(), &out); | 
|  | return out; | 
|  | } | 
|  |  | 
|  | #if defined(SYSTEM_NATIVE_UTF8) || BUILDFLAG(IS_ANDROID) | 
|  | // TODO(port): Consider reverting the OS_ANDROID when we have wcrtomb() | 
|  | // support and a better understanding of what calls these routines. | 
|  |  | 
|  | std::string SysWideToNativeMB(const std::wstring& wide) { | 
|  | return WideToUTF8(wide); | 
|  | } | 
|  |  | 
|  | std::wstring SysNativeMBToWide(StringPiece native_mb) { | 
|  | return SysUTF8ToWide(native_mb); | 
|  | } | 
|  |  | 
|  | #else | 
|  |  | 
|  | std::string SysWideToNativeMB(const std::wstring& wide) { | 
|  | mbstate_t ps; | 
|  |  | 
|  | // Calculate the number of multi-byte characters.  We walk through the string | 
|  | // without writing the output, counting the number of multi-byte characters. | 
|  | size_t num_out_chars = 0; | 
|  | memset(&ps, 0, sizeof(ps)); | 
|  | for (auto src : wide) { | 
|  | // Use a temp buffer since calling wcrtomb with an output of NULL does not | 
|  | // calculate the output length. | 
|  | char buf[16]; | 
|  | // Skip NULLs to avoid wcrtomb's special handling of them. | 
|  | size_t res = src ? wcrtomb(buf, src, &ps) : 0; | 
|  | switch (res) { | 
|  | // Handle any errors and return an empty string. | 
|  | case static_cast<size_t>(-1): | 
|  | return std::string(); | 
|  | case 0: | 
|  | // We hit an embedded null byte, keep going. | 
|  | ++num_out_chars; | 
|  | break; | 
|  | default: | 
|  | num_out_chars += res; | 
|  | break; | 
|  | } | 
|  | } | 
|  |  | 
|  | if (num_out_chars == 0) | 
|  | return std::string(); | 
|  |  | 
|  | std::string out; | 
|  | out.resize(num_out_chars); | 
|  |  | 
|  | // We walk the input string again, with |i| tracking the index of the | 
|  | // wide input, and |j| tracking the multi-byte output. | 
|  | memset(&ps, 0, sizeof(ps)); | 
|  | for (size_t i = 0, j = 0; i < wide.size(); ++i) { | 
|  | const wchar_t src = wide[i]; | 
|  | // We don't want wcrtomb to do its funkiness for embedded NULLs. | 
|  | size_t res = src ? wcrtomb(&out[j], src, &ps) : 0; | 
|  | switch (res) { | 
|  | // Handle any errors and return an empty string. | 
|  | case static_cast<size_t>(-1): | 
|  | return std::string(); | 
|  | case 0: | 
|  | // We hit an embedded null byte, keep going. | 
|  | ++j;  // Output is already zeroed. | 
|  | break; | 
|  | default: | 
|  | j += res; | 
|  | break; | 
|  | } | 
|  | } | 
|  |  | 
|  | return out; | 
|  | } | 
|  |  | 
|  | std::wstring SysNativeMBToWide(StringPiece native_mb) { | 
|  | mbstate_t ps; | 
|  |  | 
|  | // Calculate the number of wide characters.  We walk through the string | 
|  | // without writing the output, counting the number of wide characters. | 
|  | size_t num_out_chars = 0; | 
|  | memset(&ps, 0, sizeof(ps)); | 
|  | for (size_t i = 0; i < native_mb.size(); ) { | 
|  | const char* src = native_mb.data() + i; | 
|  | size_t res = mbrtowc(nullptr, src, native_mb.size() - i, &ps); | 
|  | switch (res) { | 
|  | // Handle any errors and return an empty string. | 
|  | case static_cast<size_t>(-2): | 
|  | case static_cast<size_t>(-1): | 
|  | return std::wstring(); | 
|  | case 0: | 
|  | // We hit an embedded null byte, keep going. | 
|  | i += 1; | 
|  | [[fallthrough]]; | 
|  | default: | 
|  | i += res; | 
|  | ++num_out_chars; | 
|  | break; | 
|  | } | 
|  | } | 
|  |  | 
|  | if (num_out_chars == 0) | 
|  | return std::wstring(); | 
|  |  | 
|  | std::wstring out; | 
|  | out.resize(num_out_chars); | 
|  |  | 
|  | memset(&ps, 0, sizeof(ps));  // Clear the shift state. | 
|  | // We walk the input string again, with |i| tracking the index of the | 
|  | // multi-byte input, and |j| tracking the wide output. | 
|  | for (size_t i = 0, j = 0; i < native_mb.size(); ++j) { | 
|  | const char* src = native_mb.data() + i; | 
|  | wchar_t* dst = &out[j]; | 
|  | size_t res = mbrtowc(dst, src, native_mb.size() - i, &ps); | 
|  | switch (res) { | 
|  | // Handle any errors and return an empty string. | 
|  | case static_cast<size_t>(-2): | 
|  | case static_cast<size_t>(-1): | 
|  | return std::wstring(); | 
|  | case 0: | 
|  | i += 1;  // Skip null byte. | 
|  | break; | 
|  | default: | 
|  | i += res; | 
|  | break; | 
|  | } | 
|  | } | 
|  |  | 
|  | return out; | 
|  | } | 
|  |  | 
|  | #endif  // defined(SYSTEM_NATIVE_UTF8) || BUILDFLAG(IS_ANDROID) | 
|  |  | 
|  | }  // namespace base |