// Copyright (c) 2012 The Chromium Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
|
|
|
|
#include "base/strings/sys_string_conversions.h"
|
|
|
|
#include <stddef.h>
|
|
#include <wchar.h>
|
|
|
|
#include "base/strings/string_piece.h"
|
|
#include "base/strings/utf_string_conversions.h"
|
|
#include "build/build_config.h"
|
|
|
|
namespace base {
|
|
|
|
std::string SysWideToUTF8(const std::wstring& wide) {
|
|
// In theory this should be using the system-provided conversion rather
|
|
// than our ICU, but this will do for now.
|
|
return WideToUTF8(wide);
|
|
}
|
|
// Returns |utf8| converted to a wide string. The bytes and length of |utf8|
// are passed to UTF8ToWide(), which fills in the result.
//
// NOTE: Ideally the system-provided conversion would be used here instead of
// our ICU-based one; the current approach is considered good enough for now.
std::wstring SysUTF8ToWide(StringPiece utf8) {
  std::wstring wide;
  UTF8ToWide(utf8.data(), utf8.size(), &wide);
  return wide;
}
|
|
|
|
#if defined(SYSTEM_NATIVE_UTF8) || defined(OS_ANDROID)
|
|
// TODO(port): Consider dropping the OS_ANDROID special case once wcrtomb() is
// supported there and we better understand what calls these routines.
|
|
|
|
std::string SysWideToNativeMB(const std::wstring& wide) {
|
|
return WideToUTF8(wide);
|
|
}
|
|
|
|
// In this build configuration the native multi-byte encoding is treated as
// UTF-8, so the conversion is forwarded to SysUTF8ToWide().
std::wstring SysNativeMBToWide(StringPiece native_mb) {
  std::wstring wide = SysUTF8ToWide(native_mb);
  return wide;
}
|
|
|
|
#else
|
|
|
|
// Converts |wide| to the multi-byte encoding of the current C locale using
// wcrtomb().
//
// Embedded NUL wide characters are preserved: each one becomes a single '\0'
// byte in the output. If any character cannot be converted (wcrtomb() reports
// an error), the whole conversion is abandoned and an empty string is
// returned. An empty input yields an empty string.
std::string SysWideToNativeMB(const std::wstring& wide) {
  // A zero-initialized mbstate_t describes the initial conversion state.
  mbstate_t state = {};

  std::string out;
  out.reserve(wide.size());  // Lower bound: every wide char emits >= 1 byte.

  for (const wchar_t wc : wide) {
    // Scratch space for the bytes of one converted character.
    // NOTE(review): assumes MB_CUR_MAX never exceeds 16 -- confirm for
    // unusual platforms.
    char buf[16];

    // NULs are not passed to wcrtomb(), which handles them specially; they
    // are emitted by hand below instead.
    const size_t len = wc ? wcrtomb(buf, wc, &state) : 0;

    // Any conversion error makes the whole result an empty string.
    if (len == static_cast<size_t>(-1))
      return std::string();

    if (len == 0) {
      // Embedded NUL: emit a single zero byte and keep going.
      out.push_back('\0');
    } else {
      out.append(buf, len);
    }
  }

  return out;
}
|
|
|
|
// Converts |native_mb|, interpreted in the multi-byte encoding of the current
// C locale, to a wide string using mbrtowc().
//
// Embedded NUL bytes are preserved: each one becomes a single L'\0' in the
// output and consumes exactly one input byte. If mbrtowc() reports an invalid
// sequence (-1) or an incomplete trailing sequence (-2), the whole conversion
// is abandoned and an empty string is returned. An empty input yields an
// empty string.
std::wstring SysNativeMBToWide(StringPiece native_mb) {
  // A zero-initialized mbstate_t describes the initial conversion state.
  mbstate_t state = {};

  const char* const data = native_mb.data();
  const size_t size = native_mb.size();

  std::wstring out;
  size_t pos = 0;  // Index of the next unconsumed input byte.
  while (pos < size) {
    wchar_t wc = L'\0';
    const size_t consumed = mbrtowc(&wc, data + pos, size - pos, &state);

    // Invalid or truncated input makes the whole result an empty string.
    if (consumed == static_cast<size_t>(-1) ||
        consumed == static_cast<size_t>(-2)) {
      return std::wstring();
    }

    out.push_back(wc);

    // mbrtowc() returns 0 when it decodes a NUL; step over that one byte by
    // hand so the loop makes progress.
    pos += consumed ? consumed : 1;
  }

  return out;
}
|
|
|
|
#endif // defined(SYSTEM_NATIVE_UTF8) || defined(OS_ANDROID)
|
|
|
|
} // namespace base
|