aboutsummaryrefslogtreecommitdiff
path: root/libstdc++-v3/src
diff options
context:
space:
mode:
author: Jonathan Wakely <jwakely@redhat.com> 2017-03-16 15:27:45 +0000
committer: Jonathan Wakely <redi@gcc.gnu.org> 2017-03-16 15:27:45 +0000
commit: 02e12bda2df86491a5d9c7294550fd4cd4968aa1 (patch)
tree: 33f94cc1c2cd76b91fa4b4764e91ca08e07ae7f2 /libstdc++-v3/src
parent: 8d85abab445d4f458826f4ef3acbc83091257c8b (diff)
download: gcc-02e12bda2df86491a5d9c7294550fd4cd4968aa1.zip
gcc-02e12bda2df86491a5d9c7294550fd4cd4968aa1.tar.gz
gcc-02e12bda2df86491a5d9c7294550fd4cd4968aa1.tar.bz2
PR libstdc++/79511 fix endianness of UTF-16 data
PR libstdc++/79511
* src/c++11/codecvt.cc (write_utf16_code_point): Don't write 0xffff
as a surrogate pair.
(__codecvt_utf8_utf16_base<char32_t>::do_in): Use native endianness
for internal representation.
(__codecvt_utf8_utf16_base<wchar_t>::do_in): Likewise.
* testsuite/22_locale/codecvt/codecvt_utf8_utf16/79511.cc: New test.

From-SVN: r246199
Diffstat (limited to 'libstdc++-v3/src')
-rw-r--r-- libstdc++-v3/src/c++11/codecvt.cc 14
1 file changed, 11 insertions, 3 deletions
diff --git a/libstdc++-v3/src/c++11/codecvt.cc b/libstdc++-v3/src/c++11/codecvt.cc
index 12a4d4f..9b63e2b 100644
--- a/libstdc++-v3/src/c++11/codecvt.cc
+++ b/libstdc++-v3/src/c++11/codecvt.cc
@@ -315,7 +315,7 @@ namespace
{
static_assert(sizeof(C) >= 2, "a code unit must be at least 16-bit");
- if (codepoint < max_single_utf16_unit)
+ if (codepoint <= max_single_utf16_unit)
{
if (to.size() > 0)
{
@@ -1341,7 +1341,11 @@ do_in(state_type&, const extern_type* __from, const extern_type* __from_end,
{
range<const char> from{ __from, __from_end };
range<char32_t> to{ __to, __to_end };
- auto res = utf16_in(from, to, _M_maxcode, _M_mode);
+ codecvt_mode mode = codecvt_mode(_M_mode & (consume_header|generate_header));
+#if __BYTE_ORDER__ != __ORDER_BIG_ENDIAN__
+ mode = codecvt_mode(mode | little_endian);
+#endif
+ auto res = utf16_in(from, to, _M_maxcode, mode);
__from_next = from.next;
__to_next = to.next;
return res;
@@ -1411,7 +1415,11 @@ do_in(state_type&, const extern_type* __from, const extern_type* __from_end,
{
range<const char> from{ __from, __from_end };
range<wchar_t> to{ __to, __to_end };
- auto res = utf16_in(from, to, _M_maxcode, _M_mode);
+ codecvt_mode mode = codecvt_mode(_M_mode & (consume_header|generate_header));
+#if __BYTE_ORDER__ != __ORDER_BIG_ENDIAN__
+ mode = codecvt_mode(mode | little_endian);
+#endif
+ auto res = utf16_in(from, to, _M_maxcode, mode);
__from_next = from.next;
__to_next = to.next;
return res;