diff options
Diffstat (limited to 'wcsmbs/mbsnrtowcs.c')
-rw-r--r-- | wcsmbs/mbsnrtowcs.c | 112 |
1 files changed, 68 insertions, 44 deletions
diff --git a/wcsmbs/mbsnrtowcs.c b/wcsmbs/mbsnrtowcs.c index bb79a30..db67d5c 100644 --- a/wcsmbs/mbsnrtowcs.c +++ b/wcsmbs/mbsnrtowcs.c @@ -43,10 +43,16 @@ __mbsnrtowcs (dst, src, nmc, len, ps) size_t written = 0; const char *run = *src; const char *last = run + nmc; + wchar_t value; + size_t count; if (ps == NULL) ps = &internal; + /* Get information from last use of this state. */ + count = ps->count; + value = ps->value; + if (dst == NULL) /* The LEN parameter has to be ignored if we don't actually write anything. */ @@ -55,57 +61,66 @@ __mbsnrtowcs (dst, src, nmc, len, ps) /* Copy all words. */ while (written < len && run < last) { - wchar_t value; - size_t count; - unsigned char byte = *run++; + unsigned char byte; - /* We expect a start of a new multibyte character. */ - if (byte < 0x80) - { - /* One byte sequence. */ - count = 0; - value = byte; - } - else if ((byte & 0xe0) == 0xc0) - { - count = 1; - value = byte & 0x1f; - } - else if ((byte & 0xf0) == 0xe0) - { - /* We expect three bytes. */ - count = 2; - value = byte & 0x0f; - } - else if ((byte & 0xf8) == 0xf0) - { - /* We expect four bytes. */ - count = 3; - value = byte & 0x07; - } - else if ((byte & 0xfc) == 0xf8) - { - /* We expect five bytes. */ - count = 4; - value = byte & 0x03; - } - else if ((byte & 0xfe) == 0xfc) - { - /* We expect six bytes. */ - count = 5; - value = byte & 0x01; - } - else + /* Store address of next byte to process. */ + *src = run; + + /* Start reading a new character only if we are in the initial + state. */ + if (count == 0) { - /* This is an illegal encoding. */ - __set_errno (EILSEQ); - return (size_t) -1; + byte = *run++; + + /* We expect a start of a new multibyte character. */ + if (byte < 0x80) + { + /* One byte sequence. */ + count = 0; + value = byte; + } + else if ((byte & 0xe0) == 0xc0) + { + count = 1; + value = byte & 0x1f; + } + else if ((byte & 0xf0) == 0xe0) + { + /* We expect three bytes. */ + count = 2; + value = byte & 0x0f; + } + else if ((byte & 0xf8) == 0xf0) + { + /* We expect four bytes. */ + count = 3; + value = byte & 0x07; + } + else if ((byte & 0xfc) == 0xf8) + { + /* We expect five bytes. */ + count = 4; + value = byte & 0x03; + } + else if ((byte & 0xfe) == 0xfc) + { + /* We expect six bytes. */ + count = 5; + value = byte & 0x01; + } + else + { + /* This is an illegal encoding. */ + __set_errno (EILSEQ); + return (size_t) -1; + } } /* Read the possible remaining bytes. */ - while (count-- > 0) + while (run < last && count > 0) { byte = *run++; + --count; if ((byte & 0xc0) != 0x80) { @@ -118,6 +133,14 @@ __mbsnrtowcs (dst, src, nmc, len, ps) value |= byte & 0x3f; } + /* If this character is only partially available remember this. */ + if (run == last && count != 0) + { + ps->count = count; + ps->value = value; + break; + } + /* Store value is required. */ if (dst != NULL) *dst++ = value; @@ -128,6 +151,7 @@ __mbsnrtowcs (dst, src, nmc, len, ps) { /* Found the end of the string. */ *src = NULL; + ps->count = 0; return written; } |