1 //===----------------------------------------------------------------------===//
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
7 //===----------------------------------------------------------------------===//
9 #include <cstddef> // size_t
10 #include <cwchar> // mbstate_t
11 #include <limits.h> // MB_LEN_MAX
12 #include <string.h> // wmemcpy
14 // Returns the number of wide characters found in the multi byte sequence `src`
15 // (of `src_size_bytes`), that fit in the buffer `dst` (of `max_dest_chars`
16 // elements size). The count returned excludes the null terminator.
17 // When `dst` is NULL, no characters are copied to `dst`.
18 // Returns (size_t) -1 when an invalid sequence is encountered.
19 // Leaves *`src` pointing to the next character to convert or NULL
20 // if a null character was converted from *`src`.
21 _LIBCPP_EXPORTED_FROM_ABI
size_t mbsnrtowcs(
22 wchar_t* __restrict dst
,
23 const char** __restrict src
,
24 size_t src_size_bytes
,
25 size_t max_dest_chars
,
26 mbstate_t* __restrict ps
) {
27 const size_t terminated_sequence
= static_cast<size_t>(0);
28 const size_t invalid_sequence
= static_cast<size_t>(-1);
29 const size_t incomplete_sequence
= static_cast<size_t>(-2);
31 size_t source_converted
;
32 size_t dest_converted
;
35 // If `dst` is null then `max_dest_chars` should be ignored according to the
36 // standard. Setting `max_dest_chars` to a large value has this effect.
38 max_dest_chars
= static_cast<size_t>(-1);
40 for (dest_converted
= source_converted
= 0;
41 source_converted
< src_size_bytes
&& (!dst
|| dest_converted
< max_dest_chars
);
42 ++dest_converted
, source_converted
+= result
) {
43 // Converts one multi byte character.
44 // If result (char_size) is greater than 0, it's the size in bytes of that character.
45 // If result (char_size) is zero, it indicates that the null character has been found.
46 // Otherwise, it's an error and errno may be set.
47 size_t source_remaining
= src_size_bytes
- source_converted
;
48 size_t dest_remaining
= max_dest_chars
- dest_converted
;
51 result
= mbrtowc(nullptr, *src
+ source_converted
, source_remaining
, ps
);
52 } else if (dest_remaining
>= source_remaining
) {
53 // dst has enough space to translate in-place.
54 result
= mbrtowc(dst
+ dest_converted
, *src
+ source_converted
, source_remaining
, ps
);
57 * dst may not have enough space, so use a temporary buffer.
59 * We need to save a copy of the conversion state
60 * here so we can restore it if the multibyte
61 * character is too long for the buffer.
63 wchar_t buff
[MB_LEN_MAX
];
64 mbstate_t mbstate_tmp
;
68 result
= mbrtowc(buff
, *src
+ source_converted
, source_remaining
, ps
);
70 if (result
> dest_remaining
) {
71 // Multi-byte sequence for character won't fit.
76 // The buffer was used, so we need copy the translation to dst.
77 wmemcpy(dst
, buff
, result
);
81 // Don't do anything to change errno from here on.
82 if (result
== invalid_sequence
|| result
== terminated_sequence
|| result
== incomplete_sequence
) {
88 if (result
== terminated_sequence
)
91 *src
+= source_converted
;
93 if (result
== invalid_sequence
)
94 return invalid_sequence
;
96 return dest_converted
;