1 /* -*- Mode: C++; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4 -*- */
3 * This file is part of the LibreOffice project.
5 * This Source Code Form is subject to the terms of the Mozilla Public
6 * License, v. 2.0. If a copy of the MPL was not distributed with this
7 * file, You can obtain one at http://mozilla.org/MPL/2.0/.
9 * This file incorporates work covered by the following license notice:
11 * Licensed to the Apache Software Foundation (ASF) under one or more
12 * contributor license agreements. See the NOTICE file distributed
13 * with this work for additional information regarding copyright
14 * ownership. The ASF licenses this file to you under the Apache
15 * License, Version 2.0 (the "License"); you may not use this file
16 * except in compliance with the License. You may obtain a copy of
17 * the License at http://www.apache.org/licenses/LICENSE-2.0 .
20 #include <sal/config.h>
25 #include <rtl/character.hxx>
26 #include <rtl/textcvt.h>
27 #include <sal/types.h>
29 #include "context.hxx"
30 #include "converter.hxx"
31 #include "convertsinglebytetobmpunicode.hxx"
32 #include "unichars.hxx"
34 sal_Size
rtl_textenc_convertSingleByteToBmpUnicode(
35 void const * data
, SAL_UNUSED_PARAMETER
void *, char const * srcBuf
,
36 sal_Size srcBytes
, sal_Unicode
* destBuf
, sal_Size destChars
,
37 sal_uInt32 flags
, sal_uInt32
* info
, sal_Size
* srcCvtBytes
)
39 sal_Unicode
const * map
= static_cast<
40 rtl::textenc::BmpUnicodeToSingleByteConverterData
const * >(
42 sal_uInt32 infoFlags
= 0;
43 sal_Size converted
= 0;
44 sal_Unicode
* destBufPtr
= destBuf
;
45 sal_Unicode
* destBufEnd
= destBuf
+ destChars
;
46 for (; converted
< srcBytes
; ++converted
) {
48 sal_Unicode c
= map
[static_cast< sal_uInt8
>(b
)];
52 if (destBufEnd
- destBufPtr
< 1) {
58 switch (sal::detail::textenc::handleBadInputTextToUnicodeConversion(
59 true/*undefined*/, false, b
, flags
, &destBufPtr
, destBufEnd
,
62 case sal::detail::textenc::BAD_INPUT_STOP
:
63 if ((flags
& RTL_TEXTTOUNICODE_FLAGS_FLUSH
) == 0) {
68 case sal::detail::textenc::BAD_INPUT_CONTINUE
:
71 case sal::detail::textenc::BAD_INPUT_NO_OUTPUT
:
77 infoFlags
|= RTL_TEXTTOUNICODE_INFO_DESTBUFFERTOOSMALL
;
80 if (info
!= nullptr) {
83 if (srcCvtBytes
!= nullptr) {
84 *srcCvtBytes
= converted
;
86 return destBufPtr
- destBuf
;
89 sal_Size
rtl_textenc_convertBmpUnicodeToSingleByte(
90 void const * data
, void * context
,
91 sal_Unicode
const * srcBuf
, sal_Size srcChars
, char * destBuf
,
92 sal_Size destBytes
, sal_uInt32 flags
, sal_uInt32
* info
,
93 sal_Size
* srcCvtChars
)
95 std::size_t entries
= static_cast<
96 rtl::textenc::BmpUnicodeToSingleByteConverterData
const * >(
97 data
)->unicodeToByteEntries
;
98 rtl::textenc::BmpUnicodeToSingleByteRange
const * ranges
= static_cast<
99 rtl::textenc::BmpUnicodeToSingleByteConverterData
const * >(
100 data
)->unicodeToByte
;
101 sal_Unicode highSurrogate
= 0;
102 sal_uInt32 infoFlags
= 0;
103 sal_Size converted
= 0;
104 char * destBufPtr
= destBuf
;
105 char * destBufEnd
= destBuf
+ destBytes
;
106 if (context
!= nullptr) {
107 highSurrogate
= static_cast< ImplUnicodeToTextContext
* >(context
)->
110 for (; converted
< srcChars
; ++converted
) {
111 bool undefined
= true;
112 sal_uInt32 c
= *srcBuf
++;
113 if (highSurrogate
== 0) {
114 if (rtl::isHighSurrogate(c
)) {
115 highSurrogate
= static_cast< sal_Unicode
>(c
);
118 else if (rtl::isLowSurrogate(c
))
123 } else if (rtl::isLowSurrogate(c
)) {
124 c
= rtl::combineSurrogates(highSurrogate
, c
);
129 assert(rtl::isUnicodeScalarValue(c
));
130 // Linearly searching through the ranges if probably fastest, assuming
131 // that most converted characters belong to the ASCII subset:
132 for (std::size_t i
= 0; i
< entries
; ++i
) {
133 if (c
< ranges
[i
].unicode
) {
136 if (c
<= sal::static_int_cast
< sal_uInt32
>(
137 ranges
[i
].unicode
+ ranges
[i
].range
))
139 if (destBufEnd
- destBufPtr
< 1) {
142 *destBufPtr
++ = static_cast< char >(
143 ranges
[i
].byte
+ (c
- ranges
[i
].unicode
));
152 switch (sal::detail::textenc::handleBadInputUnicodeToTextConversion(
153 undefined
, c
, flags
, &destBufPtr
, destBufEnd
, &infoFlags
, nullptr,
156 case sal::detail::textenc::BAD_INPUT_STOP
:
160 case sal::detail::textenc::BAD_INPUT_CONTINUE
:
164 case sal::detail::textenc::BAD_INPUT_NO_OUTPUT
:
170 infoFlags
|= RTL_UNICODETOTEXT_INFO_DESTBUFFERTOSMALL
;
173 if (highSurrogate
!= 0
175 & (RTL_UNICODETOTEXT_INFO_ERROR
176 | RTL_UNICODETOTEXT_INFO_DESTBUFFERTOSMALL
))
179 if ((flags
& RTL_UNICODETOTEXT_FLAGS_FLUSH
) != 0) {
180 infoFlags
|= RTL_UNICODETOTEXT_INFO_SRCBUFFERTOSMALL
;
182 switch (sal::detail::textenc::handleBadInputUnicodeToTextConversion(
183 false, 0, flags
, &destBufPtr
, destBufEnd
, &infoFlags
, nullptr,
186 case sal::detail::textenc::BAD_INPUT_STOP
:
187 case sal::detail::textenc::BAD_INPUT_CONTINUE
:
191 case sal::detail::textenc::BAD_INPUT_NO_OUTPUT
:
192 infoFlags
|= RTL_UNICODETOTEXT_INFO_DESTBUFFERTOSMALL
;
197 if (context
!= nullptr) {
198 static_cast< ImplUnicodeToTextContext
* >(context
)->m_nHighSurrogate
201 if (info
!= nullptr) {
204 if (srcCvtChars
!= nullptr) {
205 *srcCvtChars
= converted
;
207 return destBufPtr
- destBuf
;
210 /* vim:set shiftwidth=4 softtabstop=4 expandtab: */