1 /* -*- Mode: C++; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4 -*- */
3 * This file is part of the LibreOffice project.
5 * This Source Code Form is subject to the terms of the Mozilla Public
6 * License, v. 2.0. If a copy of the MPL was not distributed with this
7 * file, You can obtain one at http://mozilla.org/MPL/2.0/.
9 * This file incorporates work covered by the following license notice:
11 * Licensed to the Apache Software Foundation (ASF) under one or more
12 * contributor license agreements. See the NOTICE file distributed
13 * with this work for additional information regarding copyright
14 * ownership. The ASF licenses this file to you under the Apache
15 * License, Version 2.0 (the "License"); you may not use this file
16 * except in compliance with the License. You may obtain a copy of
17 * the License at http://www.apache.org/licenses/LICENSE-2.0 .
20 #ifndef INCLUDED_OOX_TOKEN_TOKENMAP_HXX
21 #define INCLUDED_OOX_TOKEN_TOKENMAP_HXX
23 #include <sal/config.h>
25 #include <string_view>
28 #include <com/sun/star/uno/Sequence.hxx>
29 #include <oox/token/tokens.hxx>
30 #include <oox/dllapi.h>
31 #include <rtl/ustring.hxx>
32 #include <sal/log.hxx>
33 #include <sal/types.h>
44 /** Returns the token identifier for the passed Unicode token name. */
45 static sal_Int32
getTokenFromUnicode( std::u16string_view rUnicodeName
);
47 /** Returns the UTF8 name of the passed token identifier as byte sequence. */
48 css::uno::Sequence
< sal_Int8
> const &
49 getUtf8TokenName( sal_Int32 nToken
) const
51 SAL_WARN_IF(nToken
< 0 || nToken
>= XML_TOKEN_COUNT
, "oox", "Wrong nToken parameter");
52 if (0 <= nToken
&& nToken
< XML_TOKEN_COUNT
)
53 return maTokenNames
[ nToken
];
54 return EMPTY_BYTE_SEQ
;
57 /** Returns the token identifier for the passed UTF8 token name. */
58 sal_Int32
getTokenFromUtf8(
59 const css::uno::Sequence
< sal_Int8
>& rUtf8Name
) const
61 return getTokenFromUTF8( reinterpret_cast< const char * >(
62 rUtf8Name
.getConstArray() ),
63 rUtf8Name
.getLength() );
66 /** Returns the token identifier for a UTF8 string passed in pToken */
67 sal_Int32
getTokenFromUTF8( const char *pToken
, sal_Int32 nLength
) const
69 // 50% of OOXML tokens are primarily 1 lower-case character, a-z
73 if (c
>= 'a' && c
<= 'z')
74 return mnAlphaTokens
[ c
- 'a' ];
76 return getTokenPerfectHash( pToken
, nLength
);
80 static sal_Int32
getTokenPerfectHash( const char *pToken
, sal_Int32 nLength
);
81 static const css::uno::Sequence
< sal_Int8
> EMPTY_BYTE_SEQ
;
83 std::vector
< css::uno::Sequence
< sal_Int8
> >
85 sal_Int32 mnAlphaTokens
[26];
89 TokenMap
& StaticTokenMap();
95 /* vim:set shiftwidth=4 softtabstop=4 expandtab: */