LibreOffice Module oox (master) 1
tokenmap.hxx
Go to the documentation of this file.
1/* -*- Mode: C++; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4 -*- */
2/*
3 * This file is part of the LibreOffice project.
4 *
5 * This Source Code Form is subject to the terms of the Mozilla Public
6 * License, v. 2.0. If a copy of the MPL was not distributed with this
7 * file, You can obtain one at http://mozilla.org/MPL/2.0/.
8 *
9 * This file incorporates work covered by the following license notice:
10 *
11 * Licensed to the Apache Software Foundation (ASF) under one or more
12 * contributor license agreements. See the NOTICE file distributed
13 * with this work for additional information regarding copyright
14 * ownership. The ASF licenses this file to you under the Apache
15 * License, Version 2.0 (the "License"); you may not use this file
16 * except in compliance with the License. You may obtain a copy of
17 * the License at http://www.apache.org/licenses/LICENSE-2.0 .
18 */
19
20#ifndef INCLUDED_OOX_TOKEN_TOKENMAP_HXX
21#define INCLUDED_OOX_TOKEN_TOKENMAP_HXX
22
23#include <sal/config.h>
24
25#include <string_view>
26#include <vector>
27
28#include <com/sun/star/uno/Sequence.hxx>
29#include <oox/token/tokens.hxx>
30#include <oox/dllapi.h>
31#include <rtl/ustring.hxx>
32#include <sal/log.hxx>
33#include <sal/types.h>
34
35namespace oox {
36
37
39{
40public:
41 explicit TokenMap();
42 ~TokenMap();
43
45 static sal_Int32 getTokenFromUnicode( std::u16string_view rUnicodeName );
46
48 css::uno::Sequence< sal_Int8 > const &
49 getUtf8TokenName( sal_Int32 nToken ) const
50 {
51 SAL_WARN_IF(nToken < 0 || nToken >= XML_TOKEN_COUNT, "oox", "Wrong nToken parameter");
52 if (0 <= nToken && nToken < XML_TOKEN_COUNT)
53 return maTokenNames[ nToken ];
54 return EMPTY_BYTE_SEQ;
55 }
56
59 const css::uno::Sequence< sal_Int8 >& rUtf8Name ) const
60 {
61 return getTokenFromUTF8( reinterpret_cast< const char * >(
62 rUtf8Name.getConstArray() ),
63 rUtf8Name.getLength() );
64 }
65
67 sal_Int32 getTokenFromUTF8( const char *pToken, sal_Int32 nLength ) const
68 {
69 // 50% of OOXML tokens are primarily 1 lower-case character, a-z
70 if( nLength == 1)
71 {
72 char c = pToken[0];
73 if (c >= 'a' && c <= 'z')
74 return mnAlphaTokens[ c - 'a' ];
75 }
76 return getTokenPerfectHash( pToken, nLength );
77 }
78
79private:
80 static sal_Int32 getTokenPerfectHash( const char *pToken, sal_Int32 nLength );
81 static const css::uno::Sequence< sal_Int8 > EMPTY_BYTE_SEQ;
82
83 std::vector< css::uno::Sequence< sal_Int8 > >
85 sal_Int32 mnAlphaTokens[26];
86};
87
88
90
91} // namespace oox
92
93#endif
94
95/* vim:set shiftwidth=4 softtabstop=4 expandtab: */
css::uno::Sequence< sal_Int8 > const & getUtf8TokenName(sal_Int32 nToken) const
Returns the UTF8 name of the passed token identifier as byte sequence.
Definition: tokenmap.hxx:49
sal_Int32 getTokenFromUtf8(const css::uno::Sequence< sal_Int8 > &rUtf8Name) const
Returns the token identifier for the passed UTF8 token name.
Definition: tokenmap.hxx:58
std::vector< css::uno::Sequence< sal_Int8 > > maTokenNames
Definition: tokenmap.hxx:84
static sal_Int32 getTokenFromUnicode(std::u16string_view rUnicodeName)
Returns the token identifier for the passed Unicode token name.
Definition: tokenmap.cxx:77
sal_Int32 getTokenFromUTF8(const char *pToken, sal_Int32 nLength) const
Returns the token identifier for a UTF8 string passed in pToken.
Definition: tokenmap.hxx:67
sal_Int32 mnAlphaTokens[26]
Definition: tokenmap.hxx:85
static sal_Int32 getTokenPerfectHash(const char *pToken, sal_Int32 nLength)
Definition: tokenmap.cxx:84
static const css::uno::Sequence< sal_Int8 > EMPTY_BYTE_SEQ
Definition: tokenmap.hxx:81
#define SAL_WARN_IF(condition, area, stream)
TokenMap & StaticTokenMap()
Definition: tokenmap.cxx:90
DefTokenId nToken
sal_Int32 nLength