LibreOffice Module oox (master)  1
tokenmap.hxx
Go to the documentation of this file.
1 /* -*- Mode: C++; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4 -*- */
2 /*
3  * This file is part of the LibreOffice project.
4  *
5  * This Source Code Form is subject to the terms of the Mozilla Public
6  * License, v. 2.0. If a copy of the MPL was not distributed with this
7  * file, You can obtain one at http://mozilla.org/MPL/2.0/.
8  *
9  * This file incorporates work covered by the following license notice:
10  *
11  * Licensed to the Apache Software Foundation (ASF) under one or more
12  * contributor license agreements. See the NOTICE file distributed
13  * with this work for additional information regarding copyright
14  * ownership. The ASF licenses this file to you under the Apache
15  * License, Version 2.0 (the "License"); you may not use this file
16  * except in compliance with the License. You may obtain a copy of
17  * the License at http://www.apache.org/licenses/LICENSE-2.0 .
18  */
19 
20 #ifndef INCLUDED_OOX_TOKEN_TOKENMAP_HXX
21 #define INCLUDED_OOX_TOKEN_TOKENMAP_HXX
22 
23 #include <sal/config.h>
24 
25 #include <string_view>
26 #include <vector>
27 
28 #include <com/sun/star/uno/Sequence.hxx>
29 #include <oox/token/tokens.hxx>
30 #include <oox/dllapi.h>
31 #include <rtl/ustring.hxx>
32 #include <sal/log.hxx>
33 #include <sal/types.h>
34 
35 namespace oox {
36 
37 
38 class TokenMap
39 {
40 public:
41  explicit TokenMap();
42  ~TokenMap();
43 
45  static sal_Int32 getTokenFromUnicode( std::u16string_view rUnicodeName );
46 
48  css::uno::Sequence< sal_Int8 > const &
49  getUtf8TokenName( sal_Int32 nToken ) const
50  {
51  SAL_WARN_IF(nToken < 0 || nToken >= XML_TOKEN_COUNT, "oox", "Wrong nToken parameter");
52  if (0 <= nToken && nToken < XML_TOKEN_COUNT)
53  return maTokenNames[ nToken ];
54  return EMPTY_BYTE_SEQ;
55  }
56 
58  sal_Int32 getTokenFromUtf8(
59  const css::uno::Sequence< sal_Int8 >& rUtf8Name ) const
60  {
61  return getTokenFromUTF8( reinterpret_cast< const char * >(
62  rUtf8Name.getConstArray() ),
63  rUtf8Name.getLength() );
64  }
65 
67  sal_Int32 getTokenFromUTF8( const char *pToken, sal_Int32 nLength ) const
68  {
69  // 50% of OOXML tokens are primarily 1 lower-case character, a-z
70  if( nLength == 1)
71  {
72  char c = pToken[0];
73  if (c >= 'a' && c <= 'z')
74  return mnAlphaTokens[ c - 'a' ];
75  }
76  return getTokenPerfectHash( pToken, nLength );
77  }
78 
79 private:
80  static sal_Int32 getTokenPerfectHash( const char *pToken, sal_Int32 nLength );
81  static const css::uno::Sequence< sal_Int8 > EMPTY_BYTE_SEQ;
82 
83  std::vector< css::uno::Sequence< sal_Int8 > >
85  sal_Int32 mnAlphaTokens[26];
86 };
87 
88 
90 
91 } // namespace oox
92 
93 #endif
94 
95 /* vim:set shiftwidth=4 softtabstop=4 expandtab: */
TokenMap & StaticTokenMap()
Definition: tokenmap.cxx:90
sal_Int32 getTokenFromUtf8(const css::uno::Sequence< sal_Int8 > &rUtf8Name) const
Returns the token identifier for the passed UTF8 token name.
Definition: tokenmap.hxx:58
sal_Int32 getTokenFromUTF8(const char *pToken, sal_Int32 nLength) const
Returns the token identifier for a UTF8 string passed in pToken.
Definition: tokenmap.hxx:67
static sal_Int32 getTokenFromUnicode(std::u16string_view rUnicodeName)
Returns the token identifier for the passed Unicode token name.
Definition: tokenmap.cxx:77
sal_Int32 mnAlphaTokens[26]
Definition: tokenmap.hxx:85
static sal_Int32 getTokenPerfectHash(const char *pToken, sal_Int32 nLength)
Definition: tokenmap.cxx:84
css::uno::Sequence< sal_Int8 > const & getUtf8TokenName(sal_Int32 nToken) const
Returns the UTF8 name of the passed token identifier as byte sequence.
Definition: tokenmap.hxx:49
static const css::uno::Sequence< sal_Int8 > EMPTY_BYTE_SEQ
Definition: tokenmap.hxx:81
std::vector< css::uno::Sequence< sal_Int8 > > maTokenNames
Definition: tokenmap.hxx:84
#define SAL_WARN_IF(condition, area, stream)