LibreOffice Module oox (master)  1
tokenmap.hxx
Go to the documentation of this file.
1 /* -*- Mode: C++; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4 -*- */
2 /*
3  * This file is part of the LibreOffice project.
4  *
5  * This Source Code Form is subject to the terms of the Mozilla Public
6  * License, v. 2.0. If a copy of the MPL was not distributed with this
7  * file, You can obtain one at http://mozilla.org/MPL/2.0/.
8  *
9  * This file incorporates work covered by the following license notice:
10  *
11  * Licensed to the Apache Software Foundation (ASF) under one or more
12  * contributor license agreements. See the NOTICE file distributed
13  * with this work for additional information regarding copyright
14  * ownership. The ASF licenses this file to you under the Apache
15  * License, Version 2.0 (the "License"); you may not use this file
16  * except in compliance with the License. You may obtain a copy of
17  * the License at http://www.apache.org/licenses/LICENSE-2.0 .
18  */
19 
20 #ifndef INCLUDED_OOX_TOKEN_TOKENMAP_HXX
21 #define INCLUDED_OOX_TOKEN_TOKENMAP_HXX
22 
23 #include <sal/config.h>
24 
25 #include <string_view>
26 #include <vector>
27 
28 #include <com/sun/star/uno/Sequence.hxx>
29 #include <oox/token/tokens.hxx>
30 #include <oox/dllapi.h>
31 #include <rtl/instance.hxx>
32 #include <rtl/ustring.hxx>
33 #include <sal/log.hxx>
34 #include <sal/types.h>
35 
36 namespace oox {
37 
38 
39 class TokenMap
40 {
41 public:
42  explicit TokenMap();
43  ~TokenMap();
44 
46  static sal_Int32 getTokenFromUnicode( std::u16string_view rUnicodeName );
47 
49  css::uno::Sequence< sal_Int8 > const &
50  getUtf8TokenName( sal_Int32 nToken ) const
51  {
52  SAL_WARN_IF(nToken < 0 || nToken >= XML_TOKEN_COUNT, "oox", "Wrong nToken parameter");
53  if (0 <= nToken && nToken < XML_TOKEN_COUNT)
54  return maTokenNames[ nToken ];
55  return EMPTY_BYTE_SEQ;
56  }
57 
59  sal_Int32 getTokenFromUtf8(
60  const css::uno::Sequence< sal_Int8 >& rUtf8Name ) const
61  {
62  return getTokenFromUTF8( reinterpret_cast< const char * >(
63  rUtf8Name.getConstArray() ),
64  rUtf8Name.getLength() );
65  }
66 
68  sal_Int32 getTokenFromUTF8( const char *pToken, sal_Int32 nLength ) const
69  {
70  // 50% of OOXML tokens are primarily 1 lower-case character, a-z
71  if( nLength == 1)
72  {
73  char c = pToken[0];
74  if (c >= 'a' && c <= 'z')
75  return mnAlphaTokens[ c - 'a' ];
76  }
77  return getTokenPerfectHash( pToken, nLength );
78  }
79 
80 private:
81  static sal_Int32 getTokenPerfectHash( const char *pToken, sal_Int32 nLength );
82  static const css::uno::Sequence< sal_Int8 > EMPTY_BYTE_SEQ;
83 
84  std::vector< css::uno::Sequence< sal_Int8 > >
86  sal_Int32 mnAlphaTokens[26];
87 };
88 
89 
90 struct StaticTokenMap : public ::rtl::Static< TokenMap, StaticTokenMap > {};
91 
92 
93 } // namespace oox
94 
95 #endif
96 
97 /* vim:set shiftwidth=4 softtabstop=4 expandtab: */
sal_Int32 getTokenFromUtf8(const css::uno::Sequence< sal_Int8 > &rUtf8Name) const
Returns the token identifier for the passed UTF8 token name.
Definition: tokenmap.hxx:59
sal_Int32 getTokenFromUTF8(const char *pToken, sal_Int32 nLength) const
Returns the token identifier for a UTF8 string passed in pToken.
Definition: tokenmap.hxx:68
static sal_Int32 getTokenFromUnicode(std::u16string_view rUnicodeName)
Returns the token identifier for the passed Unicode token name.
Definition: tokenmap.cxx:77
sal_Int32 mnAlphaTokens[26]
Definition: tokenmap.hxx:86
static sal_Int32 getTokenPerfectHash(const char *pToken, sal_Int32 nLength)
Definition: tokenmap.cxx:84
css::uno::Sequence< sal_Int8 > const & getUtf8TokenName(sal_Int32 nToken) const
Returns the UTF8 name of the passed token identifier as byte sequence.
Definition: tokenmap.hxx:50
static const css::uno::Sequence< sal_Int8 > EMPTY_BYTE_SEQ
Definition: tokenmap.hxx:82
std::vector< css::uno::Sequence< sal_Int8 > > maTokenNames
Definition: tokenmap.hxx:85
#define SAL_WARN_IF(condition, area, stream)