LibreOffice Module i18npool (master)  1
ignoreIterationMark_ja_JP.cxx
Go to the documentation of this file.
1 /* -*- Mode: C++; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4 -*- */
2 /*
3  * This file is part of the LibreOffice project.
4  *
5  * This Source Code Form is subject to the terms of the Mozilla Public
6  * License, v. 2.0. If a copy of the MPL was not distributed with this
7  * file, You can obtain one at http://mozilla.org/MPL/2.0/.
8  *
9  * This file incorporates work covered by the following license notice:
10  *
11  * Licensed to the Apache Software Foundation (ASF) under one or more
12  * contributor license agreements. See the NOTICE file distributed
13  * with this work for additional information regarding copyright
14  * ownership. The ASF licenses this file to you under the Apache
15  * License, Version 2.0 (the "License"); you may not use this file
16  * except in compliance with the License. You may obtain a copy of
17  * the License at http://www.apache.org/licenses/LICENSE-2.0 .
18  */
19 
21 
23 
24 #include <numeric>
25 
26 using namespace com::sun::star::uno;
27 using namespace com::sun::star::lang;
28 
29 
30 namespace i18npool {
31 
33  { 0x3046, 0x3094 }, // HIRAGANA LETTER U --> HIRAGANA LETTER VU
34  { 0x304B, 0x304C }, // HIRAGANA LETTER KA --> HIRAGANA LETTER GA
35  { 0x304D, 0x304E }, // HIRAGANA LETTER KI --> HIRAGANA LETTER GI
36  { 0x304F, 0x3050 }, // HIRAGANA LETTER KU --> HIRAGANA LETTER GU
37  { 0x3051, 0x3052 }, // HIRAGANA LETTER KE --> HIRAGANA LETTER GE
38  { 0x3053, 0x3054 }, // HIRAGANA LETTER KO --> HIRAGANA LETTER GO
39  { 0x3055, 0x3056 }, // HIRAGANA LETTER SA --> HIRAGANA LETTER ZA
40  { 0x3057, 0x3058 }, // HIRAGANA LETTER SI --> HIRAGANA LETTER ZI
41  { 0x3059, 0x305A }, // HIRAGANA LETTER SU --> HIRAGANA LETTER ZU
42  { 0x305B, 0x305C }, // HIRAGANA LETTER SE --> HIRAGANA LETTER ZE
43  { 0x305D, 0x305E }, // HIRAGANA LETTER SO --> HIRAGANA LETTER ZO
44  { 0x305F, 0x3060 }, // HIRAGANA LETTER TA --> HIRAGANA LETTER DA
45  { 0x3061, 0x3062 }, // HIRAGANA LETTER TI --> HIRAGANA LETTER DI
46  { 0x3064, 0x3065 }, // HIRAGANA LETTER TU --> HIRAGANA LETTER DU
47  { 0x3066, 0x3067 }, // HIRAGANA LETTER TE --> HIRAGANA LETTER DE
48  { 0x3068, 0x3069 }, // HIRAGANA LETTER TO --> HIRAGANA LETTER DO
49  { 0x306F, 0x3070 }, // HIRAGANA LETTER HA --> HIRAGANA LETTER BA
50  { 0x3072, 0x3073 }, // HIRAGANA LETTER HI --> HIRAGANA LETTER BI
51  { 0x3075, 0x3076 }, // HIRAGANA LETTER HU --> HIRAGANA LETTER BU
52  { 0x3078, 0x3079 }, // HIRAGANA LETTER HE --> HIRAGANA LETTER BE
53  { 0x307B, 0x307C }, // HIRAGANA LETTER HO --> HIRAGANA LETTER BO
54  { 0x309D, 0x309E }, // HIRAGANA ITERATION MARK --> HIRAGANA VOICED ITERATION MARK
55  { 0x30A6, 0x30F4 }, // KATAKANA LETTER U --> KATAKANA LETTER VU
56  { 0x30AB, 0x30AC }, // KATAKANA LETTER KA --> KATAKANA LETTER GA
57  { 0x30AD, 0x30AE }, // KATAKANA LETTER KI --> KATAKANA LETTER GI
58  { 0x30AF, 0x30B0 }, // KATAKANA LETTER KU --> KATAKANA LETTER GU
59  { 0x30B1, 0x30B2 }, // KATAKANA LETTER KE --> KATAKANA LETTER GE
60  { 0x30B3, 0x30B4 }, // KATAKANA LETTER KO --> KATAKANA LETTER GO
61  { 0x30B5, 0x30B6 }, // KATAKANA LETTER SA --> KATAKANA LETTER ZA
62  { 0x30B7, 0x30B8 }, // KATAKANA LETTER SI --> KATAKANA LETTER ZI
63  { 0x30B9, 0x30BA }, // KATAKANA LETTER SU --> KATAKANA LETTER ZU
64  { 0x30BB, 0x30BC }, // KATAKANA LETTER SE --> KATAKANA LETTER ZE
65  { 0x30BD, 0x30BE }, // KATAKANA LETTER SO --> KATAKANA LETTER ZO
66  { 0x30BF, 0x30C0 }, // KATAKANA LETTER TA --> KATAKANA LETTER DA
67  { 0x30C1, 0x30C2 }, // KATAKANA LETTER TI --> KATAKANA LETTER DI
68  { 0x30C4, 0x30C5 }, // KATAKANA LETTER TU --> KATAKANA LETTER DU
69  { 0x30C6, 0x30C7 }, // KATAKANA LETTER TE --> KATAKANA LETTER DE
70  { 0x30C8, 0x30C9 }, // KATAKANA LETTER TO --> KATAKANA LETTER DO
71  { 0x30CF, 0x30D0 }, // KATAKANA LETTER HA --> KATAKANA LETTER BA
72  { 0x30D2, 0x30D3 }, // KATAKANA LETTER HI --> KATAKANA LETTER BI
73  { 0x30D5, 0x30D6 }, // KATAKANA LETTER HU --> KATAKANA LETTER BU
74  { 0x30D8, 0x30D9 }, // KATAKANA LETTER HE --> KATAKANA LETTER BE
75  { 0x30DB, 0x30DC }, // KATAKANA LETTER HO --> KATAKANA LETTER BO
76  { 0x30EF, 0x30F7 }, // KATAKANA LETTER WA --> KATAKANA LETTER VA
77  { 0x30F0, 0x30F8 }, // KATAKANA LETTER WI --> KATAKANA LETTER VI
78  { 0x30F1, 0x30F9 }, // KATAKANA LETTER WE --> KATAKANA LETTER VE
79  { 0x30F2, 0x30FA }, // KATAKANA LETTER WO --> KATAKANA LETTER VO
80  { 0x30FD, 0x30FE } // KATAKANA ITERATION MARK --> KATAKANA VOICED ITERATION MARK
81 };
82 
83 
84 OUString
85 ignoreIterationMark_ja_JP::foldingImpl( const OUString& inStr, sal_Int32 startPos, sal_Int32 nCount, Sequence< sal_Int32 >* pOffset )
86 {
87  i18nutil::oneToOneMapping aTable(ignoreIterationMark_ja_JP_mappingTable, sizeof(ignoreIterationMark_ja_JP_mappingTable));
88 
89  // Create a string buffer which can hold nCount + 1 characters.
90  // The reference count is 1 now.
91  rtl_uString * newStr = rtl_uString_alloc(nCount);
92  sal_Unicode * dst = newStr->buffer;
93  const sal_Unicode * src = inStr.getStr() + startPos;
94 
95  if (pOffset) {
96  // Allocate nCount length to offset argument.
97  pOffset->realloc( nCount );
98  auto [begin, end] = asNonConstRange(*pOffset);
99  std::iota(begin, end, startPos);
100  }
101 
102 
103  sal_Unicode previousChar = *src ++;
104  sal_Unicode currentChar;
105 
106  // Conversion
107  while (-- nCount > 0) {
108  currentChar = *src ++;
109 
110  switch ( currentChar ) {
111  case 0x30fd: // KATAKANA ITERATION MARK
112  case 0x309d: // HIRAGANA ITERATION MARK
113  case 0x3005: // IDEOGRAPHIC ITERATION MARK
114  currentChar = previousChar;
115  break;
116  case 0x30fe: // KATAKANA VOICED ITERATION MARK
117  case 0x309e: // HIRAGANA VOICED ITERATION MARK
118  currentChar = aTable[ previousChar ];
119  break;
120  }
121  *dst ++ = previousChar;
122  previousChar = currentChar;
123  }
124 
125  if (nCount == 0) {
126  *dst ++ = previousChar;
127  }
128 
129  *dst = u'\0';
130 
131  newStr->length = sal_Int32(dst - newStr->buffer);
132  if (pOffset)
133  pOffset->realloc(newStr->length);
134  return OUString(newStr, SAL_NO_ACQUIRE); // take ownership
135 }
136 
137 }
138 
139 /* vim:set shiftwidth=4 softtabstop=4 expandtab: */
sal_uInt16 sal_Unicode
enumrange< T >::Iterator begin(enumrange< T >)
float u
Constant values shared between i18npool and, for example, the number formatter.
enumrange< T >::Iterator end(enumrange< T >)
i18nutil::OneToOneMappingTable_t const ignoreIterationMark_ja_JP_mappingTable[]