1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
|
/* -*- Mode: C++; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4 -*- */
/*
* This file is part of the LibreOffice project.
*
* This Source Code Form is subject to the terms of the Mozilla Public
* License, v. 2.0. If a copy of the MPL was not distributed with this
* file, You can obtain one at http://mozilla.org/MPL/2.0/.
*
* This file incorporates work covered by the following license notice:
*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed
* with this work for additional information regarding copyright
* ownership. The ASF licenses this file to you under the Apache
* License, Version 2.0 (the "License"); you may not use this file
* except in compliance with the License. You may obtain a copy of
* the License at http://www.apache.org/licenses/LICENSE-2.0 .
*/
#include <i18nutil/oneToOneMapping.hxx>
#include <transliteration_Ignore.hxx>
#include <numeric>
using namespace com::sun::star::uno;
using namespace com::sun::star::lang;
namespace i18npool {
i18nutil::OneToOneMappingTable_t const ignoreIterationMark_ja_JP_mappingTable[] = {
{ 0x3046, 0x3094 }, // HIRAGANA LETTER U --> HIRAGANA LETTER VU
{ 0x304B, 0x304C }, // HIRAGANA LETTER KA --> HIRAGANA LETTER GA
{ 0x304D, 0x304E }, // HIRAGANA LETTER KI --> HIRAGANA LETTER GI
{ 0x304F, 0x3050 }, // HIRAGANA LETTER KU --> HIRAGANA LETTER GU
{ 0x3051, 0x3052 }, // HIRAGANA LETTER KE --> HIRAGANA LETTER GE
{ 0x3053, 0x3054 }, // HIRAGANA LETTER KO --> HIRAGANA LETTER GO
{ 0x3055, 0x3056 }, // HIRAGANA LETTER SA --> HIRAGANA LETTER ZA
{ 0x3057, 0x3058 }, // HIRAGANA LETTER SI --> HIRAGANA LETTER ZI
{ 0x3059, 0x305A }, // HIRAGANA LETTER SU --> HIRAGANA LETTER ZU
{ 0x305B, 0x305C }, // HIRAGANA LETTER SE --> HIRAGANA LETTER ZE
{ 0x305D, 0x305E }, // HIRAGANA LETTER SO --> HIRAGANA LETTER ZO
{ 0x305F, 0x3060 }, // HIRAGANA LETTER TA --> HIRAGANA LETTER DA
{ 0x3061, 0x3062 }, // HIRAGANA LETTER TI --> HIRAGANA LETTER DI
{ 0x3064, 0x3065 }, // HIRAGANA LETTER TU --> HIRAGANA LETTER DU
{ 0x3066, 0x3067 }, // HIRAGANA LETTER TE --> HIRAGANA LETTER DE
{ 0x3068, 0x3069 }, // HIRAGANA LETTER TO --> HIRAGANA LETTER DO
{ 0x306F, 0x3070 }, // HIRAGANA LETTER HA --> HIRAGANA LETTER BA
{ 0x3072, 0x3073 }, // HIRAGANA LETTER HI --> HIRAGANA LETTER BI
{ 0x3075, 0x3076 }, // HIRAGANA LETTER HU --> HIRAGANA LETTER BU
{ 0x3078, 0x3079 }, // HIRAGANA LETTER HE --> HIRAGANA LETTER BE
{ 0x307B, 0x307C }, // HIRAGANA LETTER HO --> HIRAGANA LETTER BO
{ 0x309D, 0x309E }, // HIRAGANA ITERATION MARK --> HIRAGANA VOICED ITERATION MARK
{ 0x30A6, 0x30F4 }, // KATAKANA LETTER U --> KATAKANA LETTER VU
{ 0x30AB, 0x30AC }, // KATAKANA LETTER KA --> KATAKANA LETTER GA
{ 0x30AD, 0x30AE }, // KATAKANA LETTER KI --> KATAKANA LETTER GI
{ 0x30AF, 0x30B0 }, // KATAKANA LETTER KU --> KATAKANA LETTER GU
{ 0x30B1, 0x30B2 }, // KATAKANA LETTER KE --> KATAKANA LETTER GE
{ 0x30B3, 0x30B4 }, // KATAKANA LETTER KO --> KATAKANA LETTER GO
{ 0x30B5, 0x30B6 }, // KATAKANA LETTER SA --> KATAKANA LETTER ZA
{ 0x30B7, 0x30B8 }, // KATAKANA LETTER SI --> KATAKANA LETTER ZI
{ 0x30B9, 0x30BA }, // KATAKANA LETTER SU --> KATAKANA LETTER ZU
{ 0x30BB, 0x30BC }, // KATAKANA LETTER SE --> KATAKANA LETTER ZE
{ 0x30BD, 0x30BE }, // KATAKANA LETTER SO --> KATAKANA LETTER ZO
{ 0x30BF, 0x30C0 }, // KATAKANA LETTER TA --> KATAKANA LETTER DA
{ 0x30C1, 0x30C2 }, // KATAKANA LETTER TI --> KATAKANA LETTER DI
{ 0x30C4, 0x30C5 }, // KATAKANA LETTER TU --> KATAKANA LETTER DU
{ 0x30C6, 0x30C7 }, // KATAKANA LETTER TE --> KATAKANA LETTER DE
{ 0x30C8, 0x30C9 }, // KATAKANA LETTER TO --> KATAKANA LETTER DO
{ 0x30CF, 0x30D0 }, // KATAKANA LETTER HA --> KATAKANA LETTER BA
{ 0x30D2, 0x30D3 }, // KATAKANA LETTER HI --> KATAKANA LETTER BI
{ 0x30D5, 0x30D6 }, // KATAKANA LETTER HU --> KATAKANA LETTER BU
{ 0x30D8, 0x30D9 }, // KATAKANA LETTER HE --> KATAKANA LETTER BE
{ 0x30DB, 0x30DC }, // KATAKANA LETTER HO --> KATAKANA LETTER BO
{ 0x30EF, 0x30F7 }, // KATAKANA LETTER WA --> KATAKANA LETTER VA
{ 0x30F0, 0x30F8 }, // KATAKANA LETTER WI --> KATAKANA LETTER VI
{ 0x30F1, 0x30F9 }, // KATAKANA LETTER WE --> KATAKANA LETTER VE
{ 0x30F2, 0x30FA }, // KATAKANA LETTER WO --> KATAKANA LETTER VO
{ 0x30FD, 0x30FE } // KATAKANA ITERATION MARK --> KATAKANA VOICED ITERATION MARK
};
OUString
ignoreIterationMark_ja_JP::foldingImpl( const OUString& inStr, sal_Int32 startPos, sal_Int32 nCount, Sequence< sal_Int32 >* pOffset )
{
i18nutil::oneToOneMapping aTable(ignoreIterationMark_ja_JP_mappingTable, sizeof(ignoreIterationMark_ja_JP_mappingTable));
// Create a string buffer which can hold nCount + 1 characters.
// The reference count is 1 now.
rtl_uString * newStr = rtl_uString_alloc(nCount);
sal_Unicode * dst = newStr->buffer;
const sal_Unicode * src = inStr.getStr() + startPos;
if (pOffset) {
// Allocate nCount length to offset argument.
pOffset->realloc( nCount );
auto [begin, end] = asNonConstRange(*pOffset);
std::iota(begin, end, startPos);
}
sal_Unicode previousChar = *src ++;
sal_Unicode currentChar;
// Conversion
while (-- nCount > 0) {
currentChar = *src ++;
switch ( currentChar ) {
case 0x30fd: // KATAKANA ITERATION MARK
case 0x309d: // HIRAGANA ITERATION MARK
case 0x3005: // IDEOGRAPHIC ITERATION MARK
currentChar = previousChar;
break;
case 0x30fe: // KATAKANA VOICED ITERATION MARK
case 0x309e: // HIRAGANA VOICED ITERATION MARK
currentChar = aTable[ previousChar ];
break;
}
*dst ++ = previousChar;
previousChar = currentChar;
}
if (nCount == 0) {
*dst ++ = previousChar;
}
*dst = u'\0';
newStr->length = sal_Int32(dst - newStr->buffer);
if (pOffset)
pOffset->realloc(newStr->length);
return OUString(newStr, SAL_NO_ACQUIRE); // take ownership
}
}
/* vim:set shiftwidth=4 softtabstop=4 expandtab: */
|