/**************************************************************
 *
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *   http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing,
 * software distributed under the License is distributed on an
 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 * KIND, either express or implied.  See the License for the
 * specific language governing permissions and limitations
 * under the License.
 *
 *************************************************************/
21449ab281SAndrew Rist
22449ab281SAndrew Rist
23cdf0e10cSrcweir
24cdf0e10cSrcweir // MARKER(update_precomp.py): autogen include statement, do not remove
25cdf0e10cSrcweir #include "precompiled_i18npool.hxx"
26cdf0e10cSrcweir
27cdf0e10cSrcweir // prevent internal compiler error with MSVC6SP3
28cdf0e10cSrcweir #include <utility>
29cdf0e10cSrcweir
30cdf0e10cSrcweir #include <i18nutil/oneToOneMapping.hxx>
31cdf0e10cSrcweir #define TRANSLITERATION_IandEfollowedByYa_ja_JP
32cdf0e10cSrcweir #include <transliteration_Ignore.hxx>
33cdf0e10cSrcweir
34cdf0e10cSrcweir using namespace com::sun::star::uno;
35cdf0e10cSrcweir using namespace com::sun::star::lang;
36cdf0e10cSrcweir using namespace rtl;
37cdf0e10cSrcweir
38cdf0e10cSrcweir namespace com { namespace sun { namespace star { namespace i18n {
39cdf0e10cSrcweir
40cdf0e10cSrcweir OneToOneMappingTable_t IandE[] = {
41cdf0e10cSrcweir MAKE_PAIR( 0x30A3, 0x0000 ), // KATAKANA LETTER SMALL I
42cdf0e10cSrcweir MAKE_PAIR( 0x30A4, 0x0000 ), // KATAKANA LETTER I
43cdf0e10cSrcweir MAKE_PAIR( 0x30A7, 0x0000 ), // KATAKANA LETTER SMALL E
44cdf0e10cSrcweir MAKE_PAIR( 0x30A8, 0x0000 ), // KATAKANA LETTER E
45cdf0e10cSrcweir MAKE_PAIR( 0x30AD, 0x0000 ), // KATAKANA LETTER KI
46cdf0e10cSrcweir MAKE_PAIR( 0x30AE, 0x0000 ), // KATAKANA LETTER GI
47cdf0e10cSrcweir MAKE_PAIR( 0x30B1, 0x0000 ), // KATAKANA LETTER KE
48cdf0e10cSrcweir MAKE_PAIR( 0x30B2, 0x0000 ), // KATAKANA LETTER GE
49cdf0e10cSrcweir MAKE_PAIR( 0x30B7, 0x0000 ), // KATAKANA LETTER SI
50cdf0e10cSrcweir MAKE_PAIR( 0x30B8, 0x0000 ), // KATAKANA LETTER ZI
51cdf0e10cSrcweir MAKE_PAIR( 0x30BB, 0x0000 ), // KATAKANA LETTER SE
52cdf0e10cSrcweir MAKE_PAIR( 0x30BC, 0x0000 ), // KATAKANA LETTER ZE
53cdf0e10cSrcweir MAKE_PAIR( 0x30C1, 0x0000 ), // KATAKANA LETTER TI
54cdf0e10cSrcweir MAKE_PAIR( 0x30C2, 0x0000 ), // KATAKANA LETTER DI
55cdf0e10cSrcweir MAKE_PAIR( 0x30C6, 0x0000 ), // KATAKANA LETTER TE
56cdf0e10cSrcweir MAKE_PAIR( 0x30C7, 0x0000 ), // KATAKANA LETTER DE
57cdf0e10cSrcweir MAKE_PAIR( 0x30CB, 0x0000 ), // KATAKANA LETTER NI
58cdf0e10cSrcweir MAKE_PAIR( 0x30CD, 0x0000 ), // KATAKANA LETTER NE
59cdf0e10cSrcweir MAKE_PAIR( 0x30D2, 0x0000 ), // KATAKANA LETTER HI
60cdf0e10cSrcweir MAKE_PAIR( 0x30D3, 0x0000 ), // KATAKANA LETTER BI
61cdf0e10cSrcweir MAKE_PAIR( 0x30D4, 0x0000 ), // KATAKANA LETTER PI
62cdf0e10cSrcweir MAKE_PAIR( 0x30D8, 0x0000 ), // KATAKANA LETTER HE
63cdf0e10cSrcweir MAKE_PAIR( 0x30D9, 0x0000 ), // KATAKANA LETTER BE
64cdf0e10cSrcweir MAKE_PAIR( 0x30DA, 0x0000 ), // KATAKANA LETTER PE
65cdf0e10cSrcweir MAKE_PAIR( 0x30DF, 0x0000 ), // KATAKANA LETTER MI
66cdf0e10cSrcweir MAKE_PAIR( 0x30E1, 0x0000 ), // KATAKANA LETTER ME
67cdf0e10cSrcweir MAKE_PAIR( 0x30EA, 0x0000 ), // KATAKANA LETTER RI
68cdf0e10cSrcweir MAKE_PAIR( 0x30EC, 0x0000 ), // KATAKANA LETTER RE
69cdf0e10cSrcweir MAKE_PAIR( 0x30F0, 0x0000 ), // KATAKANA LETTER WI
70cdf0e10cSrcweir MAKE_PAIR( 0x30F1, 0x0000 ), // KATAKANA LETTER WE
71cdf0e10cSrcweir MAKE_PAIR( 0x30F6, 0x0000 ), // KATAKANA LETTER SMALL KE
72cdf0e10cSrcweir MAKE_PAIR( 0x30F8, 0x0000 ), // KATAKANA LETTER VI
73cdf0e10cSrcweir MAKE_PAIR( 0x30F9, 0x0000 ) // KATAKANA LETTER VE
74cdf0e10cSrcweir };
75cdf0e10cSrcweir
76cdf0e10cSrcweir
77cdf0e10cSrcweir
78cdf0e10cSrcweir
79cdf0e10cSrcweir OUString SAL_CALL
folding(const OUString & inStr,sal_Int32 startPos,sal_Int32 nCount,Sequence<sal_Int32> & offset)80cdf0e10cSrcweir ignoreIandEfollowedByYa_ja_JP::folding( const OUString& inStr, sal_Int32 startPos, sal_Int32 nCount, Sequence< sal_Int32 >& offset )
81cdf0e10cSrcweir throw(RuntimeException)
82cdf0e10cSrcweir {
83cdf0e10cSrcweir // Create a string buffer which can hold nCount + 1 characters.
84cdf0e10cSrcweir // The reference count is 0 now.
85cdf0e10cSrcweir rtl_uString * newStr = x_rtl_uString_new_WithLength( nCount ); // defined in x_rtl_ustring.h
86cdf0e10cSrcweir sal_Unicode * dst = newStr->buffer;
87cdf0e10cSrcweir const sal_Unicode * src = inStr.getStr() + startPos;
88cdf0e10cSrcweir
89cdf0e10cSrcweir sal_Int32 *p = 0;
90cdf0e10cSrcweir sal_Int32 position = 0;
91cdf0e10cSrcweir if (useOffset) {
92cdf0e10cSrcweir // Allocate nCount length to offset argument.
93cdf0e10cSrcweir offset.realloc( nCount );
94cdf0e10cSrcweir p = offset.getArray();
95cdf0e10cSrcweir position = startPos;
96cdf0e10cSrcweir }
97cdf0e10cSrcweir
98cdf0e10cSrcweir //
99cdf0e10cSrcweir sal_Unicode previousChar = *src ++;
100cdf0e10cSrcweir sal_Unicode currentChar;
101cdf0e10cSrcweir
102cdf0e10cSrcweir // One to one mapping
103cdf0e10cSrcweir oneToOneMapping aTable(IandE, sizeof(IandE));
104cdf0e10cSrcweir
105cdf0e10cSrcweir // Translation
106cdf0e10cSrcweir while (-- nCount > 0) {
107cdf0e10cSrcweir currentChar = *src ++;
108cdf0e10cSrcweir
109cdf0e10cSrcweir // the character listed in above table + YA --> the character + A
110cdf0e10cSrcweir if (currentChar == 0x30E3 || // KATAKANA LETTER SMALL YA
111cdf0e10cSrcweir currentChar == 0x30E4) { // KATAKANA LETTER YA
112cdf0e10cSrcweir if (aTable[ previousChar ] != previousChar) {
113cdf0e10cSrcweir if (useOffset) {
114cdf0e10cSrcweir *p ++ = position++;
115cdf0e10cSrcweir *p ++ = position++;
116cdf0e10cSrcweir }
117cdf0e10cSrcweir *dst ++ = previousChar;
118cdf0e10cSrcweir *dst ++ = 0x30A2; // KATAKANA LETTER A
119cdf0e10cSrcweir previousChar = *src ++;
120cdf0e10cSrcweir nCount --;
121cdf0e10cSrcweir continue;
122cdf0e10cSrcweir }
123cdf0e10cSrcweir }
124cdf0e10cSrcweir
125cdf0e10cSrcweir if (useOffset)
126cdf0e10cSrcweir *p ++ = position++;
127cdf0e10cSrcweir *dst ++ = previousChar;
128cdf0e10cSrcweir previousChar = currentChar;
129cdf0e10cSrcweir }
130cdf0e10cSrcweir
131cdf0e10cSrcweir if (nCount == 0) {
132cdf0e10cSrcweir if (useOffset)
133cdf0e10cSrcweir *p = position;
134cdf0e10cSrcweir *dst ++ = previousChar;
135cdf0e10cSrcweir }
136cdf0e10cSrcweir
137cdf0e10cSrcweir *dst = (sal_Unicode) 0;
138cdf0e10cSrcweir
139cdf0e10cSrcweir newStr->length = sal_Int32(dst - newStr->buffer);
140cdf0e10cSrcweir if (useOffset)
141cdf0e10cSrcweir offset.realloc(newStr->length);
142*4674bdb9SOliver-Rainer Wittmann return OUString( newStr, SAL_NO_ACQUIRE ); // take over ownership of <newStr>
143cdf0e10cSrcweir }
144cdf0e10cSrcweir
145cdf0e10cSrcweir } } } }
146