1*b1cdbd2cSJim Jagielski /**************************************************************
2*b1cdbd2cSJim Jagielski *
3*b1cdbd2cSJim Jagielski * Licensed to the Apache Software Foundation (ASF) under one
4*b1cdbd2cSJim Jagielski * or more contributor license agreements. See the NOTICE file
5*b1cdbd2cSJim Jagielski * distributed with this work for additional information
6*b1cdbd2cSJim Jagielski * regarding copyright ownership. The ASF licenses this file
7*b1cdbd2cSJim Jagielski * to you under the Apache License, Version 2.0 (the
8*b1cdbd2cSJim Jagielski * "License"); you may not use this file except in compliance
9*b1cdbd2cSJim Jagielski * with the License. You may obtain a copy of the License at
10*b1cdbd2cSJim Jagielski *
11*b1cdbd2cSJim Jagielski * http://www.apache.org/licenses/LICENSE-2.0
12*b1cdbd2cSJim Jagielski *
13*b1cdbd2cSJim Jagielski * Unless required by applicable law or agreed to in writing,
14*b1cdbd2cSJim Jagielski * software distributed under the License is distributed on an
15*b1cdbd2cSJim Jagielski * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
16*b1cdbd2cSJim Jagielski * KIND, either express or implied. See the License for the
17*b1cdbd2cSJim Jagielski * specific language governing permissions and limitations
18*b1cdbd2cSJim Jagielski * under the License.
19*b1cdbd2cSJim Jagielski *
20*b1cdbd2cSJim Jagielski *************************************************************/
21*b1cdbd2cSJim Jagielski
22*b1cdbd2cSJim Jagielski
23*b1cdbd2cSJim Jagielski
24*b1cdbd2cSJim Jagielski // MARKER(update_precomp.py): autogen include statement, do not remove
25*b1cdbd2cSJim Jagielski #include "precompiled_sw.hxx"
26*b1cdbd2cSJim Jagielski
27*b1cdbd2cSJim Jagielski #include "breakit.hxx"
28*b1cdbd2cSJim Jagielski #include <unicode/uchar.h>
29*b1cdbd2cSJim Jagielski #include <com/sun/star/lang/XMultiServiceFactory.hpp>
30*b1cdbd2cSJim Jagielski #ifndef _COM_SUN_STAR_I18N_SCRIPTTYPE_HDL_
31*b1cdbd2cSJim Jagielski #include <com/sun/star/i18n/ScriptType.hdl>
32*b1cdbd2cSJim Jagielski #endif
33*b1cdbd2cSJim Jagielski #include <unotools/localedatawrapper.hxx>
34*b1cdbd2cSJim Jagielski
35*b1cdbd2cSJim Jagielski #ifndef _SVX_LINGU_HXX
36*b1cdbd2cSJim Jagielski #include <editeng/unolingu.hxx>
37*b1cdbd2cSJim Jagielski #endif
38*b1cdbd2cSJim Jagielski #include <editeng/scripttypeitem.hxx>
39*b1cdbd2cSJim Jagielski #include "swtypes.hxx"
40*b1cdbd2cSJim Jagielski
41*b1cdbd2cSJim Jagielski using namespace com::sun::star;
42*b1cdbd2cSJim Jagielski
43*b1cdbd2cSJim Jagielski SwBreakIt * pBreakIt = 0;
44*b1cdbd2cSJim Jagielski
_Create(const uno::Reference<lang::XMultiServiceFactory> & rxMSF)45*b1cdbd2cSJim Jagielski void SwBreakIt::_Create(
46*b1cdbd2cSJim Jagielski const uno::Reference< lang::XMultiServiceFactory > & rxMSF)
47*b1cdbd2cSJim Jagielski {
48*b1cdbd2cSJim Jagielski delete pBreakIt, pBreakIt = new SwBreakIt( rxMSF );
49*b1cdbd2cSJim Jagielski }
50*b1cdbd2cSJim Jagielski
_Delete()51*b1cdbd2cSJim Jagielski void SwBreakIt::_Delete()
52*b1cdbd2cSJim Jagielski {
53*b1cdbd2cSJim Jagielski delete pBreakIt, pBreakIt = 0;
54*b1cdbd2cSJim Jagielski }
55*b1cdbd2cSJim Jagielski
Get()56*b1cdbd2cSJim Jagielski SwBreakIt * SwBreakIt::Get()
57*b1cdbd2cSJim Jagielski {
58*b1cdbd2cSJim Jagielski return pBreakIt;
59*b1cdbd2cSJim Jagielski }
60*b1cdbd2cSJim Jagielski
SwBreakIt(const uno::Reference<lang::XMultiServiceFactory> & rxMSF)61*b1cdbd2cSJim Jagielski SwBreakIt::SwBreakIt(
62*b1cdbd2cSJim Jagielski const uno::Reference< lang::XMultiServiceFactory > & rxMSF)
63*b1cdbd2cSJim Jagielski : m_xMSF( rxMSF ),
64*b1cdbd2cSJim Jagielski m_pLocale( NULL ),
65*b1cdbd2cSJim Jagielski m_pForbidden( NULL ),
66*b1cdbd2cSJim Jagielski aLast( LANGUAGE_DONTKNOW ),
67*b1cdbd2cSJim Jagielski aForbiddenLang( LANGUAGE_DONTKNOW)
68*b1cdbd2cSJim Jagielski {
69*b1cdbd2cSJim Jagielski DBG_ASSERT( m_xMSF.is(), "SwBreakIt: no MultiServiceFactory" );
70*b1cdbd2cSJim Jagielski //if ( m_xMSF.is() )
71*b1cdbd2cSJim Jagielski //{
72*b1cdbd2cSJim Jagielski // xBreak = uno::Reference< i18n::XBreakIterator >(
73*b1cdbd2cSJim Jagielski // m_xMSF->createInstance(
74*b1cdbd2cSJim Jagielski // rtl::OUString::createFromAscii( "com.sun.star.i18n.BreakIterator" ) ),
75*b1cdbd2cSJim Jagielski // uno::UNO_QUERY);
76*b1cdbd2cSJim Jagielski
77*b1cdbd2cSJim Jagielski // xCTLDetect = uno::Reference< i18n::XScriptTypeDetector >(
78*b1cdbd2cSJim Jagielski // m_xMSF->createInstance(
79*b1cdbd2cSJim Jagielski // rtl::OUString::createFromAscii( "com.sun.star.i18n.ScriptTypeDetector" ) ),
80*b1cdbd2cSJim Jagielski // uno::UNO_QUERY);
81*b1cdbd2cSJim Jagielski // }
82*b1cdbd2cSJim Jagielski }
83*b1cdbd2cSJim Jagielski
~SwBreakIt()84*b1cdbd2cSJim Jagielski SwBreakIt::~SwBreakIt()
85*b1cdbd2cSJim Jagielski {
86*b1cdbd2cSJim Jagielski delete m_pLocale;
87*b1cdbd2cSJim Jagielski delete m_pForbidden;
88*b1cdbd2cSJim Jagielski }
createBreakIterator() const89*b1cdbd2cSJim Jagielski void SwBreakIt::createBreakIterator() const
90*b1cdbd2cSJim Jagielski {
91*b1cdbd2cSJim Jagielski if ( m_xMSF.is() && !xBreak.is() )
92*b1cdbd2cSJim Jagielski xBreak.set(m_xMSF->createInstance(::rtl::OUString(RTL_CONSTASCII_USTRINGPARAM("com.sun.star.i18n.BreakIterator"))),uno::UNO_QUERY);
93*b1cdbd2cSJim Jagielski }
createScriptTypeDetector()94*b1cdbd2cSJim Jagielski void SwBreakIt::createScriptTypeDetector()
95*b1cdbd2cSJim Jagielski {
96*b1cdbd2cSJim Jagielski if ( m_xMSF.is() && !xCTLDetect.is() )
97*b1cdbd2cSJim Jagielski xCTLDetect.set(m_xMSF->createInstance(rtl::OUString(RTL_CONSTASCII_USTRINGPARAM( "com.sun.star.i18n.ScriptTypeDetector" ))),uno::UNO_QUERY);
98*b1cdbd2cSJim Jagielski }
_GetLocale(const LanguageType aLang)99*b1cdbd2cSJim Jagielski void SwBreakIt::_GetLocale( const LanguageType aLang )
100*b1cdbd2cSJim Jagielski {
101*b1cdbd2cSJim Jagielski aLast = aLang;
102*b1cdbd2cSJim Jagielski delete m_pLocale;
103*b1cdbd2cSJim Jagielski m_pLocale = new lang::Locale( SvxCreateLocale( aLast ) );
104*b1cdbd2cSJim Jagielski }
105*b1cdbd2cSJim Jagielski
_GetForbidden(const LanguageType aLang)106*b1cdbd2cSJim Jagielski void SwBreakIt::_GetForbidden( const LanguageType aLang )
107*b1cdbd2cSJim Jagielski {
108*b1cdbd2cSJim Jagielski LocaleDataWrapper aWrap( m_xMSF, GetLocale( aLang ) );
109*b1cdbd2cSJim Jagielski
110*b1cdbd2cSJim Jagielski aForbiddenLang = aLang;
111*b1cdbd2cSJim Jagielski delete m_pForbidden;
112*b1cdbd2cSJim Jagielski m_pForbidden = new i18n::ForbiddenCharacters( aWrap.getForbiddenCharacters() );
113*b1cdbd2cSJim Jagielski }
114*b1cdbd2cSJim Jagielski
GetRealScriptOfText(const String & rTxt,xub_StrLen nPos) const115*b1cdbd2cSJim Jagielski sal_uInt16 SwBreakIt::GetRealScriptOfText( const String& rTxt,
116*b1cdbd2cSJim Jagielski xub_StrLen nPos ) const
117*b1cdbd2cSJim Jagielski {
118*b1cdbd2cSJim Jagielski createBreakIterator();
119*b1cdbd2cSJim Jagielski sal_uInt16 nScript = i18n::ScriptType::WEAK;
120*b1cdbd2cSJim Jagielski if( xBreak.is() && rTxt.Len() )
121*b1cdbd2cSJim Jagielski {
122*b1cdbd2cSJim Jagielski if( nPos && nPos == rTxt.Len() )
123*b1cdbd2cSJim Jagielski --nPos;
124*b1cdbd2cSJim Jagielski nScript = xBreak->getScriptType( rTxt, nPos );
125*b1cdbd2cSJim Jagielski sal_Int32 nChgPos = 0;
126*b1cdbd2cSJim Jagielski if ( i18n::ScriptType::WEAK == nScript && nPos + 1 < rTxt.Len() )
127*b1cdbd2cSJim Jagielski {
128*b1cdbd2cSJim Jagielski // A weak character followed by a mark may be meant to combine with
129*b1cdbd2cSJim Jagielski // the mark, so prefer the following character's script
130*b1cdbd2cSJim Jagielski switch ( u_charType(rTxt.GetChar(nPos + 1) ) ) {
131*b1cdbd2cSJim Jagielski case U_NON_SPACING_MARK:
132*b1cdbd2cSJim Jagielski case U_ENCLOSING_MARK:
133*b1cdbd2cSJim Jagielski case U_COMBINING_SPACING_MARK:
134*b1cdbd2cSJim Jagielski nScript = xBreak->getScriptType( rTxt, nPos+1 );
135*b1cdbd2cSJim Jagielski break;
136*b1cdbd2cSJim Jagielski }
137*b1cdbd2cSJim Jagielski }
138*b1cdbd2cSJim Jagielski if( i18n::ScriptType::WEAK == nScript && nPos &&
139*b1cdbd2cSJim Jagielski 0 < (nChgPos = xBreak->beginOfScript( rTxt, nPos, nScript )) )
140*b1cdbd2cSJim Jagielski nScript = xBreak->getScriptType( rTxt, nChgPos-1 );
141*b1cdbd2cSJim Jagielski
142*b1cdbd2cSJim Jagielski if( i18n::ScriptType::WEAK == nScript && rTxt.Len() >
143*b1cdbd2cSJim Jagielski ( nChgPos = xBreak->endOfScript( rTxt, nPos, nScript ) ) &&
144*b1cdbd2cSJim Jagielski 0 <= nChgPos )
145*b1cdbd2cSJim Jagielski nScript = xBreak->getScriptType( rTxt, nChgPos );
146*b1cdbd2cSJim Jagielski }
147*b1cdbd2cSJim Jagielski if( i18n::ScriptType::WEAK == nScript )
148*b1cdbd2cSJim Jagielski nScript = GetI18NScriptTypeOfLanguage( (sal_uInt16)GetAppLanguage() );
149*b1cdbd2cSJim Jagielski return nScript;
150*b1cdbd2cSJim Jagielski }
151*b1cdbd2cSJim Jagielski
GetAllScriptsOfText(const String & rTxt) const152*b1cdbd2cSJim Jagielski sal_uInt16 SwBreakIt::GetAllScriptsOfText( const String& rTxt ) const
153*b1cdbd2cSJim Jagielski {
154*b1cdbd2cSJim Jagielski const sal_uInt16 coAllScripts = ( SCRIPTTYPE_LATIN |
155*b1cdbd2cSJim Jagielski SCRIPTTYPE_ASIAN |
156*b1cdbd2cSJim Jagielski SCRIPTTYPE_COMPLEX );
157*b1cdbd2cSJim Jagielski createBreakIterator();
158*b1cdbd2cSJim Jagielski sal_uInt16 nRet = 0, nScript;
159*b1cdbd2cSJim Jagielski if( !xBreak.is() )
160*b1cdbd2cSJim Jagielski nRet = coAllScripts;
161*b1cdbd2cSJim Jagielski else if( rTxt.Len() )
162*b1cdbd2cSJim Jagielski {
163*b1cdbd2cSJim Jagielski for( xub_StrLen n = 0, nEnd = rTxt.Len(); n < nEnd;
164*b1cdbd2cSJim Jagielski n = static_cast<xub_StrLen>(xBreak->endOfScript( rTxt, n, nScript )) )
165*b1cdbd2cSJim Jagielski {
166*b1cdbd2cSJim Jagielski switch( nScript = xBreak->getScriptType( rTxt, n ) )
167*b1cdbd2cSJim Jagielski {
168*b1cdbd2cSJim Jagielski case i18n::ScriptType::LATIN: nRet |= SCRIPTTYPE_LATIN; break;
169*b1cdbd2cSJim Jagielski case i18n::ScriptType::ASIAN: nRet |= SCRIPTTYPE_ASIAN; break;
170*b1cdbd2cSJim Jagielski case i18n::ScriptType::COMPLEX: nRet |= SCRIPTTYPE_COMPLEX; break;
171*b1cdbd2cSJim Jagielski case i18n::ScriptType::WEAK:
172*b1cdbd2cSJim Jagielski if( !nRet )
173*b1cdbd2cSJim Jagielski nRet |= coAllScripts;
174*b1cdbd2cSJim Jagielski break;
175*b1cdbd2cSJim Jagielski }
176*b1cdbd2cSJim Jagielski if( coAllScripts == nRet )
177*b1cdbd2cSJim Jagielski break;
178*b1cdbd2cSJim Jagielski }
179*b1cdbd2cSJim Jagielski }
180*b1cdbd2cSJim Jagielski return nRet;
181*b1cdbd2cSJim Jagielski }
182*b1cdbd2cSJim Jagielski
183