xref: /aoo41x/main/l10ntools/source/utf8conv.cxx (revision cdf0e10c)
1*cdf0e10cSrcweir /*************************************************************************
2*cdf0e10cSrcweir  *
3*cdf0e10cSrcweir  * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
4*cdf0e10cSrcweir  *
5*cdf0e10cSrcweir  * Copyright 2000, 2010 Oracle and/or its affiliates.
6*cdf0e10cSrcweir  *
7*cdf0e10cSrcweir  * OpenOffice.org - a multi-platform office productivity suite
8*cdf0e10cSrcweir  *
9*cdf0e10cSrcweir  * This file is part of OpenOffice.org.
10*cdf0e10cSrcweir  *
11*cdf0e10cSrcweir  * OpenOffice.org is free software: you can redistribute it and/or modify
12*cdf0e10cSrcweir  * it under the terms of the GNU Lesser General Public License version 3
13*cdf0e10cSrcweir  * only, as published by the Free Software Foundation.
14*cdf0e10cSrcweir  *
15*cdf0e10cSrcweir  * OpenOffice.org is distributed in the hope that it will be useful,
16*cdf0e10cSrcweir  * but WITHOUT ANY WARRANTY; without even the implied warranty of
17*cdf0e10cSrcweir  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
18*cdf0e10cSrcweir  * GNU Lesser General Public License version 3 for more details
19*cdf0e10cSrcweir  * (a copy is included in the LICENSE file that accompanied this code).
20*cdf0e10cSrcweir  *
21*cdf0e10cSrcweir  * You should have received a copy of the GNU Lesser General Public License
22*cdf0e10cSrcweir  * version 3 along with OpenOffice.org.  If not, see
23*cdf0e10cSrcweir  * <http://www.openoffice.org/license.html>
24*cdf0e10cSrcweir  * for a copy of the LGPLv3 License.
25*cdf0e10cSrcweir  *
26*cdf0e10cSrcweir  ************************************************************************/
27*cdf0e10cSrcweir 
28*cdf0e10cSrcweir // MARKER(update_precomp.py): autogen include statement, do not remove
29*cdf0e10cSrcweir #include "precompiled_l10ntools.hxx"
30*cdf0e10cSrcweir #include "utf8conv.hxx"
31*cdf0e10cSrcweir 
32*cdf0e10cSrcweir //
33*cdf0e10cSrcweir // class UTF8Converter
34*cdf0e10cSrcweir //
35*cdf0e10cSrcweir 
// Size constant (0xFF00 == 65280). Not referenced by the functions visible
// in this part of the file.
#define MAX_CONV_BUFFER_SIZE	0xFF00

// Combined RTL_TEXTTOUNICODE_* flags for the byte-text -> Unicode direction.
// Not passed to any call visible in this part of the file.
#define TO_CVTFLAGS \
	( RTL_TEXTTOUNICODE_FLAGS_UNDEFINED_MAPTOPRIVATE \
	| RTL_TEXTTOUNICODE_FLAGS_MBUNDEFINED_DEFAULT \
	| RTL_TEXTTOUNICODE_FLAGS_INVALID_DEFAULT )

// Combined RTL_UNICODETOTEXT_* flags for the Unicode -> byte-text direction.
// Not passed to any call visible in this part of the file.
#define FROM_CVTFLAGS \
	( RTL_UNICODETOTEXT_FLAGS_UNDEFINED_DEFAULT \
	| RTL_UNICODETOTEXT_FLAGS_INVALID_DEFAULT \
	| RTL_UNICODETOTEXT_FLAGS_UNDEFINED_REPLACE \
	| RTL_UNICODETOTEXT_FLAGS_PRIVATE_MAPTO0 )
46*cdf0e10cSrcweir 
47*cdf0e10cSrcweir /*****************************************************************************/
48*cdf0e10cSrcweir void UTF8Converter::Convert( ByteString &rBuffer,
49*cdf0e10cSrcweir 	rtl_TextEncoding nSourceENC, rtl_TextEncoding nDestENC )
50*cdf0e10cSrcweir /*****************************************************************************/
51*cdf0e10cSrcweir {
52*cdf0e10cSrcweir 	String sTemp( rBuffer, nSourceENC );
53*cdf0e10cSrcweir 	rBuffer = ByteString( sTemp, nDestENC );
54*cdf0e10cSrcweir }
55*cdf0e10cSrcweir 
56*cdf0e10cSrcweir /*****************************************************************************/
57*cdf0e10cSrcweir ByteString UTF8Converter::ConvertToUTF8(
58*cdf0e10cSrcweir 	const ByteString &rASCII, rtl_TextEncoding nEncoding )
59*cdf0e10cSrcweir /*****************************************************************************/
60*cdf0e10cSrcweir {
61*cdf0e10cSrcweir 	ByteString sReturn( rASCII );
62*cdf0e10cSrcweir 	Convert( sReturn, nEncoding, RTL_TEXTENCODING_UTF8 );
63*cdf0e10cSrcweir 	return sReturn;
64*cdf0e10cSrcweir }
65*cdf0e10cSrcweir 
66*cdf0e10cSrcweir /*****************************************************************************/
67*cdf0e10cSrcweir ByteString UTF8Converter::ConvertFromUTF8(
68*cdf0e10cSrcweir 	const ByteString &rUTF8, rtl_TextEncoding nEncoding )
69*cdf0e10cSrcweir /*****************************************************************************/
70*cdf0e10cSrcweir {
71*cdf0e10cSrcweir 	ByteString sReturn( rUTF8 );
72*cdf0e10cSrcweir 	Convert( sReturn, RTL_TEXTENCODING_UTF8, nEncoding );
73*cdf0e10cSrcweir 	return sReturn;
74*cdf0e10cSrcweir }
75