1 /************************************************************************* 2 * 3 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. 4 * 5 * Copyright 2000, 2010 Oracle and/or its affiliates. 6 * 7 * OpenOffice.org - a multi-platform office productivity suite 8 * 9 * This file is part of OpenOffice.org. 10 * 11 * OpenOffice.org is free software: you can redistribute it and/or modify 12 * it under the terms of the GNU Lesser General Public License version 3 13 * only, as published by the Free Software Foundation. 14 * 15 * OpenOffice.org is distributed in the hope that it will be useful, 16 * but WITHOUT ANY WARRANTY; without even the implied warranty of 17 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the 18 * GNU Lesser General Public License version 3 for more details 19 * (a copy is included in the LICENSE file that accompanied this code). 20 * 21 * You should have received a copy of the GNU Lesser General Public License 22 * version 3 along with OpenOffice.org. If not, see 23 * <http://www.openoffice.org/license.html> 24 * for a copy of the LGPLv3 License. 25 * 26 ************************************************************************/ 27 28 // MARKER(update_precomp.py): autogen include statement, do not remove 29 #include "precompiled_sal.hxx" 30 31 /* TODO! This file should not be called textenc.c, because it is not the 32 implementation of rtl/textenc.h. Rather, it should be called 33 gettextencodingdata.c. */ 34 #include "gettextencodingdata.h" 35 #include "tenchelp.h" 36 #include "rtl/textenc.h" 37 38 #ifndef INCLUDED_STDDEF_H 39 #include <stddef.h> 40 #define INCLUDED_STDDEF_H 41 #endif 42 43 #define NOTABUNI_START 0xFF 44 #define NOTABUNI_END 0x00 45 46 #define NOTABCHAR_START 0xFFFF 47 #define NOTABCHAR_END 0x0000 48 49 #define SAME8090UNI_START 0x80 50 #define SAME8090UNI_END 0x9F 51 static sal_uInt16 const aImpl8090SameToUniTab[SAME8090UNI_END 52 - SAME8090UNI_START 53 + 1] 54 = { 0x0080, 0x0081, 0x0082, 0x0083, 0x0084, 0x0085, 0x0086, 0x0087, /* 0x80 */ 55 0x0088, 0x0089, 0x008A, 0x008B, 0x008C, 0x008D, 0x008E, 0x008F, 56 0x0090, 0x0091, 0x0092, 0x0093, 0x0094, 0x0095, 0x0096, 0x0097, /* 0x90 */ 57 0x0098, 0x0099, 0x009A, 0x009B, 0x009C, 0x009D, 0x009E, 0x009F }; 58 59 #define SAME8090CHAR_START 0x0080 60 #define SAME8090CHAR_END 0x009F 61 static sal_uChar const aImpl8090SameToCharTab[SAME8090CHAR_END 62 - SAME8090CHAR_START 63 + 1] 64 = { 0x80, 0x81, 0x82, 0x83, 0x84, 0x85, 0x86, 0x87, /* 0x0080 */ 65 0x88, 0x89, 0x8A, 0x8B, 0x8C, 0x8D, 0x8E, 0x8F, 66 0x90, 0x91, 0x92, 0x93, 0x94, 0x95, 0x96, 0x97, /* 0x0090 */ 67 0x98, 0x99, 0x9A, 0x9B, 0x9C, 0x9D, 0x9E, 0x9F }; 68 69 #define SAMEA0FFCHAR_START 0x00A0 70 #define SAMEA0FFCHAR_END 0x00FF 71 static sal_uChar const aImplA0FFSameToCharTab[SAMEA0FFCHAR_END 72 - SAMEA0FFCHAR_START 73 + 1] 74 = { 0xA0, 0xA1, 0xA2, 0xA3, 0xA4, 0xA5, 0xA6, 0xA7, /* 0x00A0 */ 75 0xA8, 0xA9, 0xAA, 0xAB, 0xAC, 0xAD, 0xAE, 0xAF, 76 0xB0, 0xB1, 0xB2, 0xB3, 0xB4, 0xB5, 0xB6, 0xB7, /* 0x00B0 */ 77 0xB8, 0xB9, 0xBA, 0xBB, 0xBC, 0xBD, 0xBE, 0xBF, 78 0xC0, 0xC1, 0xC2, 0xC3, 0xC4, 0xC5, 0xC6, 0xC7, /* 0x00C0 */ 79 0xC8, 0xC9, 0xCA, 0xCB, 0xCC, 0xCD, 0xCE, 0xCF, 80 0xD0, 0xD1, 0xD2, 0xD3, 0xD4, 0xD5, 0xD6, 0xD7, /* 0x00D0 */ 81 0xD8, 0xD9, 0xDA, 0xDB, 0xDC, 0xDD, 0xDE, 0xDF, 82 0xE0, 0xE1, 0xE2, 0xE3, 0xE4, 0xE5, 0xE6, 0xE7, /* 0x00E0 */ 83 0xE8, 0xE9, 0xEA, 0xEB, 0xEC, 0xED, 0xEE, 0xEF, 84 0xF0, 0xF1, 0xF2, 0xF3, 0xF4, 0xF5, 0xF6, 0xF7, /* 0x00F0 */ 85 0xF8, 0xF9, 0xFA, 0xFB, 0xFC, 0xFD, 0xFE, 0xFF }; 86 87 static sal_uInt16 const aImplDoubleByteIdentifierTab[1] = { 0 }; 88 89 #include "tcvtarb1.tab" 90 #include "tcvteas1.tab" 91 #include "tcvtest1.tab" 92 #include "tcvtjp1.tab" 93 #include "tcvtjp2.tab" 94 #include "tcvtjp3.tab" 95 #include "tcvtjp4.tab" 96 #include "tcvtjp5.tab" 97 #include "tcvtjp6.tab" 98 #include "tcvtkr1.tab" 99 #include "tcvtkr2.tab" 100 #include "tcvtkr4.tab" 101 #include "tcvtkr5.tab" 102 #include "tcvtkr6.tab" 103 #include "tcvtlat1.tab" 104 #include "tcvtscn1.tab" 105 #include "tcvtscn2.tab" 106 #include "tcvtscn3.tab" 107 #include "tcvtscn4.tab" 108 #include "tcvtscn5.tab" 109 #include "tcvtscn6.tab" 110 #include "tcvtsym1.tab" 111 #include "tcvttcn1.tab" 112 #include "tcvttcn2.tab" 113 #include "tcvttcn6.tab" 114 #include "tcvtuni1.tab" 115 #include "convertiscii.tab" 116 117 #include "convertbig5hkscs.tab" 118 #include "converteuctw.tab" 119 #include "convertgb18030.tab" 120 #include "convertiso2022cn.tab" 121 #include "convertiso2022jp.tab" 122 #include "convertiso2022kr.tab" 123 #include "convertadobe.tab" 124 125 ImplTextEncodingData const * 126 Impl_getTextEncodingData(rtl_TextEncoding nEncoding) SAL_THROW_EXTERN_C() 127 { 128 static ImplTextEncodingData const * const aData[] 129 = { NULL, /* DONTKNOW */ 130 &aImplMS1252TextEncodingData, /* MS_1252 */ 131 &aImplAPPLEROMANTextEncodingData, /* APPLE_ROMAN */ 132 &aImplIBM437TextEncodingData, /* IBM_437 */ 133 &aImplIBM850TextEncodingData, /* IBM_850 */ 134 &aImplIBM860TextEncodingData, /* IBM_860 */ 135 &aImplIBM861TextEncodingData, /* IBM_861 */ 136 &aImplIBM863TextEncodingData, /* IBM_863 */ 137 &aImplIBM865TextEncodingData, /* IBM_865 */ 138 NULL, /* reserved (SYSTEM) */ 139 &aImplSYMBOLTextEncodingData, /* SYMBOL */ 140 &aImplUSASCIITextEncodingData, /* ASCII_US */ 141 &aImplISO88591TextEncodingData, /* ISO_8859_1 */ 142 &aImplISO88592TextEncodingData, /* ISO_8859_2 */ 143 &aImplISO88593TextEncodingData, /* ISO_8859_3 */ 144 &aImplISO88594TextEncodingData, /* ISO_8859_4 */ 145 &aImplISO88595TextEncodingData, /* ISO_8859_5 */ 146 &aImplISO88596TextEncodingData, /* ISO_8859_6 */ 147 &aImplISO88597TextEncodingData, /* ISO_8859_7 */ 148 &aImplISO88598TextEncodingData, /* ISO_8859_8 */ 149 &aImplISO88599TextEncodingData, /* ISO_8859_9 */ 150 &aImplISO885914TextEncodingData, /* ISO_8859_14 */ 151 &aImplISO885915TextEncodingData, /* ISO_8859_15 */ 152 &aImplIBM737TextEncodingData, /* IBM_737 */ 153 &aImplIBM775TextEncodingData, /* IBM_775 */ 154 &aImplIBM852TextEncodingData, /* IBM_852 */ 155 &aImplIBM855TextEncodingData, /* IBM_855 */ 156 &aImplIBM857TextEncodingData, /* IBM_857 */ 157 &aImplIBM862TextEncodingData, /* IBM_862 */ 158 &aImplIBM864TextEncodingData, /* IBM_864 */ 159 &aImplIBM866TextEncodingData, /* IBM_866 */ 160 &aImplIBM869TextEncodingData, /* IBM_869 */ 161 &aImplMS874TextEncodingData, /* MS_874 */ 162 &aImplMS1250TextEncodingData, /* MS_1250 */ 163 &aImplMS1251TextEncodingData, /* MS_1251 */ 164 &aImplMS1253TextEncodingData, /* MS_1253 */ 165 &aImplMS1254TextEncodingData, /* MS_1254 */ 166 &aImplMS1255TextEncodingData, /* MS_1255 */ 167 &aImplMS1256TextEncodingData, /* MS_1256 */ 168 &aImplMS1257TextEncodingData, /* MS_1257 */ 169 &aImplMS1258TextEncodingData, /* MS_1258 */ 170 NULL, /* TODO! APPLE_ARABIC */ 171 &aImplAPPLECENTEUROTextEncodingData, /* APPLE_CENTEURO */ 172 &aImplAPPLECROATIANTextEncodingData, /* APPLE_CROATIAN */ 173 &aImplAPPLECYRILLICTextEncodingData, /* APPLE_CYRILLIC */ 174 NULL, /* TODO! APPLE_DEVANAGARI */ 175 NULL, /* TODO! APPLE_FARSI */ 176 &aImplAPPLEGREEKTextEncodingData, /* APPLE_GREEK */ 177 NULL, /* TODO! APPLE_GUJARATI */ 178 NULL, /* TODO! APPLE_GURMUKHI */ 179 NULL, /* TODO! APPLE_HEBREW */ 180 &aImplAPPLEICELANDTextEncodingData, /* APPLE_ICELAND */ 181 &aImplAPPLEROMANIANTextEncodingData, /* APPLE_ROMANIAN */ 182 NULL, /* TODO! APPLE_THAI */ 183 &aImplAPPLETURKISHTextEncodingData, /* APPLE_TURKISH */ 184 &aImplAPPLEUKRAINIANTextEncodingData, /* APPLE_UKRAINIAN */ 185 &aImplAPPLECHINSIMPTextEncodingData, /* APPLE_CHINSIMP */ 186 &aImplAPPLECHINTRADTextEncodingData, /* APPLE_CHINTRAD */ 187 &aImplAPPLEJAPANESETextEncodingData, /* APPLE_JAPANESE */ 188 &aImplAPPLEKOREANTextEncodingData, /* APPLE_KOREAN */ 189 &aImplMS932TextEncodingData, /* MS_932 */ 190 &aImplMS936TextEncodingData, /* MS_936 */ 191 &aImplMS949TextEncodingData, /* MS_949 */ 192 &aImplMS950TextEncodingData, /* MS_950 */ 193 &aImplSJISTextEncodingData, /* SHIFT_JIS */ 194 &aImplGB2312TextEncodingData, /* GB_2312 */ 195 &aImplGBT12345TextEncodingData, /* GBT_12345 */ 196 &aImplGBKTextEncodingData, /* GBK */ 197 &aImplBIG5TextEncodingData, /* BIG5 */ 198 &aImplEUCJPTextEncodingData, /* EUC_JP */ 199 &aImplEUCCNTextEncodingData, /* EUC_CN */ 200 &aImplEucTwTextEncodingData, /* EUC_TW */ 201 &aImplIso2022JpTextEncodingData, /* ISO_2022_JP */ 202 &aImplIso2022CnTextEncodingData, /* ISO_2022_CN */ 203 &aImplKOI8RTextEncodingData, /* KOI8_R */ 204 &aImplUTF7TextEncodingData, /* UTF7 */ 205 &aImplUTF8TextEncodingData, /* UTF8 */ 206 &aImplISO885910TextEncodingData, /* ISO_8859_10 */ 207 &aImplISO885913TextEncodingData, /* ISO_8859_13 */ 208 &aImplEUCKRTextEncodingData, /* EUC_KR */ 209 &aImplIso2022KrTextEncodingData, /* ISO_2022_KR */ 210 &aImplJISX0201TextEncodingData, /* JIS_X_0201 */ 211 &aImplJISX0208TextEncodingData, /* JIS_X_0208 */ 212 &aImplJISX0212TextEncodingData, /* JIS_X_0212 */ 213 &aImplMS1361TextEncodingData, /* MS_1361 */ 214 &aImplGb18030TextEncodingData, /* GB_18030 */ 215 &aImplBig5HkscsTextEncodingData, /* BIG5_HKSCS */ 216 &aImplTis620TextEncodingData, /* TIS_620 */ 217 &aImplKoi8UTextEncodingData, /* KOI8_U */ 218 &aImplIsciiDevanagariTextEncodingData, /* ISCII_DEVANAGARI */ 219 &aImplJavaUtf8TextEncodingData, /* JAVA_UTF8 */ 220 &adobeStandardEncodingData, /* ADOBE_STANDARD */ 221 &adobeSymbolEncodingData, /* ADOBE_SYMBOL */ 222 &aImplPT154TextEncodingData, /* PT154 */ 223 &adobeDingbatsEncodingData }; /* ADOBE_DINGBATS */ 224 return 225 nEncoding < sizeof aData / sizeof aData[0] ? aData[nEncoding] : NULL; 226 } 227