/************************************************************** * * Licensed to the Apache Software Foundation (ASF) under one * or more contributor license agreements. See the NOTICE file * distributed with this work for additional information * regarding copyright ownership. The ASF licenses this file * to you under the Apache License, Version 2.0 (the * "License"); you may not use this file except in compliance * with the License. You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, * software distributed under the License is distributed on an * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY * KIND, either express or implied. See the License for the * specific language governing permissions and limitations * under the License. * *************************************************************/ #include "unichars.h" #include "osl/diagnose.h" #include "sal/types.h" int ImplIsNoncharacter(sal_uInt32 nUtf32) { /* All code points that are noncharacters, as of Unicode 3.1.1. */ return (nUtf32 >= 0xFDD0 && nUtf32 <= 0xFDEF) || (nUtf32 & 0xFFFF) >= 0xFFFE || nUtf32 > 0x10FFFF; } int ImplIsControlOrFormat(sal_uInt32 nUtf32) { /* All code points of , Version 3.1.1, that have a General Category of Cc (Other, Control) or Cf (Other, Format). */ return nUtf32 <= 0x001F || (nUtf32 >= 0x007F && nUtf32 <= 0x009F) || nUtf32 == 0x070F /* SYRIAC ABBREVIATION MARK */ || nUtf32 == 0x180B /* MONGOLIAN FREE VARIATION SELECTOR ONE */ || nUtf32 == 0x180C /* MONGOLIAN FREE VARIATION SELECTOR TWO */ || nUtf32 == 0x180D /* MONGOLIAN FREE VARIATION SELECTOR THREE */ || nUtf32 == 0x180E /* MONGOLIAN VOWEL SEPARATOR */ || nUtf32 == 0x200C /* ZERO WIDTH NON-JOINER */ || nUtf32 == 0x200D /* ZERO WIDTH JOINER */ || nUtf32 == 0x200E /* LEFT-TO-RIGHT MARK */ || nUtf32 == 0x200F /* RIGHT-TO-LEFT MARK */ || nUtf32 == 0x202A /* LEFT-TO-RIGHT EMBEDDING */ || nUtf32 == 0x202B /* RIGHT-TO-LEFT EMBEDDING */ || nUtf32 == 0x202C /* POP DIRECTIONAL FORMATTING */ || nUtf32 == 0x202D /* LEFT-TO-RIGHT OVERRIDE */ || nUtf32 == 0x202E /* RIGHT-TO-LEFT OVERRIDE */ || nUtf32 == 0x206A /* INHIBIT SYMMETRIC SWAPPING */ || nUtf32 == 0x206B /* ACTIVATE SYMMETRIC SWAPPING */ || nUtf32 == 0x206C /* INHIBIT ARABIC FORM SHAPING */ || nUtf32 == 0x206D /* ACTIVATE ARABIC FORM SHAPING */ || nUtf32 == 0x206E /* NATIONAL DIGIT SHAPES */ || nUtf32 == 0x206F /* NOMINAL DIGIT SHAPES */ || nUtf32 == 0xFEFF /* ZERO WIDTH NO-BREAK SPACE */ || nUtf32 == 0xFFF9 /* INTERLINEAR ANNOTATION ANCHOR */ || nUtf32 == 0xFFFA /* INTERLINEAR ANNOTATION SEPARATOR */ || nUtf32 == 0xFFFB /* INTERLINEAR ANNOTATION TERMINATOR */ || nUtf32 == 0x1D173 /* MUSICAL SYMBOL BEGIN BEAM */ || nUtf32 == 0x1D174 /* MUSICAL SYMBOL END BEAM */ || nUtf32 == 0x1D175 /* MUSICAL SYMBOL BEGIN TIE */ || nUtf32 == 0x1D176 /* MUSICAL SYMBOL END TIE */ || nUtf32 == 0x1D177 /* MUSICAL SYMBOL BEGIN SLUR */ || nUtf32 == 0x1D178 /* MUSICAL SYMBOL END SLUR */ || nUtf32 == 0x1D179 /* MUSICAL SYMBOL BEGIN PHRASE */ || nUtf32 == 0x1D17A /* MUSICAL SYMBOL END PHRASE */ || nUtf32 == 0xE0001 /* LANGUAGE TAG */ || (nUtf32 >= 0xE0020 && nUtf32 <= 0xE007F); } int ImplIsHighSurrogate(sal_uInt32 nUtf32) { /* All code points that are high-surrogates, as of Unicode 3.1.1. */ return nUtf32 >= 0xD800 && nUtf32 <= 0xDBFF; } int ImplIsLowSurrogate(sal_uInt32 nUtf32) { /* All code points that are low-surrogates, as of Unicode 3.1.1. */ return nUtf32 >= 0xDC00 && nUtf32 <= 0xDFFF; } int ImplIsPrivateUse(sal_uInt32 nUtf32) { /* All code points of , Version 3.1.1, that have a General Category of Co (Other, Private Use). */ return (nUtf32 >= 0xE000 && nUtf32 <= 0xF8FF) || (nUtf32 >= 0xF0000 && nUtf32 <= 0xFFFFD) || (nUtf32 >= 0x100000 && nUtf32 <= 0x10FFFD); } int ImplIsZeroWidth(sal_uInt32 nUtf32) { /* All code points of , Version 3.1.1, that have "ZERO WIDTH" in their Character name. */ return nUtf32 == 0x200B /* ZERO WIDTH SPACE */ || nUtf32 == 0x200C /* ZERO WIDTH NON-JOINER */ || nUtf32 == 0x200D /* ZERO WIDTH JOINER */ || nUtf32 == 0xFEFF; /* ZEOR WIDTH NO-BREAK SPACE */ } sal_uInt32 ImplGetHighSurrogate(sal_uInt32 nUtf32) { OSL_ENSURE(nUtf32 >= 0x10000, "specification violation"); return ((nUtf32 - 0x10000) >> 10) | 0xD800; } sal_uInt32 ImplGetLowSurrogate(sal_uInt32 nUtf32) { OSL_ENSURE(nUtf32 >= 0x10000, "specification violation"); return ((nUtf32 - 0x10000) & 0x3FF) | 0xDC00; } sal_uInt32 ImplCombineSurrogates(sal_uInt32 nHigh, sal_uInt32 nLow) { OSL_ENSURE(ImplIsHighSurrogate(nHigh) && ImplIsLowSurrogate(nLow), "specification violation"); return (((nHigh & 0x3FF) << 10) | (nLow & 0x3FF)) + 0x10000; }