Line data Source code
1 : /* -*- Mode: C++; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4 -*- */
2 : /*
3 : * This file is part of the LibreOffice project.
4 : *
5 : * This Source Code Form is subject to the terms of the Mozilla Public
6 : * License, v. 2.0. If a copy of the MPL was not distributed with this
7 : * file, You can obtain one at http://mozilla.org/MPL/2.0/.
8 : *
9 : * This file incorporates work covered by the following license notice:
10 : *
11 : * Licensed to the Apache Software Foundation (ASF) under one or more
12 : * contributor license agreements. See the NOTICE file distributed
13 : * with this work for additional information regarding copyright
14 : * ownership. The ASF licenses this file to you under the Apache
15 : * License, Version 2.0 (the "License"); you may not use this file
16 : * except in compliance with the License. You may obtain a copy of
17 : * the License at http://www.apache.org/licenses/LICENSE-2.0 .
18 : */
19 :
20 : #include "sal/config.h"
21 : #include "sal/types.h"
22 : #include "unichars.hxx"
23 :
24 4 : bool ImplIsControlOrFormat(sal_uInt32 nUtf32)
25 : {
26 : // All code points of
27 : // <http://www.unicode.org/Public/UNIDATA/UnicodeData.txt>, Version 3.1.1,
28 : // that have a General Category of Cc (Other, Control) or Cf (Other,
29 : // Format):
30 : return nUtf32 <= 0x001F
31 4 : || (nUtf32 >= 0x007F && nUtf32 <= 0x009F)
32 4 : || nUtf32 == 0x070F // SYRIAC ABBREVIATION MARK
33 4 : || nUtf32 == 0x180B // MONGOLIAN FREE VARIATION SELECTOR ONE
34 4 : || nUtf32 == 0x180C // MONGOLIAN FREE VARIATION SELECTOR TWO
35 4 : || nUtf32 == 0x180D // MONGOLIAN FREE VARIATION SELECTOR THREE
36 4 : || nUtf32 == 0x180E // MONGOLIAN VOWEL SEPARATOR
37 4 : || nUtf32 == 0x200C // ZERO WIDTH NON-JOINER
38 4 : || nUtf32 == 0x200D // ZERO WIDTH JOINER
39 4 : || nUtf32 == 0x200E // LEFT-TO-RIGHT MARK
40 4 : || nUtf32 == 0x200F // RIGHT-TO-LEFT MARK
41 4 : || nUtf32 == 0x202A // LEFT-TO-RIGHT EMBEDDING
42 4 : || nUtf32 == 0x202B // RIGHT-TO-LEFT EMBEDDING
43 4 : || nUtf32 == 0x202C // POP DIRECTIONAL FORMATTING
44 4 : || nUtf32 == 0x202D // LEFT-TO-RIGHT OVERRIDE
45 4 : || nUtf32 == 0x202E // RIGHT-TO-LEFT OVERRIDE
46 4 : || nUtf32 == 0x206A // INHIBIT SYMMETRIC SWAPPING
47 4 : || nUtf32 == 0x206B // ACTIVATE SYMMETRIC SWAPPING
48 4 : || nUtf32 == 0x206C // INHIBIT ARABIC FORM SHAPING
49 4 : || nUtf32 == 0x206D // ACTIVATE ARABIC FORM SHAPING
50 4 : || nUtf32 == 0x206E // NATIONAL DIGIT SHAPES
51 4 : || nUtf32 == 0x206F // NOMINAL DIGIT SHAPES
52 4 : || nUtf32 == 0xFEFF // ZERO WIDTH NO-BREAK SPACE
53 4 : || nUtf32 == 0xFFF9 // INTERLINEAR ANNOTATION ANCHOR
54 4 : || nUtf32 == 0xFFFA // INTERLINEAR ANNOTATION SEPARATOR
55 4 : || nUtf32 == 0xFFFB // INTERLINEAR ANNOTATION TERMINATOR
56 4 : || nUtf32 == 0x1D173 // MUSICAL SYMBOL BEGIN BEAM
57 4 : || nUtf32 == 0x1D174 // MUSICAL SYMBOL END BEAM
58 4 : || nUtf32 == 0x1D175 // MUSICAL SYMBOL BEGIN TIE
59 4 : || nUtf32 == 0x1D176 // MUSICAL SYMBOL END TIE
60 4 : || nUtf32 == 0x1D177 // MUSICAL SYMBOL BEGIN SLUR
61 4 : || nUtf32 == 0x1D178 // MUSICAL SYMBOL END SLUR
62 4 : || nUtf32 == 0x1D179 // MUSICAL SYMBOL BEGIN PHRASE
63 4 : || nUtf32 == 0x1D17A // MUSICAL SYMBOL END PHRASE
64 4 : || nUtf32 == 0xE0001 // LANGUAGE TAG
65 8 : || (nUtf32 >= 0xE0020 && nUtf32 <= 0xE007F);
66 : }
67 :
68 4 : bool ImplIsPrivateUse(sal_uInt32 nUtf32)
69 : {
70 : // All code points of
71 : // <http://www.unicode.org/Public/UNIDATA/UnicodeData.txt>, Version 3.1.1,
72 : // that have a General Category of Co (Other, Private Use):
73 0 : return (nUtf32 >= 0xE000 && nUtf32 <= 0xF8FF)
74 4 : || (nUtf32 >= 0xF0000 && nUtf32 <= 0xFFFFD)
75 8 : || (nUtf32 >= 0x100000 && nUtf32 <= 0x10FFFD);
76 : }
77 :
78 4 : bool ImplIsZeroWidth(sal_uInt32 nUtf32)
79 : {
80 : // All code points of
81 : // <http://www.unicode.org/Public/UNIDATA/UnicodeData.txt>, Version 3.1.1,
82 : // that have "ZERO WIDTH" in their Character name:
83 : return nUtf32 == 0x200B // ZERO WIDTH SPACE
84 4 : || nUtf32 == 0x200C // ZERO WIDTH NON-JOINER
85 4 : || nUtf32 == 0x200D // ZERO WIDTH JOINER
86 8 : || nUtf32 == 0xFEFF; // ZEOR WIDTH NO-BREAK SPACE
87 : }
88 :
89 : /* vim:set shiftwidth=4 softtabstop=4 expandtab: */
|