summary | refs | log | tree | commit | diff | stats
path: root/sal/textenc/unichars.cxx
diff options
context:
space:
mode:
author: Daniel Baumann <daniel.baumann@progress-linux.org> 2024-04-07 09:06:44 +0000
committer: Daniel Baumann <daniel.baumann@progress-linux.org> 2024-04-07 09:06:44 +0000
commit: ed5640d8b587fbcfed7dd7967f3de04b37a76f26 (patch)
tree: 7a5f7c6c9d02226d7471cb3cc8fbbf631b415303 /sal/textenc/unichars.cxx
parent: Initial commit. (diff)
download: libreoffice-upstream/4%7.4.7.tar.xz
libreoffice-upstream/4%7.4.7.zip
Adding upstream version 4:7.4.7. [upstream/4%7.4.7] [upstream]
Signed-off-by: Daniel Baumann <daniel.baumann@progress-linux.org>
Diffstat (limited to '')
-rw-r--r-- sal/textenc/unichars.cxx 87
1 files changed, 87 insertions, 0 deletions
diff --git a/sal/textenc/unichars.cxx b/sal/textenc/unichars.cxx
new file mode 100644
index 000000000..abd6945cf
--- /dev/null
+++ b/sal/textenc/unichars.cxx
@@ -0,0 +1,87 @@
+/* -*- Mode: C++; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4 -*- */
+/*
+ * This file is part of the LibreOffice project.
+ *
+ * This Source Code Form is subject to the terms of the Mozilla Public
+ * License, v. 2.0. If a copy of the MPL was not distributed with this
+ * file, You can obtain one at http://mozilla.org/MPL/2.0/.
+ *
+ * This file incorporates work covered by the following license notice:
+ *
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed
+ * with this work for additional information regarding copyright
+ * ownership. The ASF licenses this file to you under the Apache
+ * License, Version 2.0 (the "License"); you may not use this file
+ * except in compliance with the License. You may obtain a copy of
+ * the License at http://www.apache.org/licenses/LICENSE-2.0 .
+ */
+
+#include <sal/config.h>
+#include <sal/types.h>
+#include "unichars.hxx"
+
+bool ImplIsControlOrFormat(sal_uInt32 nUtf32)
+{
+    // Matches nUtf32 against the code points that
+    // <http://www.unicode.org/Public/UNIDATA/UnicodeData.txt>, Version 3.1.1,
+    // lists with a General Category of Cc (Other, Control) or Cf (Other,
+    // Format).  Neighbouring code points are tested as one inclusive range;
+    // the comment above each test names the characters it covers.
+
+    return
+        // U+0000..U+001F
+        nUtf32 <= 0x001F
+        // U+007F..U+009F
+        || (nUtf32 >= 0x007F && nUtf32 <= 0x009F)
+        // SYRIAC ABBREVIATION MARK
+        || nUtf32 == 0x070F
+        // MONGOLIAN FREE VARIATION SELECTOR ONE, TWO and THREE,
+        // MONGOLIAN VOWEL SEPARATOR
+        || (nUtf32 >= 0x180B && nUtf32 <= 0x180E)
+        // ZERO WIDTH NON-JOINER, ZERO WIDTH JOINER, LEFT-TO-RIGHT MARK,
+        // RIGHT-TO-LEFT MARK
+        || (nUtf32 >= 0x200C && nUtf32 <= 0x200F)
+        // LEFT-TO-RIGHT EMBEDDING, RIGHT-TO-LEFT EMBEDDING,
+        // POP DIRECTIONAL FORMATTING, LEFT-TO-RIGHT OVERRIDE,
+        // RIGHT-TO-LEFT OVERRIDE
+        || (nUtf32 >= 0x202A && nUtf32 <= 0x202E)
+        // INHIBIT SYMMETRIC SWAPPING, ACTIVATE SYMMETRIC SWAPPING,
+        // INHIBIT ARABIC FORM SHAPING, ACTIVATE ARABIC FORM SHAPING,
+        // NATIONAL DIGIT SHAPES, NOMINAL DIGIT SHAPES
+        || (nUtf32 >= 0x206A && nUtf32 <= 0x206F)
+        // ZERO WIDTH NO-BREAK SPACE
+        || nUtf32 == 0xFEFF
+        // INTERLINEAR ANNOTATION ANCHOR, INTERLINEAR ANNOTATION SEPARATOR,
+        // INTERLINEAR ANNOTATION TERMINATOR
+        || (nUtf32 >= 0xFFF9 && nUtf32 <= 0xFFFB)
+        // MUSICAL SYMBOL BEGIN BEAM, END BEAM, BEGIN TIE, END TIE,
+        // BEGIN SLUR, END SLUR, BEGIN PHRASE, END PHRASE
+        || (nUtf32 >= 0x1D173 && nUtf32 <= 0x1D17A)
+        // LANGUAGE TAG
+        || nUtf32 == 0xE0001
+        // U+E0020..U+E007F
+        || (nUtf32 >= 0xE0020 && nUtf32 <= 0xE007F);
+}
+
+bool ImplIsPrivateUse(sal_uInt32 nUtf32)
+{
+    // General Category Co (Other, Private Use) according to Version 3.1.1 of
+    // <http://www.unicode.org/Public/UNIDATA/UnicodeData.txt>.
+    if (nUtf32 < 0xF0000) // below the two upper ranges: only U+E000..U+F8FF counts
+        return nUtf32 >= 0xE000 && nUtf32 <= 0xF8FF;
+    return nUtf32 <= 0xFFFFD || (nUtf32 >= 0x100000 && nUtf32 <= 0x10FFFD);
+}
+
+bool ImplIsZeroWidth(sal_uInt32 nUtf32)
+{
+    // Code points whose Character name contains "ZERO WIDTH" in Version 3.1.1
+    // of <http://www.unicode.org/Public/UNIDATA/UnicodeData.txt>.
+    // U+200B ZERO WIDTH SPACE, U+200C ZERO WIDTH NON-JOINER and
+    // U+200D ZERO WIDTH JOINER are adjacent, so one range test covers them.
+    if (nUtf32 >= 0x200B && nUtf32 <= 0x200D)
+        return true;
+    return nUtf32 == 0xFEFF; // ZERO WIDTH NO-BREAK SPACE
+}
+
+/* vim:set shiftwidth=4 softtabstop=4 expandtab: */