summary refs log tree commit diff stats
path: root/i18npool/inc/cclass_unicode.hxx
diff options
context:
space:
mode:
author: Daniel Baumann <daniel.baumann@progress-linux.org> 2024-04-15 05:54:39 +0000
committer: Daniel Baumann <daniel.baumann@progress-linux.org> 2024-04-15 05:54:39 +0000
commit: 267c6f2ac71f92999e969232431ba04678e7437e (patch)
tree: 358c9467650e1d0a1d7227a21dac2e3d08b622b2 /i18npool/inc/cclass_unicode.hxx
parent: Initial commit. (diff)
downloadlibreoffice-267c6f2ac71f92999e969232431ba04678e7437e.tar.xz
libreoffice-267c6f2ac71f92999e969232431ba04678e7437e.zip
Adding upstream version 4:24.2.0.upstream/4%24.2.0
Signed-off-by: Daniel Baumann <daniel.baumann@progress-linux.org>
Diffstat (limited to 'i18npool/inc/cclass_unicode.hxx')
-rw-r--r-- i18npool/inc/cclass_unicode.hxx 187
1 files changed, 187 insertions, 0 deletions
diff --git a/i18npool/inc/cclass_unicode.hxx b/i18npool/inc/cclass_unicode.hxx
new file mode 100644
index 0000000000..3a5f28f124
--- /dev/null
+++ b/i18npool/inc/cclass_unicode.hxx
@@ -0,0 +1,187 @@
+/* -*- Mode: C++; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4 -*- */
+/*
+ * This file is part of the LibreOffice project.
+ *
+ * This Source Code Form is subject to the terms of the Mozilla Public
+ * License, v. 2.0. If a copy of the MPL was not distributed with this
+ * file, You can obtain one at http://mozilla.org/MPL/2.0/.
+ *
+ * This file incorporates work covered by the following license notice:
+ *
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed
+ * with this work for additional information regarding copyright
+ * ownership. The ASF licenses this file to you under the Apache
+ * License, Version 2.0 (the "License"); you may not use this file
+ * except in compliance with the License. You may obtain a copy of
+ * the License at http://www.apache.org/licenses/LICENSE-2.0 .
+ */
+#pragma once
+
+#include <com/sun/star/i18n/XCharacterClassification.hpp>
+#include <cppuhelper/implbase.hxx>
+#include <com/sun/star/lang/XServiceInfo.hpp>
+#include <rtl/ref.hxx>
+
+#include <o3tl/typed_flags_set.hxx>
+#include <memory>
+
+namespace com::sun::star::uno { class XComponentContext; }
+namespace com::sun::star::i18n { class XNativeNumberSupplier; }
+namespace com::sun::star::i18n { class XLocaleData5; }
+namespace i18npool { class Transliteration_casemapping; }
+
+
+/// Flag values of the parser tables: every enumerator except ILLEGAL is one distinct bit of a sal_uInt32.
+enum class ParserFlags : sal_uInt32 {
+ ILLEGAL = 0x00000000, // no bit set
+ CHAR = 0x00000001, // bits 0..14 (0x00007fff) are assigned contiguously from here to VALUE_DIGIT
+ CHAR_BOOL = 0x00000002,
+ CHAR_WORD = 0x00000004,
+ CHAR_VALUE = 0x00000008,
+ CHAR_STRING = 0x00000010,
+ CHAR_DONTCARE = 0x00000020,
+ BOOL = 0x00000040,
+ WORD = 0x00000080,
+ WORD_SEP = 0x00000100,
+ VALUE = 0x00000200,
+ VALUE_SEP = 0x00000400,
+ VALUE_EXP = 0x00000800,
+ VALUE_SIGN = 0x00001000,
+ VALUE_EXP_VALUE = 0x00002000,
+ VALUE_DIGIT = 0x00004000, // last low bit in use; bits 15..28 are unassigned
+ NAME_SEP = 0x20000000, // the three top bits (0xe0000000) start here
+ STRING_SEP = 0x40000000,
+ EXCLUDED = 0x80000000, // highest bit of the underlying sal_uInt32
+};
+namespace o3tl { // the specialisation has to be written inside o3tl, the namespace of typed_flags
+ template<> struct typed_flags<ParserFlags> : is_typed_flags<ParserFlags, 0xe0007fff> {}; // mask 0xe0007fff == OR of all ParserFlags enumerators (bits 0-14 and 29-31); keep in sync when adding a flag
+}
+
+
+namespace i18npool {
+
+class cclass_Unicode final : public cppu::WeakImplHelper < css::i18n::XCharacterClassification, css::lang::XServiceInfo >
+{ // UNO implementation object for XCharacterClassification and XServiceInfo; declared final, so it is not a base class
+public:
+ cclass_Unicode(css::uno::Reference < css::uno::XComponentContext > xContext ); // takes the context reference by value; NOTE(review): single-argument and not explicit - confirm implicit conversion is intended
+ virtual ~cclass_Unicode() override;
+ // XCharacterClassification overrides; nPos/nCount select a range inside Text - see the UNO interface for the exact contract
+ virtual OUString SAL_CALL toUpper( const OUString& Text, sal_Int32 nPos, sal_Int32 nCount,
+ const css::lang::Locale& rLocale ) override;
+ virtual OUString SAL_CALL toLower( const OUString& Text, sal_Int32 nPos, sal_Int32 nCount,
+ const css::lang::Locale& rLocale ) override;
+ virtual OUString SAL_CALL toTitle( const OUString& Text, sal_Int32 nPos, sal_Int32 nCount,
+ const css::lang::Locale& rLocale ) override;
+ virtual sal_Int16 SAL_CALL getType( const OUString& Text, sal_Int32 nPos ) override;
+ virtual sal_Int16 SAL_CALL getCharacterDirection( const OUString& Text, sal_Int32 nPos ) override;
+ virtual sal_Int16 SAL_CALL getScript( const OUString& Text, sal_Int32 nPos ) override;
+ virtual sal_Int32 SAL_CALL getCharacterType( const OUString& text, sal_Int32 nPos,
+ const css::lang::Locale& rLocale ) override;
+ virtual sal_Int32 SAL_CALL getStringType( const OUString& text, sal_Int32 nPos, sal_Int32 nCount,
+ const css::lang::Locale& rLocale ) override;
+ virtual css::i18n::ParseResult SAL_CALL parseAnyToken( const OUString& Text, sal_Int32 nPos,
+ const css::lang::Locale& rLocale, sal_Int32 nStartCharFlags, const OUString& userDefinedCharactersStart,
+ sal_Int32 nContCharFlags, const OUString& userDefinedCharactersCont ) override;
+ virtual css::i18n::ParseResult SAL_CALL parsePredefinedToken( sal_Int32 nTokenType, const OUString& Text,
+ sal_Int32 nPos, const css::lang::Locale& rLocale, sal_Int32 nStartCharFlags,
+ const OUString& userDefinedCharactersStart, sal_Int32 nContCharFlags,
+ const OUString& userDefinedCharactersCont ) override;
+
+ // XServiceInfo
+ virtual OUString SAL_CALL getImplementationName() override;
+ virtual sal_Bool SAL_CALL supportsService(const OUString& ServiceName) override;
+ virtual css::uno::Sequence< OUString > SAL_CALL getSupportedServiceNames() override;
+
+private:
+ // Case conversion is performance sensitive: instead of sharing one transliteration object and
+ // switching its state under a lock, keep a separate instance for each of upper, lower and title case.
+ rtl::Reference<Transliteration_casemapping> transToUpper;
+ rtl::Reference<Transliteration_casemapping> transToLower;
+ rtl::Reference<Transliteration_casemapping> transToTitle;
+
+// --- parser specific (implemented in cclass_unicode_parser.cxx) ---
+
+ enum ScanState // scanner states; each "->" comment lists the states that may follow the one on that line
+ {
+ ssGetChar, // initial state; -> ssBounce, ssGetValue, ssRewindFromValue, ssGetWord, ssGetWordFirstChar, ssGetString, ssGetBool, ssStop
+ ssGetValue, // -> ssBounce, ssRewindFromValue, ssStopBack, ssGetWord
+ ssGetWord, // -> ssBounce, ssStop, ssStopBack
+ ssGetWordFirstChar, // -> ssBounce, ssGetWord, ssStop, ssStopBack
+ ssGetString, // -> ssBounce, ssStop
+ ssGetBool, // -> ssBounce, ssStop, ssStopBack
+ ssRewindFromValue, // -> ssBounce, ssGetValue, ssGetWord, ssGetWordFirstChar, ssGetString, ssGetBool, ssStop, ssIgnoreLeadingInRewind
+ ssIgnoreLeadingInRewind, // -> ssBounce, ssGetValue, ssRewindFromValue, ssGetWord, ssGetWordFirstChar, ssGetString, ssGetBool, ssStop
+ ssStopBack, // -> ssStop
+ ssBounce, // -> ssStopBack
+ ssStop // no successor listed; presumably the terminal state
+ };
+
+ static const sal_uInt8 nDefCnt; // presumably the number of entries in pDefaultParserTable - confirm in the .cxx
+ static const ParserFlags pDefaultParserTable[]; // defined out of line; size not visible in this header
+ static const sal_Int32 pParseTokensType[]; // defined out of line; size not visible in this header
+
+ /// Looks for c in pStr and reports if and where it occurs (presumably nullptr when absent - confirm in the .cxx)
+ static const sal_Unicode* StrChr( const sal_Unicode* pStr, sal_uInt32 c );
+
+
+ css::uno::Reference < css::uno::XComponentContext > m_xContext;
+
+ /// the members below are used for the parser only
+ css::lang::Locale aParserLocale;
+ css::uno::Reference < css::i18n::XLocaleData5 > mxLocaleData;
+ css::uno::Reference < css::i18n::XNativeNumberSupplier > xNatNumSup;
+ OUString aStartChars;
+ OUString aContChars;
+ std::unique_ptr<ParserFlags[]> pTable; // owning flag arrays; see initParserTable() / destroyParserTable() declared further down
+ std::unique_ptr<ParserFlags[]> pStart;
+ std::unique_ptr<ParserFlags[]> pCont;
+ sal_Int32 nStartTypes;
+ sal_Int32 nContTypes;
+ sal_Unicode cGroupSep;
+ sal_Unicode cDecimalSep;
+ sal_Unicode cDecimalSepAlt;
+
+ /// Get corresponding KParseTokens flag for a character c; isFirst presumably selects start-character rules - confirm
+ static sal_Int32 getParseTokensType(sal_uInt32 c, bool isFirst);
+
+ /// Access parser table flags for character c in scanner state eState (non-const, unlike getFlagsExtended).
+ ParserFlags getFlags(sal_uInt32 c, ScanState eState);
+
+ /// Access parser flags via International and special definitions; const, so it does not modify this object.
+ ParserFlags getFlagsExtended(sal_uInt32 c, ScanState eState) const;
+
+ /// Access parser table flags for user defined start characters.
+ ParserFlags getStartCharsFlags( sal_uInt32 c );
+
+ /// Access parser table flags for user defined continuation characters. NOTE(review): takes sal_Unicode while getStartCharsFlags takes sal_uInt32 - confirm this asymmetry is intended.
+ ParserFlags getContCharsFlags( sal_Unicode c );
+
+ /// Setup parser table. Calls initParserTable() only if needed; takes the same five arguments as initParserTable().
+ void setupParserTable( const css::lang::Locale& rLocale, sal_Int32 startCharTokenType,
+ const OUString& userDefinedCharactersStart, sal_Int32 contCharTokenType,
+ const OUString& userDefinedCharactersCont );
+
+ /// Init parser table for the given locale, start/continuation token types and user defined characters.
+ void initParserTable( const css::lang::Locale& rLocale, sal_Int32 startCharTokenType,
+ const OUString& userDefinedCharactersStart, sal_Int32 contCharTokenType,
+ const OUString& userDefinedCharactersCont );
+
+ /// Destroy parser table.
+ void destroyParserTable();
+
+ /// Parse rText starting at nPos and write the outcome into r; nTokenType defaults to all bits set.
+ void parseText( css::i18n::ParseResult& r, const OUString& rText, sal_Int32 nPos,
+ sal_Int32 nTokenType = 0xffffffff ); // NOTE(review): unsigned literal converted to sal_Int32 (i.e. -1) - intentional "all token types" mask, presumably
+
+ /// Setup International class, new'ed only if different from existing.
+ void setupInternational( const css::lang::Locale& rLocale );
+
+ /// Implementation of getCharacterType() for one single character; nPos is passed by pointer, presumably advanced by increment - confirm. NOTE(review): std::u16string_view needs <string_view>, which is not among the includes visible here.
+ static sal_Int32 getCharType( std::u16string_view Text, sal_Int32 *nPos, sal_Int32 increment);
+
+};
+
+}
+
+/* vim:set shiftwidth=4 softtabstop=4 expandtab: */