From 36d22d82aa202bb199967e9512281e9a53db42c9 Mon Sep 17 00:00:00 2001 From: Daniel Baumann Date: Sun, 7 Apr 2024 21:33:14 +0200 Subject: Adding upstream version 115.7.0esr. Signed-off-by: Daniel Baumann --- intl/icu/source/i18n/uspoof_build.cpp | 108 ++++++++++++++++++++++++++++++++++ 1 file changed, 108 insertions(+) create mode 100644 intl/icu/source/i18n/uspoof_build.cpp (limited to 'intl/icu/source/i18n/uspoof_build.cpp') diff --git a/intl/icu/source/i18n/uspoof_build.cpp b/intl/icu/source/i18n/uspoof_build.cpp new file mode 100644 index 0000000000..098d272e19 --- /dev/null +++ b/intl/icu/source/i18n/uspoof_build.cpp @@ -0,0 +1,108 @@ +// © 2016 and later: Unicode, Inc. and others. +// License & terms of use: http://www.unicode.org/copyright.html +/* + *************************************************************************** + * Copyright (C) 2008-2015, International Business Machines Corporation + * and others. All Rights Reserved. + *************************************************************************** + * file name: uspoof_build.cpp + * encoding: UTF-8 + * tab size: 8 (not used) + * indentation:4 + * + * created on: 2008 Dec 8 + * created by: Andy Heninger + * + * Unicode Spoof Detection Data Builder + * Builder-related functions are kept in separate files so that applications not needing + * the builder can more easily exclude them, typically by means of static linking. + * + * There are three relatively independent sets of Spoof data, + * Confusables, + * Whole Script Confusables + * ID character extensions. + * + * The data tables for each are built separately, each from its own definitions + */ + +#include "unicode/utypes.h" +#include "unicode/uspoof.h" +#include "unicode/unorm.h" +#include "unicode/uregex.h" +#include "unicode/ustring.h" +#include "cmemory.h" +#include "uspoof_impl.h" +#include "uhash.h" +#include "uvector.h" +#include "uassert.h" +#include "uarrsort.h" +#include "uspoof_conf.h" + +#if !UCONFIG_NO_NORMALIZATION + +U_NAMESPACE_USE + +// Defined in uspoof.cpp, initializes file-static variables. +U_CFUNC void uspoof_internalInitStatics(UErrorCode *status); + +// The main data building function + +U_CAPI USpoofChecker * U_EXPORT2 +uspoof_openFromSource(const char *confusables, int32_t confusablesLen, + const char* /*confusablesWholeScript*/, int32_t /*confusablesWholeScriptLen*/, + int32_t *errorType, UParseError *pe, UErrorCode *status) { + uspoof_internalInitStatics(status); + if (U_FAILURE(*status)) { + return nullptr; + } +#if UCONFIG_NO_REGULAR_EXPRESSIONS + *status = U_UNSUPPORTED_ERROR; + return nullptr; +#else + if (errorType!=nullptr) { + *errorType = 0; + } + if (pe != nullptr) { + pe->line = 0; + pe->offset = 0; + pe->preContext[0] = 0; + pe->postContext[0] = 0; + } + + // Set up a shell of a spoof detector, with empty data. + SpoofData *newSpoofData = new SpoofData(*status); + + if (newSpoofData == nullptr) { + *status = U_MEMORY_ALLOCATION_ERROR; + return nullptr; + } + + if (U_FAILURE(*status)) { + delete newSpoofData; + return nullptr; + } + SpoofImpl *This = new SpoofImpl(newSpoofData, *status); + + if (This == nullptr) { + *status = U_MEMORY_ALLOCATION_ERROR; + delete newSpoofData; // explicit delete as the destructor for SpoofImpl won't be called. + return nullptr; + } + + if (U_FAILURE(*status)) { + delete This; // no delete for newSpoofData, as the SpoofImpl destructor will delete it. + return nullptr; + } + + // Compile the binary data from the source (text) format. + ConfusabledataBuilder::buildConfusableData(This, confusables, confusablesLen, errorType, pe, *status); + + if (U_FAILURE(*status)) { + delete This; + This = nullptr; + } + return (USpoofChecker *)This; +#endif // UCONFIG_NO_REGULAR_EXPRESSIONS +} + +#endif -- cgit v1.2.3