aboutsummaryrefslogtreecommitdiffstats
path: root/contrib/libs/icu/i18n/uspoof_build.cpp
diff options
context:
space:
mode:
authorvvvv <vvvv@yandex-team.ru>2022-03-03 23:09:11 +0300
committervvvv <vvvv@yandex-team.ru>2022-03-03 23:09:11 +0300
commit8dbdbab054b6eb352cfffdad09991052008062fc (patch)
tree71befed92d327f2cc409bff4986ec510d0530d92 /contrib/libs/icu/i18n/uspoof_build.cpp
parented3f4e21f3a3837059607ec2606e1dc910269ac0 (diff)
downloadydb-8dbdbab054b6eb352cfffdad09991052008062fc.tar.gz
YQL-13710 try to switch to new shiny PG
ref:2bed0445c8e8bd6c575883632adf19445f0a72a7
Diffstat (limited to 'contrib/libs/icu/i18n/uspoof_build.cpp')
-rw-r--r--contrib/libs/icu/i18n/uspoof_build.cpp108
1 files changed, 108 insertions, 0 deletions
diff --git a/contrib/libs/icu/i18n/uspoof_build.cpp b/contrib/libs/icu/i18n/uspoof_build.cpp
new file mode 100644
index 0000000000..192fb9a688
--- /dev/null
+++ b/contrib/libs/icu/i18n/uspoof_build.cpp
@@ -0,0 +1,108 @@
+// © 2016 and later: Unicode, Inc. and others.
+// License & terms of use: http://www.unicode.org/copyright.html
+/*
+ ***************************************************************************
+ * Copyright (C) 2008-2015, International Business Machines Corporation
+ * and others. All Rights Reserved.
+ ***************************************************************************
+ * file name: uspoof_build.cpp
+ * encoding: UTF-8
+ * tab size: 8 (not used)
+ * indentation:4
+ *
+ * created on: 2008 Dec 8
+ * created by: Andy Heninger
+ *
+ * Unicode Spoof Detection Data Builder
+ * Builder-related functions are kept in separate files so that applications not needing
+ * the builder can more easily exclude them, typically by means of static linking.
+ *
+ * There are three relatively independent sets of Spoof data,
+ * Confusables,
+ * Whole Script Confusables
+ * ID character extensions.
+ *
+ * The data tables for each are built separately, each from its own definitions
+ */
+
+#include "unicode/utypes.h"
+#include "unicode/uspoof.h"
+#include "unicode/unorm.h"
+#include "unicode/uregex.h"
+#include "unicode/ustring.h"
+#include "cmemory.h"
+#include "uspoof_impl.h"
+#include "uhash.h"
+#include "uvector.h"
+#include "uassert.h"
+#include "uarrsort.h"
+#include "uspoof_conf.h"
+
+#if !UCONFIG_NO_NORMALIZATION
+
+U_NAMESPACE_USE
+
+// Defined in uspoof.cpp, initializes file-static variables.
+U_CFUNC void uspoof_internalInitStatics(UErrorCode *status);
+
+// The main data building function
+
+U_CAPI USpoofChecker * U_EXPORT2
+uspoof_openFromSource(const char *confusables, int32_t confusablesLen,
+ const char* /*confusablesWholeScript*/, int32_t /*confusablesWholeScriptLen*/,
+ int32_t *errorType, UParseError *pe, UErrorCode *status) {
+ uspoof_internalInitStatics(status);
+ if (U_FAILURE(*status)) {
+ return NULL;
+ }
+#if UCONFIG_NO_REGULAR_EXPRESSIONS
+ *status = U_UNSUPPORTED_ERROR;
+ return NULL;
+#else
+ if (errorType!=NULL) {
+ *errorType = 0;
+ }
+ if (pe != NULL) {
+ pe->line = 0;
+ pe->offset = 0;
+ pe->preContext[0] = 0;
+ pe->postContext[0] = 0;
+ }
+
+ // Set up a shell of a spoof detector, with empty data.
+ SpoofData *newSpoofData = new SpoofData(*status);
+
+ if (newSpoofData == NULL) {
+ *status = U_MEMORY_ALLOCATION_ERROR;
+ return NULL;
+ }
+
+ if (U_FAILURE(*status)) {
+ delete newSpoofData;
+ return NULL;
+ }
+ SpoofImpl *This = new SpoofImpl(newSpoofData, *status);
+
+ if (This == NULL) {
+ *status = U_MEMORY_ALLOCATION_ERROR;
+ delete newSpoofData; // explicit delete as the destructor for SpoofImpl won't be called.
+ return NULL;
+ }
+
+ if (U_FAILURE(*status)) {
+ delete This; // no delete for newSpoofData, as the SpoofImpl destructor will delete it.
+ return NULL;
+ }
+
+ // Compile the binary data from the source (text) format.
+ ConfusabledataBuilder::buildConfusableData(This, confusables, confusablesLen, errorType, pe, *status);
+
+ if (U_FAILURE(*status)) {
+ delete This;
+ This = NULL;
+ }
+ return (USpoofChecker *)This;
+#endif // UCONFIG_NO_REGULAR_EXPRESSIONS
+}
+
+#endif