aboutsummaryrefslogtreecommitdiffstats
path: root/contrib/libs/icu/io/ustream.cpp
diff options
context:
space:
mode:
authorvvvv <vvvv@yandex-team.ru>2022-03-03 23:09:11 +0300
committervvvv <vvvv@yandex-team.ru>2022-03-03 23:09:11 +0300
commit8dbdbab054b6eb352cfffdad09991052008062fc (patch)
tree71befed92d327f2cc409bff4986ec510d0530d92 /contrib/libs/icu/io/ustream.cpp
parented3f4e21f3a3837059607ec2606e1dc910269ac0 (diff)
downloadydb-8dbdbab054b6eb352cfffdad09991052008062fc.tar.gz
YQL-13710 try to switch to new shiny PG
ref:2bed0445c8e8bd6c575883632adf19445f0a72a7
Diffstat (limited to 'contrib/libs/icu/io/ustream.cpp')
-rw-r--r--contrib/libs/icu/io/ustream.cpp170
1 files changed, 170 insertions, 0 deletions
diff --git a/contrib/libs/icu/io/ustream.cpp b/contrib/libs/icu/io/ustream.cpp
new file mode 100644
index 0000000000..51676ea0f5
--- /dev/null
+++ b/contrib/libs/icu/io/ustream.cpp
@@ -0,0 +1,170 @@
+// © 2016 and later: Unicode, Inc. and others.
+// License & terms of use: http://www.unicode.org/copyright.html
+/*
+**********************************************************************
+* Copyright (C) 2001-2016, International Business Machines
+* Corporation and others. All Rights Reserved.
+**********************************************************************
+* FILE NAME : ustream.cpp
+*
+* Modification History:
+*
+* Date Name Description
+* 06/25/2001 grhoten Move iostream from unistr.h to here
+******************************************************************************
+*/
+
+#include "unicode/utypes.h"
+
+#if !UCONFIG_NO_CONVERSION
+
+#include "unicode/uobject.h"
+#include "unicode/ustream.h"
+#include "unicode/ucnv.h"
+#include "unicode/uchar.h"
+#include "unicode/utf16.h"
+#include "ustr_cnv.h"
+#include "cmemory.h"
+#include <string.h>
+
+// console IO: shorthand macros naming the standard stream types used by the operators in this file
+
+#define STD_NAMESPACE std::
+
+#define STD_OSTREAM STD_NAMESPACE ostream
+#define STD_ISTREAM STD_NAMESPACE istream
+
+U_NAMESPACE_BEGIN
+
+/**
+ * Writes a UnicodeString to a standard output stream.
+ *
+ * The UTF-16 contents of `str` are converted with the converter returned by
+ * u_getDefaultConverter() and inserted into `stream` in chunks of at most
+ * 199 bytes. Nothing is written when the string is empty or when the
+ * converter cannot be obtained. The stream is not flushed.
+ *
+ * NOTE(review): each chunk is inserted as a NUL-terminated C string, so a
+ * converted chunk containing an embedded zero byte is written only up to
+ * that byte.
+ *
+ * @param stream the output stream to write to
+ * @param str    the string to convert and write
+ * @return `stream`, to allow chaining
+ */
+U_IO_API STD_OSTREAM & U_EXPORT2
+operator<<(STD_OSTREAM& stream, const UnicodeString& str)
+{
+    // An empty string produces no output at all.
+    if (str.length() <= 0) {
+        return stream;
+    }
+
+    UErrorCode status = U_ZERO_ERROR;
+    UConverter *cnv = u_getDefaultConverter(&status);
+    if (U_FAILURE(status)) {
+        return stream;
+    }
+
+    char chunk[200];
+    // The final byte is reserved for the terminator written after each pass.
+    char *const chunkEnd = chunk + (sizeof(chunk) - 1);
+    const UChar *src = str.getBuffer();
+    const UChar *const srcEnd = src + str.length();
+
+    for (;;) {
+        char *out = chunk;
+        status = U_ZERO_ERROR;
+        ucnv_fromUnicode(cnv, &out, chunkEnd, &src, srcEnd, 0, FALSE, &status);
+        *out = 0;
+
+        // Emit whatever this pass produced.
+        if (out != chunk) {
+            stream << chunk;
+        }
+
+        // Only a full output chunk means there is more text left to convert.
+        if (status != U_BUFFER_OVERFLOW_ERROR) {
+            break;
+        }
+    }
+    u_releaseDefaultConverter(cnv);
+
+    return stream;
+}
+
+/**
+ * Reads one whitespace-delimited token from a standard input stream into a
+ * UnicodeString.
+ *
+ * Bytes are taken from `stream` one at a time and converted with the
+ * converter returned by u_getDefaultConverter(). Leading characters for which
+ * u_isWhitespace() is true are skipped; reading stops at the first whitespace
+ * character after the token, and the bytes of that character are put back
+ * into the stream. `str` is truncated only once the first non-whitespace
+ * character has been decoded, so it is left untouched when nothing can be
+ * read.
+ *
+ * Stream state on return:
+ *  - unchanged if the stream was already in a failed state on entry;
+ *  - set to exactly eofbit if end of input was reached after at least one
+ *    character had been read;
+ *  - set to exactly failbit on a conversion error, or when more bytes are
+ *    pending without decoded output than the internal buffer can hold.
+ *
+ * @param stream the input stream to read from
+ * @param str    receives the token that was read
+ * @return `stream`, to allow chaining
+ */
+U_IO_API STD_ISTREAM & U_EXPORT2
+operator>>(STD_ISTREAM& stream, UnicodeString& str)
+{
+    // This is like ICU status checking.
+    if (stream.fail()) {
+        return stream;
+    }
+
+    /* ipfx should eat whitespace when ios::skipws is set */
+    UChar uBuffer[16];
+    /* Bytes consumed by the converter that have not produced any output yet. */
+    char buffer[16];
+    int32_t idx = 0;
+    UConverter *converter;
+    UErrorCode errorCode = U_ZERO_ERROR;
+
+    // use the default converter to convert chunks of text
+    converter = u_getDefaultConverter(&errorCode);
+    if(U_SUCCESS(errorCode)) {
+        UChar *us = uBuffer;
+        const UChar *uLimit = uBuffer + UPRV_LENGTHOF(uBuffer);
+        const char *s, *sLimit;
+        char ch;
+        /*
+          Must be a full UChar32: U16_NEXT can yield a supplementary code point,
+          which does not fit into a 16-bit UChar.
+        */
+        UChar32 ch32;
+        UBool initialWhitespace = TRUE;
+        UBool continueReading = TRUE;
+
+        /* We need to consume one byte at a time to see what is considered whitespace. */
+        while (continueReading) {
+            ch = stream.get();
+            if (stream.eof()) {
+                // The EOF is only set after the get() of an unavailable byte.
+                if (!initialWhitespace) {
+                    stream.clear(stream.eofbit);
+                }
+                continueReading = FALSE;
+            }
+            /* At EOF there is no input byte; the source range is empty and we only flush. */
+            sLimit = &ch + (int)continueReading;
+            us = uBuffer;
+            s = &ch;
+            errorCode = U_ZERO_ERROR;
+            /*
+            Since we aren't guaranteed to see the state before this call,
+            this code won't work on stateful encodings like ISO-2022 or an EBCDIC stateful encoding.
+            We flush on the last byte to ensure that we output truncated multibyte characters.
+            */
+            ucnv_toUnicode(converter, &us, uLimit, &s, sLimit, 0, !continueReading, &errorCode);
+            if(U_FAILURE(errorCode)) {
+                /* Something really bad happened. setstate() isn't always an available API */
+                stream.clear(stream.failbit);
+                goto STOP_READING;
+            }
+            /* Was the character consumed? */
+            if (us != uBuffer) {
+                /* Reminder: ibm-1390 & JISX0213 can output 2 Unicode code points */
+                int32_t uBuffSize = static_cast<int32_t>(us-uBuffer);
+                int32_t uBuffIdx = 0;
+                while (uBuffIdx < uBuffSize) {
+                    U16_NEXT(uBuffer, uBuffIdx, uBuffSize, ch32);
+                    if (u_isWhitespace(ch32)) {
+                        if (!initialWhitespace) {
+                            /*
+                              Return the terminating whitespace to the stream: the
+                              current byte first, then the pending bytes in reverse
+                              order, so that they will be read again in their
+                              original order.
+                            */
+                            stream.putback(ch);
+                            while (idx > 0) {
+                                stream.putback(buffer[--idx]);
+                            }
+                            goto STOP_READING;
+                        }
+                        /* else skip initialWhitespace */
+                    }
+                    else {
+                        if (initialWhitespace) {
+                            /*
+                            When initialWhitespace is TRUE, we haven't appended any
+                            character yet. This is where we truncate the string,
+                            to avoid modifying the string before we know if we can
+                            actually read from the stream.
+                            */
+                            str.truncate(0);
+                            initialWhitespace = FALSE;
+                        }
+                        str.append(ch32);
+                    }
+                }
+                idx = 0;
+            }
+            else if (continueReading) {
+                /* At EOF there is no real byte to remember, so nothing is stored then. */
+                if (idx >= UPRV_LENGTHOF(buffer)) {
+                    /* Too many bytes without any output; never write past the end of buffer. */
+                    stream.clear(stream.failbit);
+                    goto STOP_READING;
+                }
+                buffer[idx++] = ch;
+            }
+        }
+STOP_READING:
+        u_releaseDefaultConverter(converter);
+    }
+
+/* stream.flush();*/
+    return stream;
+}
+
+U_NAMESPACE_END
+
+#endif