diff options
| author | vitalyisaev <[email protected]> | 2023-11-14 09:58:56 +0300 |
|---|---|---|
| committer | vitalyisaev <[email protected]> | 2023-11-14 10:20:20 +0300 |
| commit | c2b2dfd9827a400a8495e172a56343462e3ceb82 (patch) | |
| tree | cd4e4f597d01bede4c82dffeb2d780d0a9046bd0 /contrib/clickhouse/src/Functions/regexpQuoteMeta.cpp | |
| parent | d4ae8f119e67808cb0cf776ba6e0cf95296f2df7 (diff) | |
YQ Connector: move tests from yql to ydb (OSS)
Перенос папки с тестами на Коннектор из папки yql в папку ydb (синхронизируется с github).
Diffstat (limited to 'contrib/clickhouse/src/Functions/regexpQuoteMeta.cpp')
| -rw-r--r-- | contrib/clickhouse/src/Functions/regexpQuoteMeta.cpp | 118 |
1 files changed, 118 insertions, 0 deletions
diff --git a/contrib/clickhouse/src/Functions/regexpQuoteMeta.cpp b/contrib/clickhouse/src/Functions/regexpQuoteMeta.cpp new file mode 100644 index 00000000000..bd8cf161518 --- /dev/null +++ b/contrib/clickhouse/src/Functions/regexpQuoteMeta.cpp @@ -0,0 +1,118 @@ +#include <Columns/ColumnString.h> +#include <DataTypes/DataTypeString.h> +#include <Functions/FunctionFactory.h> +#include <Functions/FunctionHelpers.h> +#include <base/find_symbols.h> + + +namespace DB +{ +namespace ErrorCodes +{ + extern const int ILLEGAL_COLUMN; + extern const int ILLEGAL_TYPE_OF_ARGUMENT; +} + +namespace +{ + +class FunctionRegexpQuoteMeta : public IFunction +{ +public: + static constexpr auto name = "regexpQuoteMeta"; + + static FunctionPtr create(ContextPtr) + { + return std::make_shared<FunctionRegexpQuoteMeta>(); + } + + String getName() const override + { + return name; + } + + size_t getNumberOfArguments() const override + { + return 1; + } + + bool useDefaultImplementationForConstants() const override + { + return true; + } + + bool isSuitableForShortCircuitArgumentsExecution(const DataTypesWithConstInfo & /*arguments*/) const override { return true; } + + DataTypePtr getReturnTypeImpl(const ColumnsWithTypeAndName & arguments) const override + { + if (!WhichDataType(arguments[0].type).isString()) + throw Exception(ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT, "Illegal type {} of 1 argument of function {}. Must be String.", + arguments[0].type->getName(), getName()); + + return std::make_shared<DataTypeString>(); + } + + ColumnPtr executeImpl(const ColumnsWithTypeAndName & arguments, const DataTypePtr &, size_t input_rows_count) const override + { + const ColumnPtr & column_string = arguments[0].column; + const ColumnString * input = checkAndGetColumn<ColumnString>(column_string.get()); + + if (!input) + throw Exception(ErrorCodes::ILLEGAL_COLUMN, "Illegal column {} of first argument of function {}", + arguments[0].column->getName(), getName()); + + auto dst_column = ColumnString::create(); + auto & dst_data = dst_column->getChars(); + auto & dst_offsets = dst_column->getOffsets(); + + dst_offsets.resize(input_rows_count); + + const ColumnString::Offsets & src_offsets = input->getOffsets(); + + const auto * src_begin = reinterpret_cast<const char *>(input->getChars().data()); + const auto * src_pos = src_begin; + + for (size_t row_idx = 0; row_idx < input_rows_count; ++row_idx) + { + /// NOTE This implementation slightly differs from re2::RE2::QuoteMeta. + /// It escapes zero byte as \0 instead of \x00 + /// and it escapes only required characters. + /// This is Ok. Look at comments in re2.cc + + const char * src_end = src_begin + src_offsets[row_idx] - 1; + + while (true) + { + const char * next_src_pos = find_first_symbols<'\0', '\\', '|', '(', ')', '^', '$', '.', '[', ']', '?', '*', '+', '{', ':', '-'>(src_pos, src_end); + + size_t bytes_to_copy = next_src_pos - src_pos; + size_t old_dst_size = dst_data.size(); + dst_data.resize(old_dst_size + bytes_to_copy); + memcpySmallAllowReadWriteOverflow15(dst_data.data() + old_dst_size, src_pos, bytes_to_copy); + src_pos = next_src_pos + 1; + + if (next_src_pos == src_end) + { + dst_data.emplace_back('\0'); + break; + } + + dst_data.emplace_back('\\'); + dst_data.emplace_back(*next_src_pos); + } + + dst_offsets[row_idx] = dst_data.size(); + } + + return dst_column; + } +}; + +} + +REGISTER_FUNCTION(RegexpQuoteMeta) +{ + factory.registerFunction<FunctionRegexpQuoteMeta>(); +} + +} |
