diff options
| author | vitalyisaev <[email protected]> | 2023-11-14 09:58:56 +0300 |
|---|---|---|
| committer | vitalyisaev <[email protected]> | 2023-11-14 10:20:20 +0300 |
| commit | c2b2dfd9827a400a8495e172a56343462e3ceb82 (patch) | |
| tree | cd4e4f597d01bede4c82dffeb2d780d0a9046bd0 /contrib/clickhouse/src/Functions/randomString.cpp | |
| parent | d4ae8f119e67808cb0cf776ba6e0cf95296f2df7 (diff) | |
YQ Connector: move tests from yql to ydb (OSS)
Перенос папки с тестами на Коннектор из папки yql в папку ydb (синхронизируется с github).
Diffstat (limited to 'contrib/clickhouse/src/Functions/randomString.cpp')
| -rw-r--r-- | contrib/clickhouse/src/Functions/randomString.cpp | 132 |
1 files changed, 132 insertions, 0 deletions
diff --git a/contrib/clickhouse/src/Functions/randomString.cpp b/contrib/clickhouse/src/Functions/randomString.cpp new file mode 100644 index 00000000000..4afd0799d29 --- /dev/null +++ b/contrib/clickhouse/src/Functions/randomString.cpp @@ -0,0 +1,132 @@ +#include <Columns/ColumnString.h> +#include <DataTypes/DataTypeString.h> +#include <Functions/FunctionFactory.h> +#include <Functions/FunctionHelpers.h> +#include <Functions/IFunction.h> +#include <Functions/FunctionsRandom.h> +#include <Functions/PerformanceAdaptors.h> +#include <pcg_random.hpp> +#include <Common/randomSeed.h> +#include <base/unaligned.h> + + +namespace DB +{ +namespace ErrorCodes +{ + extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH; + extern const int ILLEGAL_TYPE_OF_ARGUMENT; + extern const int TOO_LARGE_STRING_SIZE; +} + +namespace +{ + +/* Generate random string of specified length with fully random bytes (including zero). */ +template <typename RandImpl> +class FunctionRandomStringImpl : public IFunction +{ +public: + static constexpr auto name = "randomString"; + + String getName() const override { return name; } + + bool isVariadic() const override { return true; } + + bool isSuitableForShortCircuitArgumentsExecution(const DataTypesWithConstInfo & /*arguments*/) const override { return false; } + + size_t getNumberOfArguments() const override { return 0; } + + DataTypePtr getReturnTypeImpl(const DataTypes & arguments) const override + { + if (arguments.empty()) + throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, + "Function {} requires at least one argument: the size of resulting string", getName()); + + if (arguments.size() > 2) + throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, + "Function {} requires at most two arguments: the size of resulting string and optional disambiguation tag", getName()); + + const IDataType & length_type = *arguments[0]; + if (!isNumber(length_type)) + throw Exception(ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT, "First argument of function {} must have numeric type", getName()); + + return std::make_shared<DataTypeString>(); + } + + bool isDeterministic() const override { return false; } + bool isDeterministicInScopeOfQuery() const override { return false; } + + ColumnPtr executeImpl(const ColumnsWithTypeAndName & arguments, const DataTypePtr &, size_t input_rows_count) const override + { + auto col_to = ColumnString::create(); + ColumnString::Chars & data_to = col_to->getChars(); + ColumnString::Offsets & offsets_to = col_to->getOffsets(); + + if (input_rows_count == 0) + return col_to; + + /// Fill offsets. + offsets_to.resize(input_rows_count); + const IColumn & length_column = *arguments[0].column; + + IColumn::Offset offset = 0; + for (size_t row_num = 0; row_num < input_rows_count; ++row_num) + { + size_t length = length_column.getUInt(row_num); + if (length > (1 << 30)) + throw Exception(ErrorCodes::TOO_LARGE_STRING_SIZE, "Too large string size in function {}", getName()); + + offset += length + 1; + offsets_to[row_num] = offset; + } + + /// Fill random bytes. + data_to.resize(offsets_to.back()); + RandImpl::execute(reinterpret_cast<char *>(data_to.data()), data_to.size()); + + /// Put zero bytes in between. + auto * pos = data_to.data(); + for (size_t row_num = 0; row_num < input_rows_count; ++row_num) + pos[offsets_to[row_num] - 1] = 0; + + return col_to; + } +}; + +class FunctionRandomString : public FunctionRandomStringImpl<TargetSpecific::Default::RandImpl> +{ +public: + explicit FunctionRandomString(ContextPtr context) : selector(context) + { + selector.registerImplementation<TargetArch::Default, + FunctionRandomStringImpl<TargetSpecific::Default::RandImpl>>(); + + #if USE_MULTITARGET_CODE + selector.registerImplementation<TargetArch::AVX2, + FunctionRandomStringImpl<TargetSpecific::AVX2::RandImpl>>(); + #endif + } + + ColumnPtr executeImpl(const ColumnsWithTypeAndName & arguments, const DataTypePtr & result_type, size_t input_rows_count) const override + { + return selector.selectAndExecute(arguments, result_type, input_rows_count); + } + + static FunctionPtr create(ContextPtr context) + { + return std::make_shared<FunctionRandomString>(context); + } + +private: + ImplementationSelector<IFunction> selector; +}; + +} + +REGISTER_FUNCTION(RandomString) +{ + factory.registerFunction<FunctionRandomString>(); +} + +} |
