summaryrefslogtreecommitdiffstats
path: root/contrib/clickhouse/src/TableFunctions/TableFunctionAzureBlobStorage.cpp
diff options
context:
space:
mode:
authorAlexSm <[email protected]>2024-01-04 15:09:05 +0100
committerGitHub <[email protected]>2024-01-04 15:09:05 +0100
commitdab291146f6cd7d35684e3a1150e5bb1c412982c (patch)
tree36ef35f6cacb6432845a4a33f940c95871036b32 /contrib/clickhouse/src/TableFunctions/TableFunctionAzureBlobStorage.cpp
parent63660ad5e7512029fd0218e7a636580695a24e1f (diff)
Library import 5, delete go dependencies (#832)
* Library import 5, delete go dependencies * Fix yt client
Diffstat (limited to 'contrib/clickhouse/src/TableFunctions/TableFunctionAzureBlobStorage.cpp')
-rw-r--r--contrib/clickhouse/src/TableFunctions/TableFunctionAzureBlobStorage.cpp317
1 files changed, 0 insertions, 317 deletions
diff --git a/contrib/clickhouse/src/TableFunctions/TableFunctionAzureBlobStorage.cpp b/contrib/clickhouse/src/TableFunctions/TableFunctionAzureBlobStorage.cpp
deleted file mode 100644
index c2829fd9051..00000000000
--- a/contrib/clickhouse/src/TableFunctions/TableFunctionAzureBlobStorage.cpp
+++ /dev/null
@@ -1,317 +0,0 @@
-#include "clickhouse_config.h"
-
-#if USE_AZURE_BLOB_STORAGE
-
-#include <Interpreters/evaluateConstantExpression.h>
-#include <Interpreters/Context.h>
-#include <TableFunctions/TableFunctionFactory.h>
-#include <TableFunctions/TableFunctionS3.h>
-#include <TableFunctions/TableFunctionAzureBlobStorage.h>
-#include <Interpreters/parseColumnsListForTableFunction.h>
-#include <Access/Common/AccessFlags.h>
-#include <Parsers/ASTLiteral.h>
-#include <Parsers/ASTIdentifier.h>
-#include <Parsers/ASTFunction.h>
-#include <Storages/checkAndGetLiteralArgument.h>
-#include <Storages/StorageAzureBlob.h>
-#include <Storages/StorageURL.h>
-#include <Storages/NamedCollectionsHelpers.h>
-#include <Formats/FormatFactory.h>
-#include "registerTableFunctions.h"
-#error #include <Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.h>
-#include <DataTypes/DataTypeString.h>
-#include <DataTypes/DataTypesNumber.h>
-
-#include <boost/algorithm/string.hpp>
-
-
-namespace DB
-{
-
-namespace ErrorCodes
-{
- extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH;
- extern const int BAD_ARGUMENTS;
-}
-
-namespace
-{
-
-bool isConnectionString(const std::string & candidate)
-{
- return !candidate.starts_with("http");
-}
-
-}
-
-void TableFunctionAzureBlobStorage::parseArgumentsImpl(ASTs & engine_args, const ContextPtr & local_context)
-{
- /// Supported signatures:
- ///
- /// AzureBlobStorage(connection_string|storage_account_url, container_name, blobpath, [account_name, account_key, format, compression, structure])
- ///
-
- if (auto named_collection = tryGetNamedCollectionWithOverrides(engine_args, local_context))
- {
- StorageAzureBlob::processNamedCollectionResult(configuration, *named_collection);
-
- configuration.blobs_paths = {configuration.blob_path};
-
- if (configuration.format == "auto")
- configuration.format = FormatFactory::instance().getFormatFromFileName(configuration.blob_path, true);
- }
- else
- {
- if (engine_args.size() < 3 || engine_args.size() > 8)
- throw Exception(
- ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH,
- "Storage Azure requires 3 to 7 arguments: "
- "AzureBlobStorage(connection_string|storage_account_url, container_name, blobpath, [account_name, account_key, format, compression, structure])");
-
- for (auto & engine_arg : engine_args)
- engine_arg = evaluateConstantExpressionOrIdentifierAsLiteral(engine_arg, local_context);
-
- std::unordered_map<std::string_view, size_t> engine_args_to_idx;
-
- configuration.connection_url = checkAndGetLiteralArgument<String>(engine_args[0], "connection_string/storage_account_url");
- configuration.is_connection_string = isConnectionString(configuration.connection_url);
-
- configuration.container = checkAndGetLiteralArgument<String>(engine_args[1], "container");
- configuration.blob_path = checkAndGetLiteralArgument<String>(engine_args[2], "blobpath");
-
- auto is_format_arg
- = [](const std::string & s) -> bool { return s == "auto" || FormatFactory::instance().getAllFormats().contains(s); };
-
- if (engine_args.size() == 4)
- {
- auto fourth_arg = checkAndGetLiteralArgument<String>(engine_args[3], "format/account_name/structure");
- if (is_format_arg(fourth_arg))
- {
- configuration.format = fourth_arg;
- }
- else
- {
- configuration.structure = fourth_arg;
- }
- }
- else if (engine_args.size() == 5)
- {
- auto fourth_arg = checkAndGetLiteralArgument<String>(engine_args[3], "format/account_name");
- if (is_format_arg(fourth_arg))
- {
- configuration.format = fourth_arg;
- configuration.compression_method = checkAndGetLiteralArgument<String>(engine_args[4], "compression");
- }
- else
- {
- configuration.account_name = fourth_arg;
- configuration.account_key = checkAndGetLiteralArgument<String>(engine_args[4], "account_key");
- }
- }
- else if (engine_args.size() == 6)
- {
- auto fourth_arg = checkAndGetLiteralArgument<String>(engine_args[3], "format/account_name");
- if (is_format_arg(fourth_arg))
- {
- configuration.format = fourth_arg;
- configuration.compression_method = checkAndGetLiteralArgument<String>(engine_args[4], "compression");
- configuration.structure = checkAndGetLiteralArgument<String>(engine_args[5], "structure");
- }
- else
- {
- configuration.account_name = fourth_arg;
- configuration.account_key = checkAndGetLiteralArgument<String>(engine_args[4], "account_key");
- auto sixth_arg = checkAndGetLiteralArgument<String>(engine_args[5], "format/account_name/structure");
- if (is_format_arg(sixth_arg))
- configuration.format = sixth_arg;
- else
- configuration.structure = sixth_arg;
- }
- }
- else if (engine_args.size() == 7)
- {
- auto fourth_arg = checkAndGetLiteralArgument<String>(engine_args[3], "format/account_name");
- configuration.account_name = fourth_arg;
- configuration.account_key = checkAndGetLiteralArgument<String>(engine_args[4], "account_key");
- auto sixth_arg = checkAndGetLiteralArgument<String>(engine_args[5], "format/account_name");
- if (!is_format_arg(sixth_arg))
- throw Exception(ErrorCodes::BAD_ARGUMENTS, "Unknown format {}", sixth_arg);
- configuration.format = sixth_arg;
- configuration.compression_method = checkAndGetLiteralArgument<String>(engine_args[6], "compression");
- }
- else if (engine_args.size() == 8)
- {
- auto fourth_arg = checkAndGetLiteralArgument<String>(engine_args[3], "format/account_name");
- configuration.account_name = fourth_arg;
- configuration.account_key = checkAndGetLiteralArgument<String>(engine_args[4], "account_key");
- auto sixth_arg = checkAndGetLiteralArgument<String>(engine_args[5], "format/account_name");
- if (!is_format_arg(sixth_arg))
- throw Exception(ErrorCodes::BAD_ARGUMENTS, "Unknown format {}", sixth_arg);
- configuration.format = sixth_arg;
- configuration.compression_method = checkAndGetLiteralArgument<String>(engine_args[6], "compression");
- configuration.structure = checkAndGetLiteralArgument<String>(engine_args[7], "structure");
- }
-
- configuration.blobs_paths = {configuration.blob_path};
-
- if (configuration.format == "auto")
- configuration.format = FormatFactory::instance().getFormatFromFileName(configuration.blob_path, true);
- }
-}
-
-void TableFunctionAzureBlobStorage::parseArguments(const ASTPtr & ast_function, ContextPtr context)
-{
- /// Clone ast function, because we can modify its arguments like removing headers.
- auto ast_copy = ast_function->clone();
-
- ASTs & args_func = ast_function->children;
-
- if (args_func.size() != 1)
- throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, "Table function '{}' must have arguments.", getName());
-
- auto & args = args_func.at(0)->children;
-
- parseArgumentsImpl(args, context);
-}
-
-void TableFunctionAzureBlobStorage::addColumnsStructureToArguments(ASTs & args, const String & structure, const ContextPtr & context)
-{
- if (tryGetNamedCollectionWithOverrides(args, context))
- {
- /// In case of named collection, just add key-value pair "structure='...'"
- /// at the end of arguments to override existed structure.
- ASTs equal_func_args = {std::make_shared<ASTIdentifier>("structure"), std::make_shared<ASTLiteral>(structure)};
- auto equal_func = makeASTFunction("equals", std::move(equal_func_args));
- args.push_back(equal_func);
- }
- else
- {
- if (args.size() < 3 || args.size() > 8)
- throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH,
- "Storage Azure requires 3 to 7 arguments: "
- "AzureBlobStorage(connection_string|storage_account_url, container_name, blobpath, [account_name, account_key, format, compression, structure])");
-
- auto structure_literal = std::make_shared<ASTLiteral>(structure);
-
- auto is_format_arg
- = [](const std::string & s) -> bool { return s == "auto" || FormatFactory::instance().getAllFormats().contains(s); };
-
-
- if (args.size() == 3)
- {
- /// Add format=auto & compression=auto before structure argument.
- args.push_back(std::make_shared<ASTLiteral>("auto"));
- args.push_back(std::make_shared<ASTLiteral>("auto"));
- args.push_back(structure_literal);
- }
- else if (args.size() == 4)
- {
- auto fourth_arg = checkAndGetLiteralArgument<String>(args[3], "format/account_name/structure");
- if (is_format_arg(fourth_arg))
- {
- /// Add compression=auto before structure argument.
- args.push_back(std::make_shared<ASTLiteral>("auto"));
- args.push_back(structure_literal);
- }
- else
- {
- args.back() = structure_literal;
- }
- }
- else if (args.size() == 5)
- {
- auto fourth_arg = checkAndGetLiteralArgument<String>(args[3], "format/account_name");
- if (!is_format_arg(fourth_arg))
- {
- /// Add format=auto & compression=auto before structure argument.
- args.push_back(std::make_shared<ASTLiteral>("auto"));
- args.push_back(std::make_shared<ASTLiteral>("auto"));
- }
- args.push_back(structure_literal);
- }
- else if (args.size() == 6)
- {
- auto fourth_arg = checkAndGetLiteralArgument<String>(args[3], "format/account_name");
- if (!is_format_arg(fourth_arg))
- {
- /// Add compression=auto before structure argument.
- args.push_back(std::make_shared<ASTLiteral>("auto"));
- args.push_back(structure_literal);
- }
- else
- {
- args.back() = structure_literal;
- }
- }
- else if (args.size() == 7)
- {
- args.push_back(structure_literal);
- }
- else if (args.size() == 8)
- {
- args.back() = structure_literal;
- }
- }
-}
-
-ColumnsDescription TableFunctionAzureBlobStorage::getActualTableStructure(ContextPtr context, bool is_insert_query) const
-{
- if (configuration.structure == "auto")
- {
- context->checkAccess(getSourceAccessType());
- auto client = StorageAzureBlob::createClient(configuration, !is_insert_query);
- auto settings = StorageAzureBlob::createSettings(context);
-
- auto object_storage = std::make_unique<AzureObjectStorage>("AzureBlobStorageTableFunction", std::move(client), std::move(settings));
- return StorageAzureBlob::getTableStructureFromData(object_storage.get(), configuration, std::nullopt, context, false);
- }
-
- return parseColumnsListFromString(configuration.structure, context);
-}
-
-bool TableFunctionAzureBlobStorage::supportsReadingSubsetOfColumns(const ContextPtr & context)
-{
- return FormatFactory::instance().checkIfFormatSupportsSubsetOfColumns(configuration.format, context);
-}
-
-StoragePtr TableFunctionAzureBlobStorage::executeImpl(const ASTPtr & /*ast_function*/, ContextPtr context, const std::string & table_name, ColumnsDescription /*cached_columns*/, bool is_insert_query) const
-{
- auto client = StorageAzureBlob::createClient(configuration, !is_insert_query);
- auto settings = StorageAzureBlob::createSettings(context);
-
- ColumnsDescription columns;
- if (configuration.structure != "auto")
- columns = parseColumnsListFromString(configuration.structure, context);
- else if (!structure_hint.empty())
- columns = structure_hint;
-
- StoragePtr storage = std::make_shared<StorageAzureBlob>(
- configuration,
- std::make_unique<AzureObjectStorage>(table_name, std::move(client), std::move(settings)),
- context,
- StorageID(getDatabaseName(), table_name),
- columns,
- ConstraintsDescription{},
- String{},
- /// No format_settings for table function Azure
- std::nullopt,
- /* distributed_processing */ false,
- nullptr);
-
- storage->startup();
-
- return storage;
-}
-
-void registerTableFunctionAzureBlobStorage(TableFunctionFactory & factory)
-{
- factory.registerFunction<TableFunctionAzureBlobStorage>(
- {.documentation
- = {.description=R"(The table function can be used to read the data stored on Azure Blob Storage.)",
- .examples{{"azureBlobStorage", "SELECT * FROM azureBlobStorage(connection_string|storage_account_url, container_name, blobpath, [account_name, account_key, format, compression, structure])", ""}}},
- .allow_readonly = false});
-}
-
-}
-
-#endif