#include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #if !defined(ARCADIA_BUILD) # include "config_core.h" #endif #if USE_MYSQL # include # include # include # include # include # include #endif #if USE_MYSQL || USE_LIBPQXX #include #include #include #endif #if USE_LIBPQXX #include // Y_IGNORE #include #include #endif #if USE_SQLITE #include #endif namespace fs = std::filesystem; namespace DB { namespace ErrorCodes { extern const int UNKNOWN_ELEMENT_IN_AST; extern const int BAD_ARGUMENTS; extern const int UNKNOWN_DATABASE_ENGINE; extern const int CANNOT_CREATE_DATABASE; } DatabasePtr DatabaseFactory::get(const ASTCreateQuery & create, const String & metadata_path, ContextPtr context) { bool created = false; try { /// Creates store/xxx/ for Atomic fs::create_directories(fs::path(metadata_path).parent_path()); /// Before 20.7 it's possible that .sql metadata file does not exist for some old database. /// In this case Ordinary database is created on server startup if the corresponding metadata directory exists. /// So we should remove metadata directory if database creation failed. created = fs::create_directory(metadata_path); DatabasePtr impl = getImpl(create, metadata_path, context); if (impl && context->hasQueryContext() && context->getSettingsRef().log_queries) context->getQueryContext()->addQueryFactoriesInfo(Context::QueryLogFactories::Database, impl->getEngineName()); return impl; } catch (...) { if (created && fs::exists(metadata_path)) fs::remove_all(metadata_path); throw; } } template static inline ValueType safeGetLiteralValue(const ASTPtr &ast, const String &engine_name) { if (!ast || !ast->as()) throw Exception("Database engine " + engine_name + " requested literal argument.", ErrorCodes::BAD_ARGUMENTS); return ast->as()->value.safeGet(); } DatabasePtr DatabaseFactory::getImpl(const ASTCreateQuery & create, const String & metadata_path, ContextPtr context) { auto * engine_define = create.storage; const String & database_name = create.database; const String & engine_name = engine_define->engine->name; const UUID & uuid = create.uuid; bool engine_may_have_arguments = engine_name == "MySQL" || engine_name == "MaterializedMySQL" || engine_name == "Lazy" || engine_name == "Replicated" || engine_name == "PostgreSQL" || engine_name == "MaterializedPostgreSQL" || engine_name == "SQLite"; if (engine_define->engine->arguments && !engine_may_have_arguments) throw Exception("Database engine " + engine_name + " cannot have arguments", ErrorCodes::BAD_ARGUMENTS); bool has_unexpected_element = engine_define->engine->parameters || engine_define->partition_by || engine_define->primary_key || engine_define->order_by || engine_define->sample_by; bool may_have_settings = endsWith(engine_name, "MySQL") || engine_name == "Replicated" || engine_name == "MaterializedPostgreSQL"; if (has_unexpected_element || (!may_have_settings && engine_define->settings)) throw Exception("Database engine " + engine_name + " cannot have parameters, primary_key, order_by, sample_by, settings", ErrorCodes::UNKNOWN_ELEMENT_IN_AST); if (engine_name == "Ordinary") return std::make_shared(database_name, metadata_path, context); else if (engine_name == "Atomic") return std::make_shared(database_name, metadata_path, uuid, context); else if (engine_name == "Memory") return std::make_shared(database_name, context); else if (engine_name == "Dictionary") return std::make_shared(database_name, context); #if USE_MYSQL else if (engine_name == "MySQL" || engine_name == "MaterializedMySQL") { const ASTFunction * engine = engine_define->engine; if (!engine->arguments || engine->arguments->children.size() != 4) throw Exception( engine_name + " Database require mysql_hostname, mysql_database_name, mysql_username, mysql_password arguments.", ErrorCodes::BAD_ARGUMENTS); ASTs & arguments = engine->arguments->children; arguments[1] = evaluateConstantExpressionOrIdentifierAsLiteral(arguments[1], context); const auto & host_port = safeGetLiteralValue(arguments[0], engine_name); const auto & mysql_database_name = safeGetLiteralValue(arguments[1], engine_name); const auto & mysql_user_name = safeGetLiteralValue(arguments[2], engine_name); const auto & mysql_user_password = safeGetLiteralValue(arguments[3], engine_name); try { if (engine_name == "MySQL") { auto mysql_database_settings = std::make_unique(); /// Split into replicas if needed. size_t max_addresses = context->getSettingsRef().glob_expansion_max_elements; auto addresses = parseRemoteDescriptionForExternalDatabase(host_port, max_addresses, 3306); auto mysql_pool = mysqlxx::PoolWithFailover(mysql_database_name, addresses, mysql_user_name, mysql_user_password); mysql_database_settings->loadFromQueryContext(context); mysql_database_settings->loadFromQuery(*engine_define); /// higher priority return std::make_shared( context, database_name, metadata_path, engine_define, mysql_database_name, std::move(mysql_database_settings), std::move(mysql_pool)); } const auto & [remote_host_name, remote_port] = parseAddress(host_port, 3306); MySQLClient client(remote_host_name, remote_port, mysql_user_name, mysql_user_password); auto mysql_pool = mysqlxx::Pool(mysql_database_name, remote_host_name, mysql_user_name, mysql_user_password, remote_port); auto materialize_mode_settings = std::make_unique(); if (engine_define->settings) materialize_mode_settings->loadFromQuery(*engine_define); if (create.uuid == UUIDHelpers::Nil) return std::make_shared>( context, database_name, metadata_path, uuid, mysql_database_name, std::move(mysql_pool), std::move(client) , std::move(materialize_mode_settings)); else return std::make_shared>( context, database_name, metadata_path, uuid, mysql_database_name, std::move(mysql_pool), std::move(client) , std::move(materialize_mode_settings)); } catch (...) { const auto & exception_message = getCurrentExceptionMessage(true); throw Exception("Cannot create MySQL database, because " + exception_message, ErrorCodes::CANNOT_CREATE_DATABASE); } } #endif else if (engine_name == "Lazy") { const ASTFunction * engine = engine_define->engine; if (!engine->arguments || engine->arguments->children.size() != 1) throw Exception("Lazy database require cache_expiration_time_seconds argument", ErrorCodes::BAD_ARGUMENTS); const auto & arguments = engine->arguments->children; const auto cache_expiration_time_seconds = safeGetLiteralValue(arguments[0], "Lazy"); return std::make_shared(database_name, metadata_path, cache_expiration_time_seconds, context); } else if (engine_name == "Replicated") { const ASTFunction * engine = engine_define->engine; if (!engine->arguments || engine->arguments->children.size() != 3) throw Exception("Replicated database requires 3 arguments: zookeeper path, shard name and replica name", ErrorCodes::BAD_ARGUMENTS); const auto & arguments = engine->arguments->children; String zookeeper_path = safeGetLiteralValue(arguments[0], "Replicated"); String shard_name = safeGetLiteralValue(arguments[1], "Replicated"); String replica_name = safeGetLiteralValue(arguments[2], "Replicated"); zookeeper_path = context->getMacros()->expand(zookeeper_path); shard_name = context->getMacros()->expand(shard_name); replica_name = context->getMacros()->expand(replica_name); DatabaseReplicatedSettings database_replicated_settings{}; if (engine_define->settings) database_replicated_settings.loadFromQuery(*engine_define); return std::make_shared(database_name, metadata_path, uuid, zookeeper_path, shard_name, replica_name, std::move(database_replicated_settings), context); } #if USE_LIBPQXX else if (engine_name == "PostgreSQL") { const ASTFunction * engine = engine_define->engine; if (!engine->arguments || engine->arguments->children.size() < 4 || engine->arguments->children.size() > 5) throw Exception(fmt::format( "{} Database require host:port, database_name, username, password arguments " "[, use_table_cache = 0].", engine_name), ErrorCodes::BAD_ARGUMENTS); ASTs & engine_args = engine->arguments->children; for (auto & engine_arg : engine_args) engine_arg = evaluateConstantExpressionOrIdentifierAsLiteral(engine_arg, context); const auto & host_port = safeGetLiteralValue(engine_args[0], engine_name); const auto & postgres_database_name = safeGetLiteralValue(engine_args[1], engine_name); const auto & username = safeGetLiteralValue(engine_args[2], engine_name); const auto & password = safeGetLiteralValue(engine_args[3], engine_name); auto use_table_cache = 0; if (engine->arguments->children.size() == 5) use_table_cache = safeGetLiteralValue(engine_args[4], engine_name); /// Split into replicas if needed. size_t max_addresses = context->getSettingsRef().glob_expansion_max_elements; auto addresses = parseRemoteDescriptionForExternalDatabase(host_port, max_addresses, 5432); /// no connection is made here auto connection_pool = std::make_shared( postgres_database_name, addresses, username, password, context->getSettingsRef().postgresql_connection_pool_size, context->getSettingsRef().postgresql_connection_pool_wait_timeout); return std::make_shared( context, metadata_path, engine_define, database_name, postgres_database_name, connection_pool, use_table_cache); } else if (engine_name == "MaterializedPostgreSQL") { const ASTFunction * engine = engine_define->engine; if (!engine->arguments || engine->arguments->children.size() != 4) { throw Exception( fmt::format("{} Database require host:port, database_name, username, password arguments ", engine_name), ErrorCodes::BAD_ARGUMENTS); } ASTs & engine_args = engine->arguments->children; for (auto & engine_arg : engine_args) engine_arg = evaluateConstantExpressionOrIdentifierAsLiteral(engine_arg, context); const auto & host_port = safeGetLiteralValue(engine_args[0], engine_name); const auto & postgres_database_name = safeGetLiteralValue(engine_args[1], engine_name); const auto & username = safeGetLiteralValue(engine_args[2], engine_name); const auto & password = safeGetLiteralValue(engine_args[3], engine_name); auto parsed_host_port = parseAddress(host_port, 5432); auto connection_info = postgres::formatConnectionString(postgres_database_name, parsed_host_port.first, parsed_host_port.second, username, password); auto postgresql_replica_settings = std::make_unique(); if (engine_define->settings) postgresql_replica_settings->loadFromQuery(*engine_define); return std::make_shared( context, metadata_path, uuid, engine_define, create.attach, database_name, postgres_database_name, connection_info, std::move(postgresql_replica_settings)); } #endif #if USE_SQLITE else if (engine_name == "SQLite") { const ASTFunction * engine = engine_define->engine; if (!engine->arguments || engine->arguments->children.size() != 1) throw Exception("SQLite database requires 1 argument: database path", ErrorCodes::BAD_ARGUMENTS); const auto & arguments = engine->arguments->children; String database_path = safeGetLiteralValue(arguments[0], "SQLite"); return std::make_shared(context, engine_define, database_path); } #endif throw Exception("Unknown database engine: " + engine_name, ErrorCodes::UNKNOWN_DATABASE_ENGINE); } }