2019-10-22 10:31:28 +00:00
|
|
|
#include <Interpreters/InterpreterInsertQuery.h>
|
2017-07-13 20:58:19 +00:00
|
|
|
|
2020-07-07 09:24:49 +00:00
|
|
|
#include <Access/AccessFlags.h>
|
2017-04-01 09:19:00 +00:00
|
|
|
#include <DataStreams/AddingDefaultBlockOutputStream.h>
|
2019-05-19 05:27:00 +00:00
|
|
|
#include <DataStreams/CheckConstraintsBlockOutputStream.h>
|
2019-02-07 13:18:04 +00:00
|
|
|
#include <DataStreams/CountingBlockOutputStream.h>
|
2019-10-22 10:31:28 +00:00
|
|
|
#include <DataStreams/InputStreamFromASTInsertQuery.h>
|
2017-12-20 07:39:52 +00:00
|
|
|
#include <DataStreams/NullAndDoCopyBlockInputStream.h>
|
|
|
|
#include <DataStreams/PushingToViewsBlockOutputStream.h>
|
|
|
|
#include <DataStreams/SquashingBlockOutputStream.h>
|
2017-04-01 09:19:00 +00:00
|
|
|
#include <DataStreams/copyData.h>
|
2020-12-10 22:05:02 +00:00
|
|
|
#include <IO/ConnectionTimeoutsContext.h>
|
2019-10-22 10:31:28 +00:00
|
|
|
#include <Interpreters/InterpreterSelectWithUnionQuery.h>
|
2020-04-25 11:33:47 +00:00
|
|
|
#include <Interpreters/InterpreterWatchQuery.h>
|
2019-10-22 10:31:28 +00:00
|
|
|
#include <Parsers/ASTFunction.h>
|
2017-04-01 09:19:00 +00:00
|
|
|
#include <Parsers/ASTInsertQuery.h>
|
2020-03-19 16:51:09 +00:00
|
|
|
#include <Parsers/ASTSelectQuery.h>
|
2018-02-25 06:34:20 +00:00
|
|
|
#include <Parsers/ASTSelectWithUnionQuery.h>
|
2020-07-07 09:24:49 +00:00
|
|
|
#include <Parsers/ASTTablesInSelectQuery.h>
|
|
|
|
#include <Processors/Sources/SinkToOutputStream.h>
|
|
|
|
#include <Processors/Sources/SourceFromInputStream.h>
|
2020-11-17 17:16:55 +00:00
|
|
|
#include <Processors/Transforms/ExpressionTransform.h>
|
2020-03-19 16:51:09 +00:00
|
|
|
#include <Storages/StorageDistributed.h>
|
2021-01-05 03:22:06 +00:00
|
|
|
#include <Storages/StorageMaterializedView.h>
|
2017-11-02 14:01:11 +00:00
|
|
|
#include <TableFunctions/TableFunctionFactory.h>
|
2019-10-22 10:31:28 +00:00
|
|
|
#include <Common/checkStackSize.h>
|
2020-12-14 03:30:39 +00:00
|
|
|
#include <Interpreters/QueryLog.h>
|
2020-09-03 17:51:16 +00:00
|
|
|
#include <Interpreters/TranslateQualifiedNamesVisitor.h>
|
|
|
|
#include <Interpreters/getTableExpressions.h>
|
2020-12-01 09:10:12 +00:00
|
|
|
#include <Interpreters/processColumnTransformers.h>
|
2021-04-22 18:10:56 +00:00
|
|
|
#include <DataTypes/DataTypeNullable.h>
|
|
|
|
#include <Columns/ColumnNullable.h>
|
2016-10-24 02:02:37 +00:00
|
|
|
|
2018-02-19 03:00:16 +00:00
|
|
|
|
2011-10-30 11:30:52 +00:00
|
|
|
namespace DB
|
|
|
|
{
|
2018-02-19 03:00:16 +00:00
|
|
|
|
2016-01-11 21:46:36 +00:00
|
|
|
/// Error codes thrown from this file. They are only declared here (`extern`);
/// the definitions live elsewhere in the project.
namespace ErrorCodes
{
    extern const int DUPLICATE_COLUMN;
    extern const int ILLEGAL_COLUMN;
    extern const int NO_SUCH_COLUMN_IN_TABLE;
}
|
|
|
|
|
2018-01-12 13:03:19 +00:00
|
|
|
/// Creates an interpreter for one INSERT query.
///
/// The arguments are stored unchanged and consulted later:
///  - allow_materialized_: when false, naming a MATERIALIZED column as an insert target is rejected;
///  - no_squash_: when true, execute() does not add the block-squashing stream;
///  - no_destination_: forwarded to the views-pushing output stream, and makes the
///    column-less sample block include the table's virtual columns.
InterpreterInsertQuery::InterpreterInsertQuery(
    const ASTPtr & query_ptr_,
    ContextPtr context_,
    bool allow_materialized_,
    bool no_squash_,
    bool no_destination_)
    : WithContext(context_)
    , query_ptr(query_ptr_)
    , allow_materialized(allow_materialized_)
    , no_squash(no_squash_)
    , no_destination(no_destination_)
{
    /// NOTE(review): presumably guards against too deep interpreter nesting - confirm against checkStackSize().
    checkStackSize();
}
|
|
|
|
|
|
|
|
|
2020-01-24 16:20:36 +00:00
|
|
|
/// Returns the storage the INSERT writes to.
///
/// For `INSERT INTO FUNCTION ...` the storage is produced by executing the table function.
/// Otherwise `query.table_id` is resolved through the context (and written back into the query)
/// and the table is looked up in the database catalog.
StoragePtr InterpreterInsertQuery::getTable(ASTInsertQuery & query)
{
    if (!query.table_function)
    {
        /// The resolved id is stored in the AST, so later readers of `query.table_id` see the resolved value.
        query.table_id = getContext()->resolveStorageID(query.table_id);
        return DatabaseCatalog::instance().getTable(query.table_id, getContext());
    }

    const auto & table_function_factory = TableFunctionFactory::instance();
    TableFunctionPtr function = table_function_factory.get(query.table_function, getContext());
    return function->execute(query.table_function, getContext(), function->getName());
}
|
|
|
|
|
2020-06-16 12:48:10 +00:00
|
|
|
/// Builds the header (column names and types) of the blocks this INSERT accepts.
///
/// Without an explicit column list the result is the table's non-materialized sample block,
/// or - when `no_destination` is set - the sample block extended with virtual columns.
/// With a column list, the result contains exactly the listed columns, in the listed order.
///
/// Throws NO_SUCH_COLUMN_IN_TABLE for an unknown column, ILLEGAL_COLUMN for a MATERIALIZED
/// column when `allow_materialized` is false, and DUPLICATE_COLUMN for a repeated column.
Block InterpreterInsertQuery::getSampleBlock(
    const ASTInsertQuery & query,
    const StoragePtr & table,
    const StorageMetadataPtr & metadata_snapshot) const
{
    Block non_materialized_sample = metadata_snapshot->getSampleBlockNonMaterialized();

    /// No column list in the query: take the structure straight from the table metadata.
    if (!query.columns)
    {
        if (no_destination)
            return metadata_snapshot->getSampleBlockWithVirtuals(table->getVirtuals());

        return non_materialized_sample;
    }

    Block full_sample = metadata_snapshot->getSampleBlock();

    const auto columns_ast = processColumnTransformers(getContext()->getCurrentDatabase(), table, metadata_snapshot, query.columns);

    /// Assemble the header from the column names given in the query.
    Block header;
    for (const auto & column_ast : columns_ast->children)
    {
        const std::string column_name = column_ast->getColumnName();

        /// Unknown column.
        if (!full_sample.has(column_name))
        {
            throw Exception(
                "No such column " + column_name + " in table " + table->getStorageID().getNameForLogs(),
                ErrorCodes::NO_SUCH_COLUMN_IN_TABLE);
        }

        /// Present in the full sample but not in the non-materialized one.
        if (!allow_materialized && !non_materialized_sample.has(column_name))
        {
            throw Exception(
                "Cannot insert column " + column_name + ", because it is MATERIALIZED column.",
                ErrorCodes::ILLEGAL_COLUMN);
        }

        if (header.has(column_name))
        {
            throw Exception(
                "Column " + column_name + " specified more than once",
                ErrorCodes::DUPLICATE_COLUMN);
        }

        const auto & table_column = full_sample.getByName(column_name);
        header.insert(ColumnWithTypeAndName(table_column.type, column_name));
    }

    return header;
}
|
2012-03-19 12:57:56 +00:00
|
|
|
|
2011-10-30 11:30:52 +00:00
|
|
|
|
2020-08-24 14:29:31 +00:00
|
|
|
/** A query that just reads all data without any complex computations or filetering.
|
|
|
|
* If we just pipe the result to INSERT, we don't have to use too many threads for read.
|
|
|
|
*/
|
2020-11-02 05:28:37 +00:00
|
|
|
static bool isTrivialSelect(const ASTPtr & select)
|
2020-08-24 14:29:31 +00:00
|
|
|
{
|
2020-11-02 08:02:35 +00:00
|
|
|
if (auto * select_query = select->as<ASTSelectQuery>())
|
2020-11-02 05:28:37 +00:00
|
|
|
{
|
|
|
|
const auto & tables = select_query->tables();
|
2020-08-24 14:29:31 +00:00
|
|
|
|
2020-11-02 05:28:37 +00:00
|
|
|
if (!tables)
|
|
|
|
return false;
|
2020-08-24 14:29:31 +00:00
|
|
|
|
2020-11-02 05:28:37 +00:00
|
|
|
const auto & tables_in_select_query = tables->as<ASTTablesInSelectQuery &>();
|
2020-08-24 14:29:31 +00:00
|
|
|
|
2020-11-02 05:28:37 +00:00
|
|
|
if (tables_in_select_query.children.size() != 1)
|
|
|
|
return false;
|
2020-08-24 14:29:31 +00:00
|
|
|
|
2020-11-02 05:28:37 +00:00
|
|
|
const auto & child = tables_in_select_query.children.front();
|
|
|
|
const auto & table_element = child->as<ASTTablesInSelectQueryElement &>();
|
|
|
|
const auto & table_expr = table_element.table_expression->as<ASTTableExpression &>();
|
2020-08-24 14:29:31 +00:00
|
|
|
|
2020-11-02 05:28:37 +00:00
|
|
|
if (table_expr.subquery)
|
|
|
|
return false;
|
2020-08-24 14:29:31 +00:00
|
|
|
|
2020-11-02 05:28:37 +00:00
|
|
|
/// Note: how to write it in more generic way?
|
|
|
|
return (!select_query->distinct
|
|
|
|
&& !select_query->limit_with_ties
|
|
|
|
&& !select_query->prewhere()
|
|
|
|
&& !select_query->where()
|
|
|
|
&& !select_query->groupBy()
|
|
|
|
&& !select_query->having()
|
|
|
|
&& !select_query->orderBy()
|
|
|
|
&& !select_query->limitBy());
|
|
|
|
}
|
|
|
|
/// This query is ASTSelectWithUnionQuery subquery
|
|
|
|
return false;
|
2020-08-24 14:29:31 +00:00
|
|
|
};
|
|
|
|
|
|
|
|
|
2014-03-20 10:59:45 +00:00
|
|
|
/// Builds everything needed to run the INSERT and returns it as a BlockIO.
///
/// Steps, in order:
///  1. Resolve the target table, take a share lock, snapshot its metadata and check INSERT access
///     (the access check is skipped for table functions).
///  2. For INSERT SELECT into a remote table with `parallel_distributed_insert_select`, let the
///     storage build the whole pipeline itself (`distributedWrite`).
///  3. Otherwise build the source pipeline (SELECT or WATCH) and a chain of output streams per
///     insert thread: storage / views -> constraints check -> adding defaults -> squashing -> counting.
///  4. Connect source and outputs depending on the query kind:
///       - INSERT SELECT / INSERT WATCH: convert the source header by position and attach sinks;
///       - INSERT with inline data and no tail: `res.in` parses the data and copies it into the output;
///       - plain INSERT: the output stream is returned in `res.out` for the caller to feed.
///
/// Throws ILLEGAL_COLUMN if, for INSERT SELECT / WATCH, the output header contains a MATERIALIZED
/// column while `allow_materialized` is false.
BlockIO InterpreterInsertQuery::execute()
{
    const Settings & settings = getContext()->getSettingsRef();
    auto & query = query_ptr->as<ASTInsertQuery &>();

    BlockIO res;

    StoragePtr table = getTable(query);
    auto table_lock = table->lockForShare(getContext()->getInitialQueryId(), settings.lock_acquire_timeout);
    auto metadata_snapshot = table->getInMemoryMetadataPtr();

    auto query_sample_block = getSampleBlock(query, table, metadata_snapshot);
    if (!query.table_function)
        getContext()->checkAccess(AccessType::INSERT, query.table_id, query_sample_block.getNames());

    bool is_distributed_insert_select = false;

    if (query.select && table->isRemote() && settings.parallel_distributed_insert_select)
    {
        /// Distributed INSERT SELECT: the storage may build the complete pipeline on its own.
        if (auto maybe_pipeline = table->distributedWrite(query, getContext()))
        {
            res.pipeline = std::move(*maybe_pipeline);
            is_distributed_insert_select = true;
        }
    }

    BlockOutputStreams out_streams;
    if (!is_distributed_insert_select || query.watch)
    {
        size_t out_streams_size = 1;
        if (query.select)
        {
            bool is_trivial_insert_select = false;

            if (settings.optimize_trivial_insert_select)
            {
                const auto & select_query = query.select->as<ASTSelectWithUnionQuery &>();
                const auto & selects = select_query.list_of_selects->children;
                const auto & union_modes = select_query.list_of_modes;

                /// ASTSelectWithUnionQuery is not normalized now, so it may pass some queries which can be Trivial select queries
                is_trivial_insert_select
                    = std::all_of(
                          union_modes.begin(),
                          union_modes.end(),
                          [](const ASTSelectWithUnionQuery::Mode & mode) { return mode == ASTSelectWithUnionQuery::Mode::ALL; })
                    && std::all_of(selects.begin(), selects.end(), [](const ASTPtr & select) { return isTrivialSelect(select); });
            }

            if (is_trivial_insert_select)
            {
                /** When doing trivial INSERT INTO ... SELECT ... FROM table,
                  * don't need to process SELECT with more than max_insert_threads
                  * and it's reasonable to set block size for SELECT to the desired block size for INSERT
                  * to avoid unnecessary squashing.
                  */

                Settings new_settings = getContext()->getSettings();

                new_settings.max_threads = std::max<UInt64>(1, settings.max_insert_threads);

                if (table->prefersLargeBlocks())
                {
                    if (settings.min_insert_block_size_rows)
                        new_settings.max_block_size = settings.min_insert_block_size_rows;
                    if (settings.min_insert_block_size_bytes)
                        new_settings.preferred_block_size_bytes = settings.min_insert_block_size_bytes;
                }

                /// The SELECT runs in a copy of the context so the adjusted settings do not leak into the INSERT itself.
                auto new_context = Context::createCopy(context);
                new_context->setSettings(new_settings);

                InterpreterSelectWithUnionQuery interpreter_select{
                    query.select, new_context, SelectQueryOptions(QueryProcessingStage::Complete, 1)};
                res = interpreter_select.execute();
            }
            else
            {
                /// Passing 1 as subquery_depth will disable limiting size of intermediate result.
                InterpreterSelectWithUnionQuery interpreter_select{
                    query.select, getContext(), SelectQueryOptions(QueryProcessingStage::Complete, 1)};
                res = interpreter_select.execute();
            }

            res.pipeline.dropTotalsAndExtremes();

            if (table->supportsParallelInsert() && settings.max_insert_threads > 1)
                out_streams_size = std::min(size_t(settings.max_insert_threads), res.pipeline.getNumStreams());

            res.pipeline.resize(out_streams_size);

            /// Allow inserting Nullable into non-Nullable columns; NULL values will be replaced by default values.
            if (settings.insert_null_as_default)
            {
                const auto & input_columns = res.pipeline.getHeader().getColumnsWithTypeAndName();
                const auto & query_columns = query_sample_block.getColumnsWithTypeAndName();
                const auto & output_columns = metadata_snapshot->getColumns();

                if (input_columns.size() == query_columns.size())
                {
                    for (size_t col_idx = 0; col_idx < query_columns.size(); ++col_idx)
                    {
                        /// Change query sample block columns to Nullable to allow inserting nullable columns, where NULL values will be substituted with
                        /// default column values (in AddingDefaultBlockOutputStream), so all values will be cast correctly.
                        if (input_columns[col_idx].type->isNullable() && !query_columns[col_idx].type->isNullable() && output_columns.hasDefault(query_columns[col_idx].name))
                            query_sample_block.setColumn(col_idx, ColumnWithTypeAndName(makeNullable(query_columns[col_idx].column), makeNullable(query_columns[col_idx].type), query_columns[col_idx].name));
                    }
                }
            }
        }
        else if (query.watch)
        {
            InterpreterWatchQuery interpreter_watch{ query.watch, getContext() };
            res = interpreter_watch.execute();
            res.pipeline.init(Pipe(std::make_shared<SourceFromInputStream>(std::move(res.in))));
        }

        /// Same for every output stream, so computed once before the loop.
        const bool null_as_default = query.select && settings.insert_null_as_default;

        for (size_t i = 0; i < out_streams_size; i++)
        {
            /// We create a pipeline of several streams, into which we will write data.
            BlockOutputStreamPtr out;

            /// NOTE: we explicitly ignore bound materialized views when inserting into Kafka Storage.
            ///       Otherwise we'll get duplicates when MV reads same rows again from Kafka.
            if (table->noPushingToViews() && !no_destination)
                out = table->write(query_ptr, metadata_snapshot, getContext());
            else
                out = std::make_shared<PushingToViewsBlockOutputStream>(table, metadata_snapshot, getContext(), query_ptr, no_destination);

            /// Note that we wrap transforms one on top of another, so we write them in reverse of data processing order.

            /// Checking constraints. It must be done after calculation of all defaults, so we can check them on calculated columns.
            if (const auto & constraints = metadata_snapshot->getConstraints(); !constraints.empty())
                out = std::make_shared<CheckConstraintsBlockOutputStream>(
                    query.table_id, out, out->getHeader(), constraints, getContext());

            /// Actually we don't know structure of input blocks from query/table,
            /// because some clients break insertion protocol (columns != header)
            out = std::make_shared<AddingDefaultBlockOutputStream>(
                out, query_sample_block, metadata_snapshot->getColumns(), getContext(), null_as_default);

            /// It's important to squash blocks as early as possible (before other transforms),
            ///  because other transforms may work inefficiently if block size is small.

            /// Do not squash blocks if it is a sync INSERT into Distributed, since it leads to double bufferization on client and server side.
            /// Client-side bufferization might cause excessive timeouts (especially in case of big blocks).
            if (!(settings.insert_distributed_sync && table->isRemote()) && !no_squash && !query.watch)
            {
                bool table_prefers_large_blocks = table->prefersLargeBlocks();

                out = std::make_shared<SquashingBlockOutputStream>(
                    out,
                    out->getHeader(),
                    table_prefers_large_blocks ? settings.min_insert_block_size_rows : settings.max_block_size,
                    table_prefers_large_blocks ? settings.min_insert_block_size_bytes : 0);
            }

            auto out_wrapper = std::make_shared<CountingBlockOutputStream>(out);
            out_wrapper->setProcessListElement(getContext()->getProcessListElement());
            out_streams.emplace_back(std::move(out_wrapper));
        }
    }

    /// What type of query: INSERT or INSERT SELECT or INSERT WATCH?
    if (is_distributed_insert_select)
    {
        /// Pipeline was already built.
    }
    else if (query.select || query.watch)
    {
        const auto & header = out_streams.at(0)->getHeader();

        /// Source columns are matched to destination columns by position, not by name.
        auto actions_dag = ActionsDAG::makeConvertingActions(
                res.pipeline.getHeader().getColumnsWithTypeAndName(),
                header.getColumnsWithTypeAndName(),
                ActionsDAG::MatchColumnsMode::Position);
        auto actions = std::make_shared<ExpressionActions>(actions_dag, ExpressionActionsSettings::fromContext(getContext(), CompileExpressions::yes));

        res.pipeline.addSimpleTransform([&](const Block & in_header) -> ProcessorPtr
        {
            return std::make_shared<ExpressionTransform>(in_header, actions);
        });

        res.pipeline.setSinks([&](const Block &, QueryPipeline::StreamType type) -> ProcessorPtr
        {
            if (type != QueryPipeline::StreamType::Main)
                return nullptr;

            /// Each main stream takes ownership of one of the prepared output streams.
            auto stream = std::move(out_streams.back());
            out_streams.pop_back();

            return std::make_shared<SinkToOutputStream>(std::move(stream));
        });

        if (!allow_materialized)
        {
            for (const auto & column : metadata_snapshot->getColumns())
                if (column.default_desc.kind == ColumnDefaultKind::Materialized && header.has(column.name))
                    throw Exception("Cannot insert column " + column.name + ", because it is MATERIALIZED column.", ErrorCodes::ILLEGAL_COLUMN);
        }
    }
    else if (query.data && !query.has_tail) /// can execute without additional data
    {
        res.in = std::make_shared<InputStreamFromASTInsertQuery>(query_ptr, nullptr, query_sample_block, getContext(), nullptr);
        res.in = std::make_shared<NullAndDoCopyBlockInputStream>(res.in, out_streams.at(0));
    }
    else
        res.out = std::move(out_streams.at(0));

    /// Hand the storage (and, for a materialized view, its target table if available) to the pipeline as a holder.
    res.pipeline.addStorageHolder(table);
    if (const auto * mv = dynamic_cast<const StorageMaterializedView *>(table.get()))
    {
        if (auto inner_table = mv->tryGetTargetTable())
            res.pipeline.addStorageHolder(inner_table);
    }

    return res;
}
|
|
|
|
|
2018-02-19 00:45:32 +00:00
|
|
|
|
2020-03-02 20:23:58 +00:00
|
|
|
/// Returns a copy of the target table id stored in the INSERT query AST.
StorageID InterpreterInsertQuery::getDatabaseTable() const
{
    const auto & insert_query = query_ptr->as<ASTInsertQuery &>();
    return insert_query.table_id;
}
|
|
|
|
|
2020-12-14 03:30:39 +00:00
|
|
|
|
2021-04-10 23:33:54 +00:00
|
|
|
/// Fills INSERT-specific fields of a query log element.
/// Always sets the query kind; adds the insertion table (and its database) taken from
/// `context_` only when the context reports a non-empty insertion table.
void InterpreterInsertQuery::extendQueryLogElemImpl(QueryLogElement & elem, const ASTPtr &, ContextPtr context_) const
{
    elem.query_kind = "Insert";

    const auto & target_table = context_->getInsertionTable();
    if (target_table.empty())
        return;

    elem.query_databases.insert(target_table.getDatabaseName());
    elem.query_tables.insert(target_table.getFullNameNotQuoted());
}
|
|
|
|
|
2011-10-30 11:30:52 +00:00
|
|
|
}
|