ClickHouse/dbms/src/Interpreters/Aggregator.cpp

#include <iomanip>
#include <thread>
#include <future>

#include <cxxabi.h>

#include <DB/Common/Stopwatch.h>
#include <DB/Common/setThreadName.h>

#include <DB/DataTypes/DataTypeAggregateFunction.h>
#include <DB/Columns/ColumnsNumber.h>
#include <DB/Columns/ColumnArray.h>
#include <DB/AggregateFunctions/AggregateFunctionCount.h>
#include <DB/DataStreams/IProfilingBlockInputStream.h>
#include <DB/DataStreams/NativeBlockOutputStream.h>
#include <DB/DataStreams/NullBlockInputStream.h>
#include <DB/IO/WriteBufferFromFile.h>
#include <DB/IO/CompressedWriteBuffer.h>

#include <DB/Interpreters/Aggregator.h>
#include <common/ClickHouseRevision.h>


namespace DB
{

/// Error codes referenced by this file. They are only declared here (extern), not defined.
/// NOTE(review): ErrorCodes::LOGICAL_ERROR and ErrorCodes::UNKNOWN_AGGREGATED_DATA_VARIANT are also used
///  below but are not declared in this list - presumably they come from an included header; confirm.
namespace ErrorCodes
{
	extern const int CANNOT_COMPILE_CODE;
	extern const int TOO_MUCH_ROWS;
	extern const int EMPTY_DATA_PASSED;
	extern const int CANNOT_MERGE_DIFFERENT_AGGREGATED_DATA_VARIANTS;
}


/** Destroys the aggregate function states held by this object, if there is anything to destroy.
  * Exceptions are logged and never leave the destructor.
  */
AggregatedDataVariants::~AggregatedDataVariants()
{
	/// No aggregator attached - the states are not ours to destroy.
	if (!aggregator)
		return;

	/// Every state is trivially destructible - nothing to do.
	if (aggregator->all_aggregates_has_trivial_destructor)
		return;

	try
	{
		aggregator->destroyAllAggregateStates(*this);
	}
	catch (...)
	{
		tryLogCurrentException(__PRETTY_FUNCTION__);
	}
}


/** Replaces the currently held single-level aggregation data with its two-level counterpart.
  * For every variant listed by APPLY_FOR_VARIANTS_CONVERTIBLE_TO_TWO_LEVEL the two-level structure is
  *  constructed from the existing one, the old structure is released and `type` is switched.
  * Throws LOGICAL_ERROR for any other variant.
  */
void AggregatedDataVariants::convertToTwoLevel()
{
	if (aggregator)
		LOG_TRACE(aggregator->log, "Converting aggregation data to two-level.");

	switch (type)
	{
	/// One `case` per convertible variant: build NAME_two_level from *NAME, drop NAME, update the type tag.
	#define M(NAME) \
		case Type::NAME: \
			NAME ## _two_level.reset(new decltype(NAME ## _two_level)::element_type(*NAME)); \
			NAME.reset(); \
			type = Type::NAME ## _two_level; \
			break;

		APPLY_FOR_VARIANTS_CONVERTIBLE_TO_TWO_LEVEL(M)

	#undef M

		/// Any variant not covered by the macro list above cannot be converted.
		default:
			throw Exception("Wrong data variant passed.", ErrorCodes::LOGICAL_ERROR);
	}
}


void Aggregator::Params::calculateColumnNumbers(const Block & block)
{
	if (keys.empty() && !key_names.empty())
		for (Names::const_iterator it = key_names.begin(); it != key_names.end(); ++it)
			keys.push_back(block.getPositionByName(*it));

	for (AggregateDescriptions::iterator it = aggregates.begin(); it != aggregates.end(); ++it)
		if (it->arguments.empty() && !it->argument_names.empty())
			for (Names::const_iterator jt = it->argument_names.begin(); jt != it->argument_names.end(); ++jt)
				it->arguments.push_back(block.getPositionByName(*jt));
}


/** One-time initialization, performed under the mutex.
  * Caches raw pointers to the aggregate functions, computes the offset of every state inside
  *  a row of states and, if a non-empty block is given, resolves column numbers and builds
  *  the sample block describing the result (unless a sample is already set).
  * Returns early at several points if the query has been cancelled.
  */
void Aggregator::initialize(const Block & block)
{
	if (isCancelled())
		return;

	std::lock_guard<std::mutex> lock(mutex);

	if (initialized)
		return;

	initialized = true;

	if (current_memory_tracker)
		memory_usage_before_aggregation = current_memory_tracker->get();

	aggregate_functions.resize(params.aggregates_size);
	for (size_t idx = 0; idx < params.aggregates_size; ++idx)
		aggregate_functions[idx] = params.aggregates[idx].function.get();

	/// Initialize the sizes of the states and the offsets for the aggregate functions.
	offsets_of_aggregate_states.resize(params.aggregates_size);
	total_size_of_aggregate_states = 0;
	all_aggregates_has_trivial_destructor = true;

	for (size_t idx = 0; idx < params.aggregates_size; ++idx)
	{
		auto & function = params.aggregates[idx].function;

		/// Each state starts where the previous one ended.
		offsets_of_aggregate_states[idx] = total_size_of_aggregate_states;
		total_size_of_aggregate_states += function->sizeOfData();

		if (!function->hasTrivialDestructor())
			all_aggregates_has_trivial_destructor = false;
	}

	if (isCancelled())
		return;

	/** Everything below is done only if a non-empty block was passed
	  *  (it is not needed when merging blocks with ready states of aggregate functions).
	  */
	if (!block)
		return;

	/// Convert column names to numbers if the numbers are not set.
	params.calculateColumnNumbers(block);

	if (isCancelled())
		return;

	/// Create a sample block describing the result.
	if (!sample)
	{
		/// Key columns first; constant columns are replaced by full ones.
		for (size_t key_idx = 0; key_idx < params.keys_size; ++key_idx)
		{
			sample.insert(block.getByPosition(params.keys[key_idx]).cloneEmpty());

			auto & key_column = sample.getByPosition(key_idx).column;
			if (auto full_column = key_column->convertToFullColumnIfConst())
				key_column = full_column;
		}

		/// Then one column of aggregate function states per aggregate.
		for (size_t agg_idx = 0; agg_idx < params.aggregates_size; ++agg_idx)
		{
			auto & description = params.aggregates[agg_idx];

			const size_t arguments_size = description.arguments.size();
			DataTypes argument_types(arguments_size);
			for (size_t arg_idx = 0; arg_idx < arguments_size; ++arg_idx)
				argument_types[arg_idx] = block.getByPosition(description.arguments[arg_idx]).type;

			ColumnWithTypeAndName col;
			col.name = description.column_name;
			col.type = std::make_shared<DataTypeAggregateFunction>(description.function, argument_types, description.parameters);
			col.column = col.type->createColumn();

			sample.insert(std::move(col));
		}
	}
}


/// Sets the sample block to an empty clone of `block`, unless a sample is already present. Done under the mutex.
void Aggregator::setSampleBlock(const Block & block)
{
	std::lock_guard<std::mutex> guard(mutex);

	if (!sample)
	{
		/// Only the structure is kept, not the data.
		sample = block.cloneEmpty();
	}
}


/** Requests dynamically compiled, specialized aggregation code for the given data variant.
  *
  * Runs its body at most once per Aggregator (guarded by the mutex and the compiled_if_possible flag).
  * Builds a key out of the hash table method type and the demangled types of the aggregate functions,
  *  and passes it to params.compiler->getOrCount together with a generator of the source code
  *  (explicit template instantiations plus getPtr / getPtrTwoLevel accessors) and a callback that
  *  stores the resulting function pointers into compiled_data.
  *
  * Throws UNKNOWN_AGGREGATED_DATA_VARIANT for an unknown `type`
  *  and CANNOT_COMPILE_CODE if a type name of an aggregate function cannot be demangled.
  */
void Aggregator::compileIfPossible(AggregatedDataVariants::Type type)
{
	std::lock_guard<std::mutex> lock(mutex);

	if (compiled_if_possible)
		return;

	compiled_if_possible = true;

	std::string method_typename;
	std::string method_typename_two_level;

	if (false) {}
#define M(NAME) \
	else if (type == AggregatedDataVariants::Type::NAME) \
	{ \
		method_typename = "decltype(AggregatedDataVariants::" #NAME ")::element_type"; \
		method_typename_two_level = "decltype(AggregatedDataVariants::" #NAME "_two_level)::element_type"; \
	}

	APPLY_FOR_VARIANTS_CONVERTIBLE_TO_TWO_LEVEL(M)
#undef M

#define M(NAME) \
	else if (type == AggregatedDataVariants::Type::NAME) \
		method_typename = "decltype(AggregatedDataVariants::" #NAME ")::element_type";

	APPLY_FOR_VARIANTS_NOT_CONVERTIBLE_TO_TWO_LEVEL(M)
#undef M
	else if (type == AggregatedDataVariants::Type::without_key) {}
	else
		throw Exception("Unknown aggregated data variant.", ErrorCodes::UNKNOWN_AGGREGATED_DATA_VARIANT);

	/// List of the types of the aggregate functions.
	std::stringstream aggregate_functions_typenames_str;
	for (size_t i = 0; i < params.aggregates_size; ++i)
	{
		IAggregateFunction & func = *aggregate_functions[i];

		int status = 0;
		char * type_name_ptr = abi::__cxa_demangle(typeid(func).name(), nullptr, nullptr, &status);

		/// On failure __cxa_demangle returns a null pointer, which must not be turned into std::string.
		/// So the result is validated before it is used.
		if (status || !type_name_ptr)
		{
			free(type_name_ptr);
			throw Exception("Cannot compile code: cannot demangle name " + String(typeid(func).name())
				+ ", status: " + toString(status), ErrorCodes::CANNOT_COMPILE_CODE);
		}

		std::string type_name = type_name_ptr;
		free(type_name_ptr);

		aggregate_functions_typenames_str << ((i != 0) ? ", " : "") << type_name;
	}

	std::string aggregate_functions_typenames = aggregate_functions_typenames_str.str();

	/// The key identifies the combination of the method and the aggregate functions.
	std::stringstream key_str;
	key_str << "Aggregate: ";
	if (!method_typename.empty())
		key_str << method_typename + ", ";
	key_str << aggregate_functions_typenames;
	std::string key = key_str.str();

	auto get_code = [method_typename, method_typename_two_level, aggregate_functions_typenames]
	{
		/// A short piece of code that is an explicit instantiation of the template.
		std::stringstream code;
		code <<		/// No explicit inclusion of the header file. It is included with the compiler option -include.
			"namespace DB\n"
			"{\n"
			"\n";

		/// There can be up to two instantiations of the template - for the ordinary and the two_level variants.
		auto append_code_for_specialization =
			[&code, &aggregate_functions_typenames] (const std::string & method_typename, const std::string & suffix)
		{
			code <<
				"template void Aggregator::executeSpecialized<\n"
					"\t" << method_typename << ", TypeList<" << aggregate_functions_typenames << ">>(\n"
					"\t" << method_typename << " &, Arena *, size_t, ConstColumnPlainPtrs &,\n"
					"\tAggregateColumns &, const Sizes &, StringRefs &, bool, AggregateDataPtr) const;\n"
				"\n"
				"static void wrapper" << suffix << "(\n"
					"\tconst Aggregator & aggregator,\n"
					"\t" << method_typename << " & method,\n"
					"\tArena * arena,\n"
					"\tsize_t rows,\n"
					"\tConstColumnPlainPtrs & key_columns,\n"
					"\tAggregator::AggregateColumns & aggregate_columns,\n"
					"\tconst Sizes & key_sizes,\n"
					"\tStringRefs & keys,\n"
					"\tbool no_more_keys,\n"
					"\tAggregateDataPtr overflow_row)\n"
				"{\n"
					"\taggregator.executeSpecialized<\n"
						"\t\t" << method_typename << ", TypeList<" << aggregate_functions_typenames << ">>(\n"
						"\t\tmethod, arena, rows, key_columns, aggregate_columns, key_sizes, keys, no_more_keys, overflow_row);\n"
				"}\n"
				"\n"
				"void * getPtr" << suffix << "() __attribute__((__visibility__(\"default\")));\n"
				"void * getPtr" << suffix << "()\n"	/// Without this wrapper it is unclear how to get the needed symbol out of the compiled library.
				"{\n"
					"\treturn reinterpret_cast<void *>(&wrapper" << suffix << ");\n"
				"}\n";
		};

		if (!method_typename.empty())
			append_code_for_specialization(method_typename, "");
		else
		{
			/// For the without_key method.
			code <<
				"template void Aggregator::executeSpecializedWithoutKey<\n"
					"\t" << "TypeList<" << aggregate_functions_typenames << ">>(\n"
					"\tAggregatedDataWithoutKey &, size_t, AggregateColumns &) const;\n"
				"\n"
				"static void wrapper(\n"
					"\tconst Aggregator & aggregator,\n"
					"\tAggregatedDataWithoutKey & method,\n"
					"\tsize_t rows,\n"
					"\tAggregator::AggregateColumns & aggregate_columns)\n"
				"{\n"
					"\taggregator.executeSpecializedWithoutKey<\n"
						"\t\tTypeList<" << aggregate_functions_typenames << ">>(\n"
						"\t\tmethod, rows, aggregate_columns);\n"
				"}\n"
				"\n"
				"void * getPtr() __attribute__((__visibility__(\"default\")));\n"
				"void * getPtr()\n"
				"{\n"
					"\treturn reinterpret_cast<void *>(&wrapper);\n"
				"}\n";
		}

		if (!method_typename_two_level.empty())
			append_code_for_specialization(method_typename_two_level, "TwoLevel");
		else
		{
			/// A stub.
			code <<
				"void * getPtrTwoLevel() __attribute__((__visibility__(\"default\")));\n"
				"void * getPtrTwoLevel()\n"
				"{\n"
					"\treturn nullptr;\n"
				"}\n";
		}

		code <<
			"}\n";

		return code.str();
	};

	/// The callback holds its own shared reference to compiled_data, so it can run after the Aggregator is gone.
	auto compiled_data_owned_by_callback = compiled_data;
	auto on_ready = [compiled_data_owned_by_callback] (SharedLibraryPtr & lib)
	{
		if (compiled_data_owned_by_callback.unique())	/// The Aggregator is already destroyed.
			return;

		/// The symbol names are the mangled forms of DB::getPtr() and DB::getPtrTwoLevel() from the generated code.
		compiled_data_owned_by_callback->compiled_aggregator = lib;
		compiled_data_owned_by_callback->compiled_method_ptr = lib->get<void * (*) ()>("_ZN2DB6getPtrEv")();
		compiled_data_owned_by_callback->compiled_two_level_method_ptr = lib->get<void * (*) ()>("_ZN2DB14getPtrTwoLevelEv")();
	};

	/** If the library has already been compiled, a non-null SharedLibraryPtr is returned.
	  * If the library has not been compiled, the counter is incremented and nullptr is returned.
	  * If the counter has reached min_count_to_compile, compilation is started asynchronously (in a separate thread),
	  *  and the on_ready callback is called when it finishes.
	  */
	SharedLibraryPtr lib = params.compiler->getOrCount(key, params.min_count_to_compile,
		"-include /usr/share/clickhouse/headers/dbms/include/DB/Interpreters/SpecializedAggregator.h",
		get_code, on_ready);

	/// If the result is already available.
	if (lib)
		on_ready(lib);
}


/** Chooses the aggregation data variant from the key columns and fills key_sizes for fixed-size keys.
  *
  * Returns ordinary (not two-level) methods, because processing starts with them.
  * Later, during processing, the data may be converted to the two-level structure if it becomes large.
  *
  * NOTE AggregatedDataVariants::Type::hashed is not used.
  */
AggregatedDataVariants::Type Aggregator::chooseAggregationMethod(const ConstColumnPlainPtrs & key_columns, Sizes & key_sizes)
{
	using VariantType = AggregatedDataVariants::Type;

	bool every_key_is_fixed = true;
	size_t total_fixed_bytes = 0;

	size_t array_keys_count = 0;
	bool some_array_has_non_fixed_elems = false;
	bool every_non_array_key_is_fixed = true;

	/// Collect the properties of the key columns.
	key_sizes.resize(params.keys_size);
	for (size_t j = 0; j < params.keys_size; ++j)
	{
		const auto * column = key_columns[j];

		if (column->isFixed())
		{
			key_sizes[j] = column->sizeOfField();
			total_fixed_bytes += key_sizes[j];
			continue;
		}

		every_key_is_fixed = false;

		const ColumnArray * array_column = typeid_cast<const ColumnArray *>(column);
		if (!array_column)
		{
			every_non_array_key_is_fixed = false;
			continue;
		}

		++array_keys_count;
		if (!array_column->getData().isFixed())
			some_array_has_non_fixed_elems = true;
	}

	/// No keys at all.
	if (params.keys_size == 0)
		return VariantType::without_key;

	const bool single_key = (params.keys_size == 1);

	/// A single numeric key that fits into 64 bits.
	if (single_key && key_columns[0]->isNumericNotNullable())
	{
		switch (key_columns[0]->sizeOfField())
		{
			case 1:
				return VariantType::key8;
			case 2:
				return VariantType::key16;
			case 4:
				return VariantType::key32;
			case 8:
				return VariantType::key64;
			default:
				throw Exception("Logical error: numeric column has sizeOfField not in 1, 2, 4, 8.", ErrorCodes::LOGICAL_ERROR);
		}
	}

	/// If the keys fit into N bits, use a hash table keyed by the keys packed into N bits.
	if (every_key_is_fixed)
	{
		if (total_fixed_bytes <= 16)
			return VariantType::keys128;
		if (total_fixed_bytes <= 32)
			return VariantType::keys256;
	}

	/// A single string key (ordinary or fixed-size) gets a hash table of its own.
	if (single_key)
	{
		if (typeid_cast<const ColumnString *>(key_columns[0]))
			return VariantType::key_string;

		if (typeid_cast<const ColumnFixedString *>(key_columns[0]))
			return VariantType::key_fixed_string;
	}

	/** Arrays among the keys.
	  * With at most one array of fixed-size elements and all other keys of fixed size,
	  *  the concat method is still usable. Otherwise - serialized.
	  */
	const bool needs_serialization = array_keys_count > 1
		|| some_array_has_non_fixed_elems
		|| (array_keys_count == 1 && !every_non_array_key_is_fixed);

	/// Otherwise aggregate by the concatenation of the keys.
	return needs_serialization ? VariantType::serialized : VariantType::concat;
}


/** Creates the states of all aggregate functions in the memory pointed to by aggregate_data.
  * If creating some state throws (for example, when out of memory), the states created so far
  *  are destroyed and the exception is rethrown, so that nothing is left half-initialized.
  */
void Aggregator::createAggregateStates(AggregateDataPtr & aggregate_data) const
{
	/// Number of states that have been successfully created.
	size_t created = 0;

	try
	{
		for (; created < params.aggregates_size; ++created)
			aggregate_functions[created]->create(aggregate_data + offsets_of_aggregate_states[created]);
	}
	catch (...)
	{
		/// Roll back: destroy exactly the states that exist, in creation order.
		for (size_t k = 0; k < created; ++k)
			aggregate_functions[k]->destroy(aggregate_data + offsets_of_aggregate_states[k]);

		throw;
	}
}


/** Initializes the per-block state of the method and dispatches to executeImplCase,
  *  instantiated for the current value of no_more_keys.
  *
  * Interesting: if noinline is removed, gcc inlines this function for some reason, and performance drops (~10%).
  * (Possibly because, after inlining this function, the more inner functions stop being inlined.)
  * Inlining makes no sense, because the inner loop is located entirely inside this function.
  */
template <typename Method>
void NO_INLINE Aggregator::executeImpl(
	Method & method,
	Arena * aggregates_pool,
	size_t rows,
	ConstColumnPlainPtrs & key_columns,
	AggregateFunctionInstruction * aggregate_instructions,
	const Sizes & key_sizes,
	StringRefs & keys,
	bool no_more_keys,
	AggregateDataPtr overflow_row) const
{
	typename Method::State state;
	state.init(key_columns);

	/// The runtime flag becomes a compile-time template argument of the inner loop.
	if (no_more_keys)
	{
		executeImplCase<true>(method, state, aggregates_pool, rows, key_columns, aggregate_instructions, key_sizes, keys, overflow_row);
	}
	else
	{
		executeImplCase<false>(method, state, aggregates_pool, rows, key_columns, aggregate_instructions, key_sizes, keys, overflow_row);
	}
}

#ifndef __clang__
#pragma GCC diagnostic push
#pragma GCC diagnostic ignored "-Wmaybe-uninitialized"
#endif

/** The main aggregation loop over the rows of one block, for a hash table based method.
  *
  * For every row the key is obtained from `state`, then:
  *  - if no_more_keys is false, the key is inserted into method.data (or found there);
  *  - if no_more_keys is true, the key is only looked up; rows with unknown keys go to overflow_row,
  *    or are skipped if overflow_row is null.
  * States of the aggregate functions for a newly inserted key are allocated from aggregates_pool.
  * aggregate_instructions is an array terminated by an element with a null `that`.
  */
template <bool no_more_keys, typename Method>
void NO_INLINE Aggregator::executeImplCase(
	Method & method,
	typename Method::State & state,
	Arena * aggregates_pool,
	size_t rows,
	ConstColumnPlainPtrs & key_columns,
	AggregateFunctionInstruction * aggregate_instructions,
	const Sizes & key_sizes,
	StringRefs & keys,
	AggregateDataPtr overflow_row) const
{
	/// NOTE When editing this code, also pay attention to SpecializedAggregator.h.

	/// For all rows.
	typename Method::iterator it;
	typename Method::Key prev_key;
	for (size_t i = 0; i < rows; ++i)
	{
		bool inserted;			/// Was a new key inserted, or did this key already exist?
		bool overflow = false;	/// The new key did not get into the hash table because of no_more_keys.

		/// Get the key to insert into the hash table.
		typename Method::Key key = state.getKey(key_columns, params.keys_size, i, key_sizes, keys, *aggregates_pool);

		if (!no_more_keys)	/// Insert.
		{
			/// Optimization for consecutive repeating keys: `it` still points to the entry of the previous row.
			if (!Method::no_consecutive_keys_optimization)
			{
				if (i != 0 && key == prev_key)
				{
					/// Add the values to the aggregate functions.
					AggregateDataPtr value = Method::getAggregateData(it->second);
					for (AggregateFunctionInstruction * inst = aggregate_instructions; inst->that; ++inst)
						(*inst->func)(inst->that, value + inst->state_offset, inst->arguments, i);

					method.onExistingKey(key, keys, *aggregates_pool);
					continue;
				}
				else
					prev_key = key;
			}

			method.data.emplace(key, it, inserted);
		}
		else
		{
			/// Add only if the key already exists.
			inserted = false;
			it = method.data.find(key);
			if (method.data.end() == it)
				overflow = true;
		}

		/// If the key did not fit, and the data need not be aggregated into a separate row, there is nothing to do.
		if (no_more_keys && overflow && !overflow_row)
		{
			method.onExistingKey(key, keys, *aggregates_pool);
			continue;
		}

		/// If a new key was inserted - initialize the states of the aggregate functions, and possibly something related to the key.
		if (inserted)
		{
			AggregateDataPtr & aggregate_data = Method::getAggregateData(it->second);

			/// exception-safety - if memory allocation or creation of the states fails, the destructors will not be called.
			aggregate_data = nullptr;

			method.onNewKey(*it, params.keys_size, i, keys, *aggregates_pool);

			AggregateDataPtr place = aggregates_pool->alloc(total_size_of_aggregate_states);
			createAggregateStates(place);
			aggregate_data = place;
		}
		else
			method.onExistingKey(key, keys, *aggregates_pool);

		/// Rows whose key was not found under no_more_keys are accumulated in overflow_row.
		AggregateDataPtr value = (!no_more_keys || !overflow) ? Method::getAggregateData(it->second) : overflow_row;

		/// Add the values to the aggregate functions.
		for (AggregateFunctionInstruction * inst = aggregate_instructions; inst->that; ++inst)
			(*inst->func)(inst->that, value + inst->state_offset, inst->arguments, i);
	}
}

#ifndef __clang__
#pragma GCC diagnostic pop
#endif

/** Aggregation without keys: all rows of the block are added to the single row of states `res`.
  * aggregate_instructions is an array terminated by an element with a null `that`.
  */
void NO_INLINE Aggregator::executeWithoutKeyImpl(
	AggregatedDataWithoutKey & res,
	size_t rows,
	AggregateFunctionInstruction * aggregate_instructions) const
{
	/// Optimization for the case of a single aggregate function count: add the number of rows at once.
	AggregateFunctionCount * agg_count = nullptr;
	if (params.aggregates_size == 1)
		agg_count = typeid_cast<AggregateFunctionCount *>(aggregate_functions[0]);

	if (agg_count)
	{
		agg_count->addDelta(res, rows);
		return;
	}

	/// General case: feed every row to every aggregate function.
	for (size_t row = 0; row < rows; ++row)
	{
		for (AggregateFunctionInstruction * inst = aggregate_instructions; inst->that; ++inst)
			(*inst->func)(inst->that, res + inst->state_offset, inst->arguments, row);
	}
}


/** Aggregates one block into `result`.
  *
  * key_columns, aggregate_columns, key_sizes and key are scratch buffers supplied by the caller;
  *  they are filled here. no_more_keys is an in-out flag that checkLimits may set.
  *
  * Steps: initialize, materialize constant columns, choose the aggregation method on first use
  *  (and request compilation if a compiler is set), run the compiled or the generic implementation,
  *  possibly convert the result to the two-level structure, check limits and possibly
  *  flush the data to a temporary file.
  *
  * Returns false if checkLimits returned false, true otherwise (including when the query is cancelled).
  */
bool Aggregator::executeOnBlock(Block & block, AggregatedDataVariants & result,
	ConstColumnPlainPtrs & key_columns, AggregateColumns & aggregate_columns,
	Sizes & key_sizes, StringRefs & key,
	bool & no_more_keys)
{
	initialize(block);

	if (isCancelled())
		return true;

	/// result will destroy the states of the aggregate functions in its destructor
	result.aggregator = this;

	for (size_t i = 0; i < params.aggregates_size; ++i)
		aggregate_columns[i].resize(params.aggregates[i].arguments.size());

	/** Constant columns are not supported directly during aggregation.
	  * To make them work anyway, materialize them.
	  * This vector keeps the materialized columns alive while raw pointers to them are in use.
	  */
	Columns materialized_columns;

	/// Remember the columns we will work with
	for (size_t i = 0; i < params.keys_size; ++i)
	{
		key_columns[i] = block.getByPosition(params.keys[i]).column.get();

		if (auto converted = key_columns[i]->convertToFullColumnIfConst())
		{
			materialized_columns.push_back(converted);
			key_columns[i] = materialized_columns.back().get();
		}
	}

	/// One instruction per aggregate function plus a terminating element with a null `that`.
	AggregateFunctionInstructions aggregate_functions_instructions(params.aggregates_size + 1);
	aggregate_functions_instructions[params.aggregates_size].that = nullptr;

	for (size_t i = 0; i < params.aggregates_size; ++i)
	{
		for (size_t j = 0; j < aggregate_columns[i].size(); ++j)
		{
			aggregate_columns[i][j] = block.getByPosition(params.aggregates[i].arguments[j]).column.get();

			if (auto converted = aggregate_columns[i][j]->convertToFullColumnIfConst())
			{
				materialized_columns.push_back(converted);
				aggregate_columns[i][j] = materialized_columns.back().get();
			}
		}

		aggregate_functions_instructions[i].that = aggregate_functions[i];
		aggregate_functions_instructions[i].func = aggregate_functions[i]->getAddressOfAddFunction();
		aggregate_functions_instructions[i].state_offset = offsets_of_aggregate_states[i];
		aggregate_functions_instructions[i].arguments = aggregate_columns[i].data();
	}

	if (isCancelled())
		return true;

	size_t rows = block.rows();

	/// Which way to perform the aggregation? Decided once, while the result is still empty.
	if (result.empty())
	{
		result.init(chooseAggregationMethod(key_columns, key_sizes));
		result.keys_size = params.keys_size;
		result.key_sizes = key_sizes;
		LOG_TRACE(log, "Aggregation method: " << result.getMethodName());

		if (params.compiler)
			compileIfPossible(result.type);
	}

	if (isCancelled())
		return true;

	/// Create the single row of states used for aggregation without keys and/or as the overflow row.
	if ((params.overflow_row || result.type == AggregatedDataVariants::Type::without_key) && !result.without_key)
	{
		AggregateDataPtr place = result.aggregates_pool->alloc(total_size_of_aggregate_states);
		createAggregateStates(place);
		result.without_key = place;
	}

	/// Choose one of the aggregation methods and call it.

	/// For the case when there are no keys (aggregate everything into one row).
	if (result.type == AggregatedDataVariants::Type::without_key)
	{
		/// If there is dynamically compiled code.
		if (compiled_data->compiled_method_ptr)
		{
			reinterpret_cast<
				void (*)(const Aggregator &, AggregatedDataWithoutKey &, size_t, AggregateColumns &)>
					(compiled_data->compiled_method_ptr)(*this, result.without_key, rows, aggregate_columns);
		}
		else
			executeWithoutKeyImpl(result.without_key, rows, &aggregate_functions_instructions[0]);
	}
	else
	{
		/// Data that did not fit into max_rows_to_group_by with group_by_overflow_mode = any is written here.
		AggregateDataPtr overflow_row_ptr = params.overflow_row ? result.without_key : nullptr;

		bool is_two_level = result.isTwoLevel();

		/// Compiled code, for the ordinary structure.
		if (!is_two_level && compiled_data->compiled_method_ptr)
		{
		#define M(NAME, IS_TWO_LEVEL) \
			else if (result.type == AggregatedDataVariants::Type::NAME) \
				reinterpret_cast<void (*)( \
					const Aggregator &, decltype(result.NAME)::element_type &, \
					Arena *, size_t, ConstColumnPlainPtrs &, AggregateColumns &, \
					const Sizes &, StringRefs &, bool, AggregateDataPtr)>(compiled_data->compiled_method_ptr) \
				(*this, *result.NAME, result.aggregates_pool, rows, key_columns, aggregate_columns, \
					result.key_sizes, key, no_more_keys, overflow_row_ptr);

			if (false) {}
			APPLY_FOR_AGGREGATED_VARIANTS(M)
		#undef M
		}
		/// Compiled code, for the two-level structure.
		else if (is_two_level && compiled_data->compiled_two_level_method_ptr)
		{
		#define M(NAME) \
			else if (result.type == AggregatedDataVariants::Type::NAME) \
				reinterpret_cast<void (*)( \
					const Aggregator &, decltype(result.NAME)::element_type &, \
					Arena *, size_t, ConstColumnPlainPtrs &, AggregateColumns &, \
					const Sizes &, StringRefs &, bool, AggregateDataPtr)>(compiled_data->compiled_two_level_method_ptr) \
				(*this, *result.NAME, result.aggregates_pool, rows, key_columns, aggregate_columns, \
					result.key_sizes, key, no_more_keys, overflow_row_ptr);

			if (false) {}
			APPLY_FOR_VARIANTS_TWO_LEVEL(M)
		#undef M
		}
		/// When there is no dynamically compiled code.
		else
		{
		#define M(NAME, IS_TWO_LEVEL) \
			else if (result.type == AggregatedDataVariants::Type::NAME) \
				executeImpl(*result.NAME, result.aggregates_pool, rows, key_columns, &aggregate_functions_instructions[0], \
					result.key_sizes, key, no_more_keys, overflow_row_ptr);

			if (false) {}
			APPLY_FOR_AGGREGATED_VARIANTS(M)
		#undef M
		}
	}

	size_t result_size = result.sizeWithoutOverflowRow();
	Int64 current_memory_usage = 0;
	if (current_memory_tracker)
		current_memory_usage = current_memory_tracker->get();

	auto result_size_bytes = current_memory_usage - memory_usage_before_aggregation;	/// All the results in total, from different threads, are accounted here.

	/// A threshold equal to zero disables the corresponding condition.
	bool worth_convert_to_two_level
		= (params.group_by_two_level_threshold && result_size >= params.group_by_two_level_threshold)
		|| (params.group_by_two_level_threshold_bytes && result_size_bytes >= static_cast<Int64>(params.group_by_two_level_threshold_bytes));

	/** Conversion to the two-level data structure.
	  * It allows an efficient merge afterwards - either memory-saving or parallelized.
	  */
	if (result.isConvertibleToTwoLevel() && worth_convert_to_two_level)
		result.convertToTwoLevel();

	/// Check the limits.
	if (!checkLimits(result_size, no_more_keys))
		return false;

	/** Flush the data to disk if too much RAM is consumed.
	  * The data can be flushed to disk only if the two-level aggregation structure is used.
	  */
	if (params.max_bytes_before_external_group_by
		&& result.isTwoLevel()
		&& current_memory_usage > static_cast<Int64>(params.max_bytes_before_external_group_by)
		&& worth_convert_to_two_level)
	{
		writeToTemporaryFile(result, result_size);
	}

	return true;
}


/** Writes the (two-level) aggregation data to a new temporary file under params.tmp_path,
  *  re-initializes data_variants with a fresh arena, registers the file in temporary_files
  *  and reports statistics.
  * `rows` is used only for the statistics in the log message.
  * Throws UNKNOWN_AGGREGATED_DATA_VARIANT if the data is not one of the two-level variants.
  */
void Aggregator::writeToTemporaryFile(AggregatedDataVariants & data_variants, size_t rows)
{
	Stopwatch watch;

	/// Output chain: native block format -> compression -> file.
	auto file = std::make_unique<Poco::TemporaryFile>(params.tmp_path);
	const std::string & path = file->path();
	WriteBufferFromFile file_buf(path);
	CompressedWriteBuffer compressed_buf(file_buf);
	NativeBlockOutputStream block_out(compressed_buf, ClickHouseRevision::get());

	LOG_DEBUG(log, "Writing part of aggregation data into temporary file " << path << ".");
	ProfileEvents::increment(ProfileEvents::ExternalAggregationWritePart);

	/// Only two-level data is flushed.

#define M(NAME) \
	else if (data_variants.type == AggregatedDataVariants::Type::NAME) \
		writeToTemporaryFileImpl(data_variants, *data_variants.NAME, block_out, path);

	if (false) {}
	APPLY_FOR_VARIANTS_TWO_LEVEL(M)
#undef M
	else
		throw Exception("Unknown aggregated data variant.", ErrorCodes::UNKNOWN_AGGREGATED_DATA_VARIANT);

	/// NOTE Instead of freeing the memory and creating new hash tables and an arena, the old ones could be reused.
	data_variants.init(data_variants.type);
	data_variants.aggregates_pools = Arenas(1, std::make_shared<Arena>());
	data_variants.aggregates_pool = data_variants.aggregates_pools.back().get();

	/// Push the data through every layer of the output chain, from the outermost to the file.
	block_out.flush();
	compressed_buf.next();
	file_buf.next();

	double elapsed_seconds = watch.elapsedSeconds();
	double compressed_bytes = file_buf.count();
	double uncompressed_bytes = compressed_buf.count();

	{
		/// The list of temporary files is protected by its own mutex.
		std::lock_guard<std::mutex> lock(temporary_files.mutex);
		temporary_files.files.emplace_back(std::move(file));
		temporary_files.sum_size_uncompressed += uncompressed_bytes;
		temporary_files.sum_size_compressed += compressed_bytes;
	}

	ProfileEvents::increment(ProfileEvents::ExternalAggregationCompressedBytes, compressed_bytes);
	ProfileEvents::increment(ProfileEvents::ExternalAggregationUncompressedBytes, uncompressed_bytes);

	/// NOTE(review): the ratios below are computed in floating point, so a zero `rows` or zero elapsed time
	///  would give inf/nan in the message rather than a crash - confirm that this is acceptable.
	LOG_TRACE(log, std::fixed << std::setprecision(3)
		<< "Written part in " << elapsed_seconds << " sec., "
		<< rows << " rows, "
		<< (uncompressed_bytes / 1048576.0) << " MiB uncompressed, "
		<< (compressed_bytes / 1048576.0) << " MiB compressed, "
		<< (uncompressed_bytes / rows) << " uncompressed bytes per row, "
		<< (compressed_bytes / rows) << " compressed bytes per row, "
		<< "compression rate: " << (uncompressed_bytes / compressed_bytes)
		<< " (" << (rows / elapsed_seconds) << " rows/sec., "
		<< (uncompressed_bytes / elapsed_seconds / 1048576.0) << " MiB/sec. uncompressed, "
		<< (compressed_bytes / elapsed_seconds / 1048576.0) << " MiB/sec. compressed)");
}


/** Converts one bucket of a two-level hash table into a block.
  * The number of the bucket is stored in the info of the resulting block.
  */
template <typename Method>
Block Aggregator::convertOneBucketToBlock(
	AggregatedDataVariants & data_variants,
	Method & method,
	bool final,
	size_t bucket) const
{
	/// Fills the prepared columns from the selected bucket only.
	auto fill_from_bucket = [bucket, &method, this] (
		ColumnPlainPtrs & keys_out,
		AggregateColumnsData & states_out,
		ColumnPlainPtrs & final_values_out,
		const Sizes & sizes_of_keys,
		bool is_final)
	{
		convertToBlockImpl(method, method.data.impls[bucket],
			keys_out, states_out, final_values_out, sizes_of_keys, is_final);
	};

	Block result = prepareBlockAndFill(
		data_variants, final, method.data.impls[bucket].size(), std::move(fill_from_bucket));

	result.info.bucket_num = bucket;
	return result;
}


/** Writes every bucket of the two-level `method` to `out` as a separate block (not finalized)
  *  and logs the size of the largest block written.
  * Afterwards data_variants no longer refers to the aggregator.
  */
template <typename Method>
void Aggregator::writeToTemporaryFileImpl(
	AggregatedDataVariants & data_variants,
	Method & method,
	IBlockOutputStream & out,
	const String & path)
{
	size_t largest_block_rows = 0;
	size_t largest_block_bytes = 0;

	for (size_t bucket = 0; bucket < Method::Data::NUM_BUCKETS; ++bucket)
	{
		Block block = convertOneBucketToBlock(data_variants, method, false, bucket);
		out.write(block);

		/// Track the maxima for the statistics below.
		const size_t rows_in_block = block.rowsInFirstColumn();
		const size_t bytes_in_block = block.bytes();

		if (largest_block_rows < rows_in_block)
			largest_block_rows = rows_in_block;
		if (largest_block_bytes < bytes_in_block)
			largest_block_bytes = bytes_in_block;
	}

	/// data_variants will not destroy the states of the aggregate functions in its destructor. The states are now owned by ColumnAggregateFunction.
	data_variants.aggregator = nullptr;

	LOG_TRACE(log, std::fixed << std::setprecision(3)
		<< "Max size of temporary block: " << largest_block_rows << " rows, "
		<< (largest_block_bytes / 1048576.0) << " MiB.");
}


/** Checks the max_rows_to_group_by limit against result_size.
  * Depending on group_by_overflow_mode, exceeding the limit throws TOO_MUCH_ROWS (THROW),
  *  makes the function return false (BREAK), or sets no_more_keys (ANY).
  * Returns true in all other cases. The check is skipped once no_more_keys is set or if the limit is zero.
  */
bool Aggregator::checkLimits(size_t result_size, bool & no_more_keys) const
{
	const bool limit_exceeded = !no_more_keys
		&& params.max_rows_to_group_by
		&& result_size > params.max_rows_to_group_by;

	if (!limit_exceeded)
		return true;

	const auto & mode = params.group_by_overflow_mode;

	if (mode == OverflowMode::THROW)
	{
		throw Exception("Limit for rows to GROUP BY exceeded: has " + toString(result_size)
			+ " rows, maximum: " + toString(params.max_rows_to_group_by),
			ErrorCodes::TOO_MUCH_ROWS);
	}

	if (mode == OverflowMode::BREAK)
		return false;

	if (mode != OverflowMode::ANY)
		throw Exception("Logical error: unknown overflow mode", ErrorCodes::LOGICAL_ERROR);

	/// ANY: keep aggregating, but only into the keys that already exist.
	no_more_keys = true;
	return true;
}


/** Reads all blocks from `stream` and aggregates them into `result`.
  * Stops early if the query is cancelled (returning without the final log message)
  *  or if executeOnBlock asks to stop.
  */
void Aggregator::execute(BlockInputStreamPtr stream, AggregatedDataVariants & result)
{
	if (isCancelled())
		return;

	/// Scratch buffers passed to executeOnBlock for every block.
	StringRefs key(params.keys_size);
	ConstColumnPlainPtrs key_columns(params.keys_size);
	AggregateColumns aggregate_columns(params.aggregates_size);
	Sizes key_sizes;

	/** Used if there is a limit on the maximum number of rows during aggregation,
	  *  and if group_by_overflow_mode == ANY.
	  * In this case new keys are not added to the set; only the keys
	  *  that have already got into the set are aggregated.
	  */
	bool no_more_keys = false;

	LOG_TRACE(log, "Aggregating");

	Stopwatch watch;

	size_t rows_read = 0;
	size_t bytes_read = 0;

	/// Read all the data.
	while (Block block = stream->read())
	{
		if (isCancelled())
			return;

		rows_read += block.rows();
		bytes_read += block.bytes();

		const bool keep_reading = executeOnBlock(block, result,
			key_columns, aggregate_columns, key_sizes, key,
			no_more_keys);

		if (!keep_reading)
			break;
	}

	const double elapsed_seconds = watch.elapsedSeconds();
	const size_t rows_aggregated = result.size();
	LOG_TRACE(log, std::fixed << std::setprecision(3)
		<< "Aggregated. " << rows_read << " to " << rows_aggregated << " rows (from " << bytes_read / 1048576.0 << " MiB)"
		<< " in " << elapsed_seconds << " sec."
		<< " (" << rows_read / elapsed_seconds << " rows/sec., " << bytes_read / elapsed_seconds / 1048576.0 << " MiB/sec.)");
}


/** Writes the contents of hash table `data` into the output columns and then clears the table.
  * Dispatches to the "final" variant (results of aggregate functions) or to the
  * "not final" variant (pointers to aggregate states) depending on `final`.
  * Does nothing for an empty table.
  */
template <typename Method, typename Table>
void Aggregator::convertToBlockImpl(
	Method & method,
	Table & data,
	ColumnPlainPtrs & key_columns,
	AggregateColumnsData & aggregate_columns,
	ColumnPlainPtrs & final_aggregate_columns,
	const Sizes & key_sizes,
	bool final) const
{
	if (!data.empty())
	{
		if (!final)
			convertToBlockImplNotFinal(method, data, key_columns, aggregate_columns, key_sizes);
		else
			convertToBlockImplFinal(method, data, key_columns, final_aggregate_columns, key_sizes);

		/// Release the table's memory as early as possible.
		data.clearAndShrink();
	}
}


/** For every entry of `data`: appends the key to `key_columns` and the finalized result of each
  * aggregate function to the corresponding column of `final_aggregate_columns`.
  * Afterwards the states held by the table are destroyed via destroyImpl().
  */
template <typename Method, typename Table>
void NO_INLINE Aggregator::convertToBlockImplFinal(
	Method & method,
	Table & data,
	ColumnPlainPtrs & key_columns,
	ColumnPlainPtrs & final_aggregate_columns,
	const Sizes & key_sizes) const
{
	for (const auto & entry : data)
	{
		method.insertKeyIntoColumns(entry, key_columns, params.keys_size, key_sizes);

		auto states = Method::getAggregateData(entry.second);

		for (size_t func_idx = 0; func_idx < params.aggregates_size; ++func_idx)
		{
			aggregate_functions[func_idx]->insertResultInto(
				states + offsets_of_aggregate_states[func_idx],
				*final_aggregate_columns[func_idx]);
		}
	}

	destroyImpl(method, data);		/// NOTE This could be done better.
}

/** For every entry of `data`: appends the key to `key_columns` and a pointer to each aggregate
  * state to the corresponding element of `aggregate_columns`. The state pointer stored in the
  * table is then reset to nullptr.
  */
template <typename Method, typename Table>
void NO_INLINE Aggregator::convertToBlockImplNotFinal(
	Method & method,
	Table & data,
	ColumnPlainPtrs & key_columns,
	AggregateColumnsData & aggregate_columns,
	const Sizes & key_sizes) const
{
	for (auto & entry : data)
	{
		method.insertKeyIntoColumns(entry, key_columns, params.keys_size, key_sizes);

		auto & states = Method::getAggregateData(entry.second);

		/// Space has been reserved, so push_back does not throw.
		for (size_t func_idx = 0; func_idx < params.aggregates_size; ++func_idx)
			aggregate_columns[func_idx]->push_back(states + offsets_of_aggregate_states[func_idx]);

		states = nullptr;
	}
}


/** Creates an empty block from the sample, prepares its key and aggregate columns
  * (reserving `rows` elements), calls `filler` to populate them, and returns the block.
  *
  * When `final` is false the aggregate columns are ColumnAggregateFunction and receive pointers to states;
  * when `final` is true each aggregate column is recreated with the function's return type.
  * `filler` is invoked as filler(key_columns, aggregate_columns, final_aggregate_columns, key_sizes, final).
  */
template <typename Filler>
Block Aggregator::prepareBlockAndFill(
	AggregatedDataVariants & data_variants,
	bool final,
	size_t rows,
	Filler && filler) const
{
	Block res = sample.cloneEmpty();

	ColumnPlainPtrs key_columns(params.keys_size);
	AggregateColumnsData aggregate_columns(params.aggregates_size);
	ColumnPlainPtrs final_aggregate_columns(params.aggregates_size);

	for (size_t key_idx = 0; key_idx < params.keys_size; ++key_idx)
	{
		key_columns[key_idx] = res.getByPosition(key_idx).column.get();
		key_columns[key_idx]->reserve(rows);
	}

	for (size_t func_idx = 0; func_idx < params.aggregates_size; ++func_idx)
	{
		const size_t position = func_idx + params.keys_size;

		if (final)
		{
			ColumnWithTypeAndName & column = res.getByPosition(position);
			column.type = aggregate_functions[func_idx]->getReturnType();
			column.column = column.type->createColumn();
			column.column->reserve(rows);

			if (aggregate_functions[func_idx]->isState())
			{
				/// The ColumnAggregateFunction column takes shared ownership of the arenas holding the aggregate states.
				ColumnAggregateFunction & column_aggregate_func = static_cast<ColumnAggregateFunction &>(*column.column);

				for (const auto & arena : data_variants.aggregates_pools)
					column_aggregate_func.addArena(arena);
			}

			final_aggregate_columns[func_idx] = column.column.get();
		}
		else
		{
			/// The ColumnAggregateFunction column takes shared ownership of the arenas holding the aggregate states.
			ColumnAggregateFunction & column_aggregate_func = static_cast<ColumnAggregateFunction &>(
				*res.getByPosition(position).column);

			for (const auto & arena : data_variants.aggregates_pools)
				column_aggregate_func.addArena(arena);

			aggregate_columns[func_idx] = &column_aggregate_func.getData();
			aggregate_columns[func_idx]->reserve(rows);
		}
	}

	filler(key_columns, aggregate_columns, final_aggregate_columns, data_variants.key_sizes, final);

	/// Adjust the size of constant columns in the block.
	const size_t columns = res.columns();
	for (size_t pos = 0; pos < columns; ++pos)
	{
		auto & column_ptr = res.getByPosition(pos).column;
		if (column_ptr->isConst())
			column_ptr = column_ptr->cut(0, rows);
	}

	return res;
}


/** Builds a single one-row block from the `without_key` state of `data_variants`.
  * If `is_overflows` is set, the block is marked with info.is_overflows.
  * With `final` the aggregate results are written and the state is destroyed afterwards;
  * otherwise pointers to the states are written and `without_key` is reset to nullptr.
  */
BlocksList Aggregator::prepareBlocksAndFillWithoutKey(AggregatedDataVariants & data_variants, bool final, bool is_overflows) const
{
	const size_t rows = 1;

	auto fill_single_row = [&data_variants, this](
		ColumnPlainPtrs & key_columns,
		AggregateColumnsData & aggregate_columns,
		ColumnPlainPtrs & final_aggregate_columns,
		const Sizes & key_sizes,
		bool final)
	{
		const bool has_row = data_variants.type == AggregatedDataVariants::Type::without_key || params.overflow_row;
		if (!has_row)
			return;

		AggregatedDataWithoutKey & data = data_variants.without_key;

		if (final)
		{
			for (size_t func_idx = 0; func_idx < params.aggregates_size; ++func_idx)
				aggregate_functions[func_idx]->insertResultInto(
					data + offsets_of_aggregate_states[func_idx], *final_aggregate_columns[func_idx]);
		}
		else
		{
			for (size_t func_idx = 0; func_idx < params.aggregates_size; ++func_idx)
				aggregate_columns[func_idx]->push_back(data + offsets_of_aggregate_states[func_idx]);

			data = nullptr;
		}

		/// The overflow row has no real key: fill the key columns with default values.
		if (params.overflow_row)
			for (size_t key_idx = 0; key_idx < params.keys_size; ++key_idx)
				key_columns[key_idx]->insertDefault();
	};

	Block block = prepareBlockAndFill(data_variants, final, rows, fill_single_row);

	if (is_overflows)
		block.info.is_overflows = true;

	if (final)
		destroyWithoutKey(data_variants);

	BlocksList blocks;
	blocks.emplace_back(std::move(block));
	return blocks;
}

/** Converts a single-level hash table of `data_variants` into one block.
  * Throws UNKNOWN_AGGREGATED_DATA_VARIANT if the variant type is not one of the single-level variants.
  */
BlocksList Aggregator::prepareBlocksAndFillSingleLevel(AggregatedDataVariants & data_variants, bool final) const
{
	const size_t rows = data_variants.sizeWithoutOverflowRow();

	auto fill_from_table = [&data_variants, this](
		ColumnPlainPtrs & key_columns,
		AggregateColumnsData & aggregate_columns,
		ColumnPlainPtrs & final_aggregate_columns,
		const Sizes & key_sizes,
		bool final)
	{
		switch (data_variants.type)
		{
		#define M(NAME) \
			case AggregatedDataVariants::Type::NAME: \
				convertToBlockImpl(*data_variants.NAME, data_variants.NAME->data, \
					key_columns, aggregate_columns, final_aggregate_columns, data_variants.key_sizes, final); \
				break;

			APPLY_FOR_VARIANTS_SINGLE_LEVEL(M)

		#undef M

			default:
				throw Exception("Unknown aggregated data variant.", ErrorCodes::UNKNOWN_AGGREGATED_DATA_VARIANT);
		}
	};

	BlocksList blocks;
	blocks.emplace_back(prepareBlockAndFill(data_variants, final, rows, fill_from_table));
	return blocks;
}


/** Dispatches on the two-level variant type and converts its buckets into blocks
  * via prepareBlocksAndFillTwoLevelImpl(). `thread_pool` may be nullptr.
  * Throws UNKNOWN_AGGREGATED_DATA_VARIANT for any other variant type.
  */
BlocksList Aggregator::prepareBlocksAndFillTwoLevel(AggregatedDataVariants & data_variants, bool final, ThreadPool * thread_pool) const
{
	switch (data_variants.type)
	{
	#define M(NAME) \
		case AggregatedDataVariants::Type::NAME: \
			return prepareBlocksAndFillTwoLevelImpl(data_variants, *data_variants.NAME, final, thread_pool);

		APPLY_FOR_VARIANTS_TWO_LEVEL(M)

	#undef M

		default:
			throw Exception("Unknown aggregated data variant.", ErrorCodes::UNKNOWN_AGGREGATED_DATA_VARIANT);
	}
}


/** Converts every non-empty bucket of a two-level table into a block, one task per bucket.
  * Tasks run on `thread_pool` if it is given, otherwise inline in the calling thread.
  * Returns the blocks in increasing bucket order; buckets that were empty produce no block.
  */
template <typename Method>
BlocksList Aggregator::prepareBlocksAndFillTwoLevelImpl(
	AggregatedDataVariants & data_variants,
	Method & method,
	bool final,
	ThreadPool * thread_pool) const
{
	auto convert_bucket = [&](size_t bucket, MemoryTracker * memory_tracker)
	{
		current_memory_tracker = memory_tracker;
		return convertOneBucketToBlock(data_variants, method, final, bucket);
	};

	/// packaged_task is used so that exceptions are automatically propagated to the main thread.

	std::vector<std::packaged_task<Block()>> bucket_tasks(Method::Data::NUM_BUCKETS);

	try
	{
		for (size_t bucket = 0; bucket < Method::Data::NUM_BUCKETS; ++bucket)
		{
			if (!method.data.impls[bucket].empty())
			{
				bucket_tasks[bucket] = std::packaged_task<Block()>(std::bind(convert_bucket, bucket, current_memory_tracker));

				if (!thread_pool)
					bucket_tasks[bucket]();
				else
					thread_pool->schedule([bucket, &bucket_tasks] { bucket_tasks[bucket](); });
			}
		}
	}
	catch (...)
	{
		/// Otherwise, on exception, the tasks would be destroyed before the threads finish, which would be bad.
		if (thread_pool)
			thread_pool->wait();

		throw;
	}

	if (thread_pool)
		thread_pool->wait();

	BlocksList blocks;

	/// Tasks for empty buckets were never assigned and are therefore not valid.
	for (auto & bucket_task : bucket_tasks)
		if (bucket_task.valid())
			blocks.emplace_back(bucket_task.get_future().get());

	return blocks;
}


/** Converts aggregated data into a list of blocks and logs conversion statistics.
  * Returns an empty list if the aggregator is cancelled at any of the check points or if `data_variants` is empty.
  * A thread pool is used only for large two-level data when max_threads > 1.
  * When `final` is false, `data_variants` gives up ownership of the aggregate states (see below).
  */
BlocksList Aggregator::convertToBlocks(AggregatedDataVariants & data_variants, bool final, size_t max_threads) const
{
	if (isCancelled())
		return BlocksList();

	LOG_TRACE(log, "Converting aggregated data to blocks");

	Stopwatch watch;

	BlocksList blocks;

	/// Nothing has been aggregated.
	if (data_variants.empty())
		return blocks;

	const bool use_thread_pool = max_threads > 1
		&& data_variants.sizeWithoutOverflowRow() > 100000	/// TODO Make the threshold configurable.
		&& data_variants.isTwoLevel();						/// TODO Use a common thread pool with the merge function.

	std::unique_ptr<ThreadPool> thread_pool;
	if (use_thread_pool)
		thread_pool.reset(new ThreadPool(max_threads));

	if (isCancelled())
		return BlocksList();

	/// In which data structure is the data aggregated?
	if (data_variants.type == AggregatedDataVariants::Type::without_key || params.overflow_row)
	{
		blocks.splice(blocks.end(), prepareBlocksAndFillWithoutKey(
			data_variants, final, data_variants.type != AggregatedDataVariants::Type::without_key));
	}

	if (isCancelled())
		return BlocksList();

	if (data_variants.type != AggregatedDataVariants::Type::without_key)
	{
		if (data_variants.isTwoLevel())
			blocks.splice(blocks.end(), prepareBlocksAndFillTwoLevel(data_variants, final, thread_pool.get()));
		else
			blocks.splice(blocks.end(), prepareBlocksAndFillSingleLevel(data_variants, final));
	}

	if (!final)
	{
		/// data_variants will not destroy the aggregate function states in its destructor.
		/// The states are now owned by the ColumnAggregateFunction columns.
		data_variants.aggregator = nullptr;
	}

	if (isCancelled())
		return BlocksList();

	size_t total_rows = 0;
	size_t total_bytes = 0;

	for (const auto & block : blocks)
	{
		total_rows += block.rowsInFirstColumn();
		total_bytes += block.bytes();
	}

	const double elapsed_seconds = watch.elapsedSeconds();
	LOG_TRACE(log, std::fixed << std::setprecision(3)
		<< "Converted aggregated data to blocks. "
		<< total_rows << " rows, " << total_bytes / 1048576.0 << " MiB"
		<< " in " << elapsed_seconds << " sec."
		<< " (" << total_rows / elapsed_seconds << " rows/sec., " << total_bytes / elapsed_seconds / 1048576.0 << " MiB/sec.)");

	return blocks;
}


/** Merges all entries of `table_src` into `table_dst` and then clears `table_src`.
  * A key that is new for the destination takes over the source's mapped value;
  * for an existing key the source states are merged into the destination states and then destroyed.
  */
template <typename Method, typename Table>
void NO_INLINE Aggregator::mergeDataImpl(
	Table & table_dst,
	Table & table_src) const
{
	for (auto src_it = table_src.begin(); src_it != table_src.end(); ++src_it)
	{
		decltype(src_it) dst_it;
		bool inserted;
		table_dst.emplace(src_it->first, dst_it, inserted, src_it.getHash());

		if (inserted)
		{
			/// New key: hand the source's mapped value over to the destination.
			dst_it->second = src_it->second;
		}
		else
		{
			for (size_t func_idx = 0; func_idx < params.aggregates_size; ++func_idx)
				aggregate_functions[func_idx]->merge(
					Method::getAggregateData(dst_it->second) + offsets_of_aggregate_states[func_idx],
					Method::getAggregateData(src_it->second) + offsets_of_aggregate_states[func_idx]);

			for (size_t func_idx = 0; func_idx < params.aggregates_size; ++func_idx)
				aggregate_functions[func_idx]->destroy(
					Method::getAggregateData(src_it->second) + offsets_of_aggregate_states[func_idx]);
		}

		/// In both cases the source no longer refers to the states.
		Method::getAggregateData(src_it->second) = nullptr;
	}

	table_src.clearAndShrink();
}


/** Merges `table_src` into `table_dst` without adding new keys to the destination.
  * States of keys that are absent from `table_dst` are merged into the `overflows` state instead.
  * Every source state is destroyed after merging, and `table_src` is cleared at the end.
  */
template <typename Method, typename Table>
void NO_INLINE Aggregator::mergeDataNoMoreKeysImpl(
	Table & table_dst,
	AggregatedDataWithoutKey & overflows,
	Table & table_src) const
{
	for (auto src_it = table_src.begin(); src_it != table_src.end(); ++src_it)
	{
		decltype(src_it) dst_it = table_dst.find(src_it->first, src_it.getHash());

		AggregateDataPtr target_states;
		if (table_dst.end() == dst_it)
			target_states = overflows;
		else
			target_states = Method::getAggregateData(dst_it->second);

		for (size_t func_idx = 0; func_idx < params.aggregates_size; ++func_idx)
			aggregate_functions[func_idx]->merge(
				target_states + offsets_of_aggregate_states[func_idx],
				Method::getAggregateData(src_it->second) + offsets_of_aggregate_states[func_idx]);

		for (size_t func_idx = 0; func_idx < params.aggregates_size; ++func_idx)
			aggregate_functions[func_idx]->destroy(
				Method::getAggregateData(src_it->second) + offsets_of_aggregate_states[func_idx]);

		Method::getAggregateData(src_it->second) = nullptr;
	}

	table_src.clearAndShrink();
}

/** Merges `table_src` into `table_dst` only for the keys that already exist in `table_dst`;
  * source entries whose key is absent from the destination are discarded.
  *
  * Every source state is destroyed here, whether it was merged or discarded:
  * `table_src` is cleared at the end of this function, and the caller in this file
  * (mergeSingleLevelDataImpl) detaches the source's aggregator afterwards, so a state skipped
  * here would never be destroyed by anyone else.
  */
template <typename Method, typename Table>
void NO_INLINE Aggregator::mergeDataOnlyExistingKeysImpl(
	Table & table_dst,
	Table & table_src) const
{
	for (auto it = table_src.begin(); it != table_src.end(); ++it)
	{
		AggregateDataPtr & src_data = Method::getAggregateData(it->second);

		decltype(it) res_it = table_dst.find(it->first, it.getHash());

		if (table_dst.end() != res_it)
		{
			AggregateDataPtr res_data = Method::getAggregateData(res_it->second);

			for (size_t i = 0; i < params.aggregates_size; ++i)
				aggregate_functions[i]->merge(
					res_data + offsets_of_aggregate_states[i],
					src_data + offsets_of_aggregate_states[i]);
		}
		else if (nullptr == src_data)
		{
			/// Nothing to discard for this entry.
			continue;
		}

		/// The source state is no longer needed: it has either been merged or is being dropped.
		for (size_t i = 0; i < params.aggregates_size; ++i)
			aggregate_functions[i]->destroy(src_data + offsets_of_aggregate_states[i]);

		src_data = nullptr;
	}

	table_src.clearAndShrink();
}


/** Merges the `without_key` states of all elements of `non_empty_data` into the first element.
  * After merging, each source state is destroyed and its pointer is reset to nullptr.
  */
void NO_INLINE Aggregator::mergeWithoutKeyDataImpl(
	ManyAggregatedDataVariants & non_empty_data) const
{
	AggregatedDataVariantsPtr & res = non_empty_data[0];

	/// All aggregation results are merged into the first one.
	const size_t num_variants = non_empty_data.size();
	for (size_t variant_idx = 1; variant_idx < num_variants; ++variant_idx)
	{
		AggregatedDataWithoutKey & dst_states = res->without_key;
		AggregatedDataWithoutKey & src_states = non_empty_data[variant_idx]->without_key;

		for (size_t func_idx = 0; func_idx < params.aggregates_size; ++func_idx)
			aggregate_functions[func_idx]->merge(
				dst_states + offsets_of_aggregate_states[func_idx],
				src_states + offsets_of_aggregate_states[func_idx]);

		for (size_t func_idx = 0; func_idx < params.aggregates_size; ++func_idx)
			aggregate_functions[func_idx]->destroy(src_states + offsets_of_aggregate_states[func_idx]);

		src_states = nullptr;
	}
}


/** Merges the single-level tables of all elements of `non_empty_data` into the first element.
  * Before each merge checkLimits() is consulted: it may stop the merging (returns false)
  * or switch it into the "no more keys" mode, in which new keys are no longer added to the result.
  */
template <typename Method>
void NO_INLINE Aggregator::mergeSingleLevelDataImpl(
	ManyAggregatedDataVariants & non_empty_data) const
{
	AggregatedDataVariantsPtr & res = non_empty_data[0];
	bool no_more_keys = false;

	/// All aggregation results are merged into the first one.
	const size_t num_variants = non_empty_data.size();
	for (size_t variant_idx = 1; variant_idx < num_variants; ++variant_idx)
	{
		if (!checkLimits(res->sizeWithoutOverflowRow(), no_more_keys))
			break;

		AggregatedDataVariants & current = *non_empty_data[variant_idx];

		auto & dst_table = getDataVariant<Method>(*res).data;
		auto & src_table = getDataVariant<Method>(current).data;

		if (no_more_keys)
		{
			/// If there is an overflow state, unmatched keys go there; otherwise they are dropped.
			if (res->without_key)
				mergeDataNoMoreKeysImpl<Method>(dst_table, res->without_key, src_table);
			else
				mergeDataOnlyExistingKeysImpl<Method>(dst_table, src_table);
		}
		else
		{
			mergeDataImpl<Method>(dst_table, src_table);
		}

		/// current will not destroy the aggregate function states in its destructor.
		current.aggregator = nullptr;
	}
}


/** Merges bucket number `bucket` of every two-level table in `data` into the same bucket of data[0].
  */
template <typename Method>
void NO_INLINE Aggregator::mergeBucketImpl(
	ManyAggregatedDataVariants & data, Int32 bucket) const
{
	/// All aggregation results are merged into the first one.
	AggregatedDataVariantsPtr & res = data[0];

	const size_t num_variants = data.size();
	for (size_t variant_idx = 1; variant_idx < num_variants; ++variant_idx)
	{
		AggregatedDataVariants & current = *data[variant_idx];

		auto & dst_bucket = getDataVariant<Method>(*res).data.impls[bucket];
		auto & src_bucket = getDataVariant<Method>(current).data.impls[bucket];

		mergeDataImpl<Method>(dst_bucket, src_bucket);
	}
}


/** Merges aggregation states together, converts them into blocks and returns them as a stream.
  * If the aggregation states are two-level, the blocks are returned strictly in order of bucket_num.
  * (This is important for distributed processing.)
  * Different buckets may be processed in parallel, using up to `threads` threads.
  */
class MergingAndConvertingBlockInputStream : public IProfilingBlockInputStream
{
public:
	/** The input is a set of non-empty sets of partially aggregated data,
	  *  which are either all single-level or all two-level.
	  */
	MergingAndConvertingBlockInputStream(const Aggregator & aggregator_, ManyAggregatedDataVariants & data_, bool final_, size_t threads_)
		: aggregator(aggregator_), data(data_), final(final_), threads(threads_) {}

	String getName() const override { return "MergingAndConverting"; }

	/// The identifier is the textual form of this object's address.
	String getID() const override
	{
		std::stringstream res;
		res << this;
		return res.str();
	}

protected:
	/** Returns the next block, or an empty block when there is nothing more to return.
	  * The first call returns the "without key" / overflow block if there is one;
	  * then either the single merged single-level block, or the two-level buckets one by one.
	  */
	Block readImpl() override
	{
		if (data.empty())
			return {};

		if (current_bucket_num >= NUM_BUCKETS)
			return {};

		AggregatedDataVariantsPtr & first = data[0];

		if (current_bucket_num == -1)
		{
			++current_bucket_num;

			if (first->type == AggregatedDataVariants::Type::without_key || aggregator.params.overflow_row)
			{
				aggregator.mergeWithoutKeyDataImpl(data);
				return aggregator.prepareBlocksAndFillWithoutKey(
					*first, final, first->type != AggregatedDataVariants::Type::without_key).front();
			}
		}

		if (!first->isTwoLevel())
		{
			/// Single-level data produces exactly one block.
			if (current_bucket_num > 0)
				return {};

			if (first->type == AggregatedDataVariants::Type::without_key)
				return {};

			++current_bucket_num;

		#define M(NAME) \
			else if (first->type == AggregatedDataVariants::Type::NAME) \
				aggregator.mergeSingleLevelDataImpl<decltype(first->NAME)::element_type>(data);
			if (false) {}
			APPLY_FOR_VARIANTS_SINGLE_LEVEL(M)
		#undef M
			else
				throw Exception("Unknown aggregated data variant.", ErrorCodes::UNKNOWN_AGGREGATED_DATA_VARIANT);

			return aggregator.prepareBlocksAndFillSingleLevel(*first, final).front();
		}
		else
		{
			/// On the first call start up to `threads` bucket tasks.
			if (!parallel_merge_data)
			{
				parallel_merge_data.reset(new ParallelMergeData(threads));
				for (size_t i = 0; i < threads; ++i)
					scheduleThreadForNextBucket();
			}

			Block res;

			while (true)
			{
				std::unique_lock<std::mutex> lock(parallel_merge_data->mutex);

				if (parallel_merge_data->exception)
					std::rethrow_exception(parallel_merge_data->exception);

				auto it = parallel_merge_data->ready_blocks.find(current_bucket_num);
				if (it != parallel_merge_data->ready_blocks.end())
				{
					++current_bucket_num;
					scheduleThreadForNextBucket();

					if (it->second)
					{
						res.swap(it->second);
						break;
					}
					else if (current_bucket_num >= NUM_BUCKETS)
						break;

					/** The consumed bucket produced no block. The next bucket may already be ready,
					  * and its worker may already have sent its notification, so look it up again
					  * right away instead of waiting for a notification that might never come.
					  */
					continue;
				}

				parallel_merge_data->condvar.wait(lock);
			}

			return res;
		}
	}

private:
	const Aggregator & aggregator;
	ManyAggregatedDataVariants data;
	bool final;
	size_t threads;

	/// Number of the next bucket to return; -1 until the first call of readImpl.
	Int32 current_bucket_num = -1;
	/// Number of the last bucket for which a task has been requested.
	Int32 max_scheduled_bucket_num = -1;
	static constexpr Int32 NUM_BUCKETS = 256;

	/// State shared between the reading thread and the bucket tasks; `mutex` guards `ready_blocks` and `exception`.
	struct ParallelMergeData
	{
		ThreadPool pool;
		std::map<Int32, Block> ready_blocks;
		std::exception_ptr exception;
		std::mutex mutex;
		std::condition_variable condvar;

		ParallelMergeData(size_t threads) : pool(threads) {}

		~ParallelMergeData()
		{
			LOG_TRACE(&Logger::get(__PRETTY_FUNCTION__), "Waiting for threads to finish");
			pool.wait();
		}
	};

	std::unique_ptr<ParallelMergeData> parallel_merge_data;

	/// Schedules a task for the next not yet scheduled bucket, if there is one left.
	void scheduleThreadForNextBucket()
	{
		++max_scheduled_bucket_num;
		if (max_scheduled_bucket_num >= NUM_BUCKETS)
			return;

		parallel_merge_data->pool.schedule(std::bind(&MergingAndConvertingBlockInputStream::thread, this,
			max_scheduled_bucket_num, current_memory_tracker));
	}

	/** Task body: merges bucket `bucket_num` of all data sets into the first one, converts it to a block
	  * and publishes the block in `ready_blocks`. The first exception caught is stored for the reading thread.
	  * In both cases the reading thread is notified.
	  */
	void thread(Int32 bucket_num, MemoryTracker * memory_tracker)
	{
		current_memory_tracker = memory_tracker;
		setThreadName("MergingAggregtd");
		CurrentMetrics::Increment metric_increment{CurrentMetrics::QueryThread};

		try
		{
			/// TODO Possibly support no_more_keys

			auto & merged_data = *data[0];
			auto method = merged_data.type;
			Block block;

			if (false) {}
		#define M(NAME) \
			else if (method == AggregatedDataVariants::Type::NAME) \
			{ \
				aggregator.mergeBucketImpl<decltype(merged_data.NAME)::element_type>(data, bucket_num); \
				block = aggregator.convertOneBucketToBlock(merged_data, *merged_data.NAME, final, bucket_num); \
			}

			APPLY_FOR_VARIANTS_TWO_LEVEL(M)
		#undef M

			std::lock_guard<std::mutex> lock(parallel_merge_data->mutex);
			parallel_merge_data->ready_blocks[bucket_num] = std::move(block);
		}
		catch (...)
		{
			std::lock_guard<std::mutex> lock(parallel_merge_data->mutex);
			if (!parallel_merge_data->exception)
				parallel_merge_data->exception = std::current_exception();
		}

		parallel_merge_data->condvar.notify_all();
	}
};


/** Prepares several sets of aggregated data for merging and returns a stream that
  * merges them and yields the result as blocks.
  * Throws EMPTY_DATA_PASSED if `data_variants` is empty, and
  * CANNOT_MERGE_DIFFERENT_AGGREGATED_DATA_VARIANTS if the non-empty sets end up with different variant types.
  * Returns a NullBlockInputStream if all the sets are empty.
  */
std::unique_ptr<IBlockInputStream> Aggregator::mergeAndConvertToBlocks(
	ManyAggregatedDataVariants & data_variants, bool final, size_t max_threads) const
{
	if (data_variants.empty())
		throw Exception("Empty data passed to Aggregator::mergeAndConvertToBlocks.", ErrorCodes::EMPTY_DATA_PASSED);

	LOG_TRACE(log, "Merging aggregated data");

	ManyAggregatedDataVariants non_empty_data;
	non_empty_data.reserve(data_variants.size());
	for (auto & candidate : data_variants)
	{
		if (!candidate->empty())
			non_empty_data.push_back(candidate);
	}

	if (non_empty_data.empty())
		return std::make_unique<NullBlockInputStream>();

	if (non_empty_data.size() > 1)
	{
		/// Sort the states by descending size so that the merge is more efficient (since all states are merged into the first one).
		auto larger_first = [](const AggregatedDataVariantsPtr & lhs, const AggregatedDataVariantsPtr & rhs)
		{
			return lhs->sizeWithoutOverflowRow() > rhs->sizeWithoutOverflowRow();
		};

		std::sort(non_empty_data.begin(), non_empty_data.end(), larger_first);
	}

	/// If at least one of the variants is two-level, convert all the others to two-level as well.
	/// Note - it might be more optimal not to convert the single-level variants before the merge, but to merge them separately, at the end.

	const bool has_at_least_one_two_level = std::any_of(non_empty_data.begin(), non_empty_data.end(),
		[](const AggregatedDataVariantsPtr & variant) { return variant->isTwoLevel(); });

	if (has_at_least_one_two_level)
	{
		for (auto & variant : non_empty_data)
		{
			if (!variant->isTwoLevel())
				variant->convertToTwoLevel();
		}
	}

	AggregatedDataVariantsPtr & first = non_empty_data[0];

	const size_t num_variants = non_empty_data.size();
	for (size_t variant_idx = 1; variant_idx < num_variants; ++variant_idx)
	{
		const AggregatedDataVariantsPtr & other = non_empty_data[variant_idx];

		if (first->type != other->type)
			throw Exception("Cannot merge different aggregated data variants.", ErrorCodes::CANNOT_MERGE_DIFFERENT_AGGREGATED_DATA_VARIANTS);

		/** Elements from the other data sets may be moved into the first one.
		  * Therefore it must own all the arenas of all the other sets.
		  */
		first->aggregates_pools.insert(first->aggregates_pools.end(),
			other->aggregates_pools.begin(), other->aggregates_pools.end());
	}

	return std::make_unique<MergingAndConvertingBlockInputStream>(*this, non_empty_data, final, max_threads);
}


/** Merges one block of partially aggregated data into hash table `data`.
  *
  * The first params.keys_size columns of `block` are used as keys; the following
  * params.aggregates_size columns are ColumnAggregateFunction columns with the states to merge.
  *
  * If the template parameter no_more_keys is true, new keys are not inserted: states of unknown keys
  * are merged into `overflow_row`, or skipped if `overflow_row` is null.
  * The block is cleared at the end.
  */
template <bool no_more_keys, typename Method, typename Table>
void NO_INLINE Aggregator::mergeStreamsImplCase(
	Block & block,
	const Sizes & key_sizes,
	Arena * aggregates_pool,
	Method & method,
	Table & data,
	AggregateDataPtr overflow_row) const
{
	ConstColumnPlainPtrs key_columns(params.keys_size);
	AggregateColumnsData aggregate_columns(params.aggregates_size);

	/// Remember the columns we are going to work with.
	for (size_t i = 0; i < params.keys_size; ++i)
		key_columns[i] = block.getByPosition(i).column.get();

	for (size_t i = 0; i < params.aggregates_size; ++i)
		aggregate_columns[i] = &typeid_cast<ColumnAggregateFunction &>(*block.getByPosition(params.keys_size + i).column).getData();

	typename Method::State state;
	state.init(key_columns);

	/// For all rows.
	StringRefs keys(params.keys_size);
	size_t rows = block.rowsInFirstColumn();
	for (size_t i = 0; i < rows; ++i)
	{
		typename Table::iterator it;

		bool inserted;			/// Was a new key inserted, or did the key already exist?
		bool overflow = false;	/// The new key did not fit into the hash table because of no_more_keys.

		/// Get the key to insert into the hash table.
		auto key = state.getKey(key_columns, params.keys_size, i, key_sizes, keys, *aggregates_pool);

		if (!no_more_keys)
		{
			data.emplace(key, it, inserted);
		}
		else
		{
			inserted = false;
			it = data.find(key);
			if (data.end() == it)
				overflow = true;
		}

		/// If the key did not fit and the data does not have to be aggregated into a separate row, there is nothing to do.
		if (no_more_keys && overflow && !overflow_row)
		{
			method.onExistingKey(key, keys, *aggregates_pool);
			continue;
		}

		/// If a new key was inserted, initialize the aggregate function states and possibly something related to the key.
		if (inserted)
		{
			AggregateDataPtr & aggregate_data = Method::getAggregateData(it->second);
			/// The pointer is null until the states have been created successfully.
			aggregate_data = nullptr;

			method.onNewKey(*it, params.keys_size, i, keys, *aggregates_pool);

			AggregateDataPtr place = aggregates_pool->alloc(total_size_of_aggregate_states);
			createAggregateStates(place);
			aggregate_data = place;
		}
		else
			method.onExistingKey(key, keys, *aggregates_pool);

		/// Merge either into the states of the found/inserted key or into the overflow row.
		AggregateDataPtr value = (!no_more_keys || !overflow) ? Method::getAggregateData(it->second) : overflow_row;

		/// Merge the aggregate function states.
		for (size_t j = 0; j < params.aggregates_size; ++j)
			aggregate_functions[j]->merge(
				value + offsets_of_aggregate_states[j],
				(*aggregate_columns[j])[i]);
	}

	/// Release the memory early.
	block.clear();
}

/** Runtime-to-compile-time dispatch: calls the mergeStreamsImplCase() instantiation
  * that corresponds to the value of `no_more_keys`.
  */
template <typename Method, typename Table>
void NO_INLINE Aggregator::mergeStreamsImpl(
	Block & block,
	const Sizes & key_sizes,
	Arena * aggregates_pool,
	Method & method,
	Table & data,
	AggregateDataPtr overflow_row,
	bool no_more_keys) const
{
	if (no_more_keys)
		mergeStreamsImplCase<true>(block, key_sizes, aggregates_pool, method, data, overflow_row);
	else
		mergeStreamsImplCase<false>(block, key_sizes, aggregates_pool, method, data, overflow_row);
}


/** Merges the states from row 0 of the aggregate columns of `block` into the `without_key`
  * state of `result`, creating that state first if it does not exist yet. The block is cleared at the end.
  */
void NO_INLINE Aggregator::mergeWithoutKeyStreamsImpl(
	Block & block,
	AggregatedDataVariants & result) const
{
	AggregateColumnsData aggregate_columns(params.aggregates_size);

	/// Remember the columns we are going to work with.
	for (size_t func_idx = 0; func_idx < params.aggregates_size; ++func_idx)
	{
		auto & states_column = typeid_cast<ColumnAggregateFunction &>(
			*block.getByPosition(params.keys_size + func_idx).column);

		aggregate_columns[func_idx] = &states_column.getData();
	}

	AggregatedDataWithoutKey & res = result.without_key;
	if (!res)
	{
		/// Assign the pointer only after the states have been created.
		AggregateDataPtr place = result.aggregates_pool->alloc(total_size_of_aggregate_states);
		createAggregateStates(place);
		res = place;
	}

	/// Add the values.
	for (size_t func_idx = 0; func_idx < params.aggregates_size; ++func_idx)
		aggregate_functions[func_idx]->merge(
			res + offsets_of_aggregate_states[func_idx],
			(*aggregate_columns[func_idx])[0]);

	/// Release the memory early.
	block.clear();
}


/** Reads all blocks of partially aggregated data from `stream` and merges them into `result`.
  *
  * Blocks are grouped by info.bucket_num. Blocks with a bucket number (>= 0) are merged per bucket,
  * in parallel on up to `max_threads` threads when there is enough data. Blocks without
  * a bucket number (-1) are merged afterwards in the calling thread, honouring checkLimits().
  * Returns early if the aggregator is cancelled; once `result` has been initialized it is
  * invalidated on cancellation.
  */
void Aggregator::mergeStream(BlockInputStreamPtr stream, AggregatedDataVariants & result, size_t max_threads)
{
	if (isCancelled())
		return;

	ConstColumnPlainPtrs key_columns(params.keys_size);

	initialize({});

	if (isCancelled())
		return;

	/** If the two-level aggregation method was used on the remote servers,
	  *  then the blocks carry information about the bucket number.
	  * In that case the calculations can be parallelized by buckets.
	  * Distribute the blocks by the bucket numbers specified in them.
	  */
	using BucketToBlocks = std::map<Int32, BlocksList>;
	BucketToBlocks bucket_to_blocks;

	/// Read all the data.
	LOG_TRACE(log, "Reading blocks of partially aggregated data.");

	size_t total_input_rows = 0;
	size_t total_input_blocks = 0;
	while (Block block = stream->read())
	{
		if (isCancelled())
			return;

		total_input_rows += block.rowsInFirstColumn();
		++total_input_blocks;
		bucket_to_blocks[block.info.bucket_num].emplace_back(std::move(block));
	}

	LOG_TRACE(log, "Read " << total_input_blocks << " blocks of partially aggregated data, total " << total_input_rows << " rows.");

	if (bucket_to_blocks.empty())
		return;

	setSampleBlock(bucket_to_blocks.begin()->second.front());

	/// Which aggregation method should be used?
	for (size_t i = 0; i < params.keys_size; ++i)
		key_columns[i] = sample.getByPosition(i).column.get();

	Sizes key_sizes;
	AggregatedDataVariants::Type method = chooseAggregationMethod(key_columns, key_sizes);

	/** Minus one denotes the absence of information about the bucket
	  * - in the case of single-level aggregation, and also for blocks with "overflowed" values.
	  * If there is at least one block with a bucket number greater than or equal to zero,
	  *  then two-level aggregation was used. Bucket 0 is a regular bucket: it must not be treated
	  *  as "no bucket", otherwise input that only has blocks for bucket 0 would not be merged at all.
	  */
	auto max_bucket = bucket_to_blocks.rbegin()->first;
	bool has_two_level = max_bucket >= 0;

	if (has_two_level)
	{
	#define M(NAME) \
		if (method == AggregatedDataVariants::Type::NAME) \
			method = AggregatedDataVariants::Type::NAME ## _two_level;

		APPLY_FOR_VARIANTS_CONVERTIBLE_TO_TWO_LEVEL(M)

	#undef M
	}

	if (isCancelled())
		return;

	/// result will destroy the aggregate function states in its destructor.
	result.aggregator = this;

	result.init(method);
	result.keys_size = params.keys_size;
	result.key_sizes = key_sizes;

	bool has_blocks_with_unknown_bucket = bucket_to_blocks.count(-1);

	/// First merge the individual buckets in parallel. Then merge the data that is not distributed by buckets.
	if (has_two_level)
	{
		/** In this case no_more_keys is not supported, because
		  *  it is hard to update the shared state for the "other" keys (overflows) from different threads.
		  * That is, there may end up being significantly more keys than max_rows_to_group_by.
		  */

		LOG_TRACE(log, "Merging partially aggregated two-level data.");

		auto merge_bucket = [&bucket_to_blocks, &result, &key_sizes, this](Int32 bucket, Arena * aggregates_pool, MemoryTracker * memory_tracker)
		{
			current_memory_tracker = memory_tracker;

			/// at() instead of operator[]: this lambda runs concurrently and must not use a mutating accessor of the shared map.
			for (Block & block : bucket_to_blocks.at(bucket))
			{
				if (isCancelled())
					return;

			#define M(NAME) \
				else if (result.type == AggregatedDataVariants::Type::NAME) \
					mergeStreamsImpl(block, key_sizes, aggregates_pool, *result.NAME, result.NAME->data.impls[bucket], nullptr, false);

				if (false) {}
					APPLY_FOR_VARIANTS_TWO_LEVEL(M)
			#undef M
				else
					throw Exception("Unknown aggregated data variant.", ErrorCodes::UNKNOWN_AGGREGATED_DATA_VARIANT);
			}
		};

		std::unique_ptr<ThreadPool> thread_pool;
		if (max_threads > 1 && total_input_rows > 100000)	/// TODO Make the threshold configurable.
			thread_pool.reset(new ThreadPool(max_threads));

		for (const auto & bucket_blocks : bucket_to_blocks)
		{
			const auto bucket = bucket_blocks.first;

			/// Blocks without a bucket number are merged separately below.
			if (bucket == -1)
				continue;

			/// Every bucket task gets its own arena.
			result.aggregates_pools.push_back(std::make_shared<Arena>());
			Arena * aggregates_pool = result.aggregates_pools.back().get();

			auto task = std::bind(merge_bucket, bucket, aggregates_pool, current_memory_tracker);

			if (thread_pool)
				thread_pool->schedule(task);
			else
				task();
		}

		if (thread_pool)
			thread_pool->wait();

		LOG_TRACE(log, "Merged partially aggregated two-level data.");
	}

	if (isCancelled())
	{
		result.invalidate();
		return;
	}

	if (has_blocks_with_unknown_bucket)
	{
		LOG_TRACE(log, "Merging partially aggregated single-level data.");

		bool no_more_keys = false;

		BlocksList & blocks = bucket_to_blocks[-1];
		for (Block & block : blocks)
		{
			if (isCancelled())
			{
				result.invalidate();
				return;
			}

			if (!checkLimits(result.sizeWithoutOverflowRow(), no_more_keys))
				break;

			if (result.type == AggregatedDataVariants::Type::without_key || block.info.is_overflows)
				mergeWithoutKeyStreamsImpl(block, result);

		#define M(NAME, IS_TWO_LEVEL) \
			else if (result.type == AggregatedDataVariants::Type::NAME) \
				mergeStreamsImpl(block, key_sizes, result.aggregates_pool, *result.NAME, result.NAME->data, result.without_key, no_more_keys);

			APPLY_FOR_AGGREGATED_VARIANTS(M)
		#undef M
			else if (result.type != AggregatedDataVariants::Type::without_key)
				throw Exception("Unknown aggregated data variant.", ErrorCodes::UNKNOWN_AGGREGATED_DATA_VARIANT);
		}

		LOG_TRACE(log, "Merged partially aggregated single-level data.");
	}
}


/** Merges several blocks of partially aggregated data into a single block.
  * Returns an empty block if `blocks` is empty or if the merge produced no blocks.
  * The bucket number of the result is taken from the first input block.
  * Throws LOGICAL_ERROR if more than one block remains after the overflow/empty block has been removed.
  */
Block Aggregator::mergeBlocks(BlocksList & blocks, bool final)
{
	if (blocks.empty())
		return {};

	ConstColumnPlainPtrs key_columns(params.keys_size);

	initialize({});
	setSampleBlock(blocks.front());

	/// Which aggregation method should be used?
	for (size_t i = 0; i < params.keys_size; ++i)
		key_columns[i] = sample.getByPosition(i).column.get();

	Sizes key_sizes;
	AggregatedDataVariants::Type method = chooseAggregationMethod(key_columns, key_sizes);

	/// Temporary data for the aggregation.
	AggregatedDataVariants result;

	/// result will destroy the aggregate function states in its destructor.
	result.aggregator = this;

	result.init(method);
	result.keys_size = params.keys_size;
	result.key_sizes = key_sizes;

	auto bucket_num = blocks.front().info.bucket_num;
	LOG_TRACE(log, "Merging partially aggregated blocks (bucket = " << bucket_num << ").");

	for (Block & block : blocks)
	{
		if (result.type == AggregatedDataVariants::Type::without_key || block.info.is_overflows)
			mergeWithoutKeyStreamsImpl(block, result);

	#define M(NAME, IS_TWO_LEVEL) \
		else if (result.type == AggregatedDataVariants::Type::NAME) \
			mergeStreamsImpl(block, key_sizes, result.aggregates_pool, *result.NAME, result.NAME->data, nullptr, false);

		APPLY_FOR_AGGREGATED_VARIANTS(M)
	#undef M
		else if (result.type != AggregatedDataVariants::Type::without_key)
			throw Exception("Unknown aggregated data variant.", ErrorCodes::UNKNOWN_AGGREGATED_DATA_VARIANT);
	}

	BlocksList merged_blocks = convertToBlocks(result, final, 1);

	if (merged_blocks.size() > 1)
	{
		/** There may be two blocks. One with is_overflows, the other without.
		  * If there is a non-empty block without is_overflows, remove the block with is_overflows.
		  * If there is an empty block without is_overflows and a block with is_overflows, remove the empty block.
		  *
		  * We do this because we proceed from the assumption that the function receives
		  *  either only blocks without is_overflows, or only blocks with is_overflows.
		  */

		bool has_nonempty_nonoverflows = false;
		bool has_overflows = false;

		for (const auto & block : merged_blocks)
		{
			if (block && block.rowsInFirstColumn() && !block.info.is_overflows)
				has_nonempty_nonoverflows = true;
			else if (block.info.is_overflows)
				has_overflows = true;
		}

		if (has_nonempty_nonoverflows)
		{
			for (auto it = merged_blocks.begin(); it != merged_blocks.end(); ++it)
			{
				if (it->info.is_overflows)
				{
					/// The iterator is not used after erase: we leave the loop immediately.
					merged_blocks.erase(it);
					break;
				}
			}
		}
		else if (has_overflows)
		{
			for (auto it = merged_blocks.begin(); it != merged_blocks.end(); ++it)
			{
				if (!*it || it->rowsInFirstColumn() == 0)
				{
					/// The iterator is not used after erase: we leave the loop immediately.
					merged_blocks.erase(it);
					break;
				}
			}
		}

		if (merged_blocks.size() > 1)
			throw Exception("Logical error: temporary result is not single-level", ErrorCodes::LOGICAL_ERROR);
	}

	LOG_TRACE(log, "Merged partially aggregated blocks.");

	if (merged_blocks.empty())
		return {};

	auto res = std::move(merged_blocks.front());
	res.info.bucket_num = bucket_num;
	return res;
}


/** Distributes the rows of `source` over the blocks in `destinations`, one block per bucket.
  *
  * For every row the key is extracted from `key_columns`, hashed with the hash table of `method`
  *  and mapped to a bucket number. Then, for each bucket that received at least one row,
  *  every column of `source` is filtered down to the rows of that bucket and inserted
  *  into `destinations[bucket]`, whose `info.bucket_num` is set to the bucket number.
  * Entries of `destinations` for buckets that received no rows are left untouched.
  *
  * `destinations` is indexed by bucket number, so the caller has to size it accordingly.
  */
template <typename Method>
void NO_INLINE Aggregator::convertBlockToTwoLevelImpl(
	Method & method,
	Arena * pool,
	ConstColumnPlainPtrs & key_columns,
	const Sizes & key_sizes,
	StringRefs & keys,
	const Block & source,
	std::vector<Block> & destinations) const
{
	typename Method::State state;
	state.init(key_columns);

	const size_t num_rows = source.rowsInFirstColumn();
	const size_t num_columns = source.columns();
	const size_t num_destinations = destinations.size();

	/// One filter per bucket number; a filter marks the rows that belong to its bucket.
	/// A filter stays empty until the first row of its bucket is seen.
	std::vector<IColumn::Filter> bucket_filters(num_destinations);

	for (size_t row = 0; row < num_rows; ++row)
	{
		/// Build the key of this row and derive the bucket number from its hash.
		typename Method::Key row_key = state.getKey(key_columns, params.keys_size, row, key_sizes, keys, *pool);

		auto key_hash = method.data.hash(row_key);
		auto bucket_of_row = method.data.getBucketFromHash(key_hash);

		/// The key itself is not needed any more.
		method.onExistingKey(row_key, keys, *pool);

		auto & bucket_filter = bucket_filters[bucket_of_row];

		if (unlikely(bucket_filter.empty()))
			bucket_filter.resize_fill(num_rows);

		bucket_filter[row] = 1;
	}

	/// Expected number of rows per bucket, with some slack. The factor 1.1 was chosen arbitrarily.
	ssize_t size_hint = ((num_rows + method.data.NUM_BUCKETS - 1)
		/ method.data.NUM_BUCKETS) * 1.1;

	for (size_t bucket = 0; bucket < num_destinations; ++bucket)
	{
		const auto & bucket_filter = bucket_filters[bucket];

		/// No rows fell into this bucket.
		if (bucket_filter.empty())
			continue;

		Block & bucket_block = destinations[bucket];
		bucket_block.info.bucket_num = bucket;

		for (size_t col = 0; col < num_columns; ++col)
		{
			/** Columns of type ColumnAggregateFunction inserted into the block will own the states of aggregate functions
			  *  by holding a shared_ptr to the source column. See ColumnAggregateFunction.h
			  */
			const ColumnWithTypeAndName & source_column = source.unsafeGetByPosition(col);
			bucket_block.insert({source_column.column->filter(bucket_filter, size_hint), source_column.type, source_column.name});
		}
	}
}


std::vector<Block> Aggregator::convertBlockToTwoLevel(const Block & block)
{
	if (!block)
		return {};

	initialize({});
	setSampleBlock(block);

	AggregatedDataVariants data;

	StringRefs key(params.keys_size);
	ConstColumnPlainPtrs key_columns(params.keys_size);
	Sizes key_sizes;

	/// Запоминаем столбцы, с которыми будем работать
	for (size_t i = 0; i < params.keys_size; ++i)
		key_columns[i] = block.getByPosition(i).column.get();

	AggregatedDataVariants::Type type = chooseAggregationMethod(key_columns, key_sizes);
	data.keys_size = params.keys_size;
	data.key_sizes = key_sizes;

#define M(NAME) \
	else if (type == AggregatedDataVariants::Type::NAME) \
		type = AggregatedDataVariants::Type::NAME ## _two_level;

	if (false) {}
	APPLY_FOR_VARIANTS_CONVERTIBLE_TO_TWO_LEVEL(M)
#undef M
	else
		throw Exception("Unknown aggregated data variant.", ErrorCodes::UNKNOWN_AGGREGATED_DATA_VARIANT);

	data.init(type);

	size_t num_buckets = 0;

#define M(NAME) \
	else if (data.type == AggregatedDataVariants::Type::NAME) \
		num_buckets = data.NAME->data.NUM_BUCKETS;

	if (false) {}
	APPLY_FOR_VARIANTS_TWO_LEVEL(M)
#undef M
	else
		throw Exception("Unknown aggregated data variant.", ErrorCodes::UNKNOWN_AGGREGATED_DATA_VARIANT);

	std::vector<Block> splitted_blocks(num_buckets);

#define M(NAME) \
	else if (data.type == AggregatedDataVariants::Type::NAME) \
		convertBlockToTwoLevelImpl(*data.NAME, data.aggregates_pool, \
			key_columns, data.key_sizes, key, block, splitted_blocks);

	if (false) {}
	APPLY_FOR_VARIANTS_TWO_LEVEL(M)
#undef M
	else
		throw Exception("Unknown aggregated data variant.", ErrorCodes::UNKNOWN_AGGREGATED_DATA_VARIANT);

	return splitted_blocks;
}


/** Destroys the aggregate function states referenced from every cell of `table`
  *  and resets the pointer stored in the cell to nullptr.
  *
  * States of functions for which isState() returns true are skipped.
  * `method` is not used in the body; it only lets `Method` be deduced at the call site.
  */
template <typename Method, typename Table>
void NO_INLINE Aggregator::destroyImpl(
	Method & method,
	Table & table) const
{
	/** Iterate by reference, not by value: with a by-value loop variable the `data = nullptr` below
	  *  would only clear a temporary copy of the cell, leaving a pointer to already destroyed states
	  *  in the table, and every cell would be copied for nothing.
	  * `auto &&` binds to whatever the iterator yields (reference or proxy value).
	  */
	for (auto && elem : table)
	{
		AggregateDataPtr & data = Method::getAggregateData(elem.second);

		/** If an exception (usually out of memory, thrown by MemoryTracker) occurred
		  *  after the key was inserted into the hash table but before all aggregate function states were created,
		  *  then data will be equal to nullptr.
		  */
		if (nullptr == data)
			continue;

		for (size_t i = 0; i < params.aggregates_size; ++i)
			if (!aggregate_functions[i]->isState())
				aggregate_functions[i]->destroy(data + offsets_of_aggregate_states[i]);

		/// Mark the cell as destroyed so that the states cannot be destroyed a second time.
		data = nullptr;
	}
}


/** Destroys the aggregate function states stored in `result.without_key`
  *  and resets that pointer to nullptr. Does nothing if the pointer is already nullptr.
  * States of functions for which isState() returns true are skipped.
  */
void Aggregator::destroyWithoutKey(AggregatedDataVariants & result) const
{
	AggregatedDataWithoutKey & states = result.without_key;

	/// Nothing was created, or it has already been destroyed.
	if (nullptr == states)
		return;

	for (size_t idx = 0; idx < params.aggregates_size; ++idx)
	{
		if (aggregate_functions[idx]->isState())
			continue;

		aggregate_functions[idx]->destroy(states + offsets_of_aggregate_states[idx]);
	}

	states = nullptr;
}


/** Destroys all aggregate function states held by `result`.
  *
  * Does nothing if `result` is empty.
  * The states without key are destroyed when the variant is `without_key` or when `params.overflow_row` is set;
  *  after that the states in the hash table of the current variant are destroyed.
  * Throws UNKNOWN_AGGREGATED_DATA_VARIANT if the type of `result` matches no known variant.
  */
void Aggregator::destroyAllAggregateStates(AggregatedDataVariants & result)
{
	if (result.size() == 0)
		return;

	LOG_TRACE(log, "Destroying aggregate states");

	/// Which data structure holds the aggregated data?
	const bool is_without_key = (result.type == AggregatedDataVariants::Type::without_key);

	if (is_without_key || params.overflow_row)
	{
		destroyWithoutKey(result);
	}

#define M(VARIANT, IS_TWO_LEVEL) \
	else if (result.type == AggregatedDataVariants::Type::VARIANT) \
		destroyImpl(*result.VARIANT, result.VARIANT->data);

	if (false) {}
	APPLY_FOR_AGGREGATED_VARIANTS(M)
#undef M
	else if (!is_without_key)
		throw Exception("Unknown aggregated data variant.", ErrorCodes::UNKNOWN_AGGREGATED_DATA_VARIANT);
}


/** Builds a textual identifier of the aggregator from its parameters:
  *  the key names (if no key positions are set) or the key positions,
  *  followed by the column names of the aggregates.
  */
String Aggregator::getID() const
{
	std::stringstream id;

	const bool keys_given_by_name = params.keys.empty();

	if (keys_given_by_name)
	{
		id << "key_names";
		for (const auto & key_name : params.key_names)
			id << ", " << key_name;
	}
	else
	{
		id << "keys";
		for (const auto & key_position : params.keys)
			id << ", " << key_position;
	}

	id << ", aggregates";
	for (size_t idx = 0; idx < params.aggregates_size; ++idx)
	{
		const auto & aggregate = params.aggregates[idx];
		id << ", " << aggregate.column_name;
	}

	return id.str();
}

void Aggregator::setCancellationHook(const CancellationHook cancellation_hook)
{
	isCancelled = cancellation_hook;
}


}
-												dbms: improved performance of queries with large aggregation result [#CONV-2944].



											
										
										
											2013-02-03 18:39:09 +00:00
+								#include <iomanip>
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2014-12-30 12:58:02 +00:00
+								#include <thread>
 								#include <future>
-												dbms: improved performance of queries with large aggregation result [#CONV-2944].



											
										
										
											2013-02-03 18:39:09 +00:00
-												dbms: Aggregator.cpp include <cxxabi.h>
@milovidov check if this fix is rightful

											
										
										
											2015-01-12 08:06:17 +00:00
+								#include <cxxabi.h>
-												Moved file [#METR-17973].

											
										
										
											2015-10-05 00:44:40 +00:00
+								#include <DB/Common/Stopwatch.h>
-												dbms: more memory efficient merging aggregated states [#METR-17000].

											
										
										
											2015-12-06 16:22:01 +00:00
+								#include <DB/Common/setThreadName.h>
-												dbms: improved performance of queries with large aggregation result [#CONV-2944].



											
										
										
											2013-02-03 18:39:09 +00:00
-												dbms: development [#CONV-2944].



											
										
										
											2011-09-19 03:34:23 +00:00
+								#include <DB/DataTypes/DataTypeAggregateFunction.h>
-												dbms: development [#CONV-2944].



											
										
										
											2011-09-26 07:25:22 +00:00
+								#include <DB/Columns/ColumnsNumber.h>
-												dbms: added full support of GROUP BY arrays [#METR-13168].

											
										
										
											2015-10-04 06:10:48 +00:00
+								#include <DB/Columns/ColumnArray.h>
-												dbms: development [#CONV-2944].



											
										
										
											2012-07-15 23:13:08 +00:00
+								#include <DB/AggregateFunctions/AggregateFunctionCount.h>
-												dbms: added memory-efficient mode of distributed aggregation [#METR-17536].

											
										
										
											2015-07-30 23:41:02 +00:00
+								#include <DB/DataStreams/IProfilingBlockInputStream.h>
-												dbms: external aggregation: development [#METR-17000].

											
										
										
											2015-11-30 19:57:46 +00:00
+								#include <DB/DataStreams/NativeBlockOutputStream.h>
-												dbms: more memory efficient merging aggregated states [#METR-17000].

											
										
										
											2015-12-06 16:22:01 +00:00
+								#include <DB/DataStreams/NullBlockInputStream.h>
-												dbms: external aggregation: development [#METR-17000].

											
										
										
											2015-11-30 19:57:46 +00:00
+								#include <DB/IO/WriteBufferFromFile.h>
 								#include <DB/IO/CompressedWriteBuffer.h>
-												dbms: development [#CONV-2944].



											
										
										
											2011-09-19 03:34:23 +00:00
 								#include <DB/Interpreters/Aggregator.h>
-												dbms: renamed Revision to ClickHouseRevision. Daemon to BaseDaemon

											
										
										
											2016-02-09 17:06:50 +00:00
+								#include <common/ClickHouseRevision.h>
-												dbms: development.



											
										
										
											2011-09-19 01:42:16 +00:00
 								namespace DB
 								{
-												dbms: cutting dependency [#METR-2944]..

											
										
										
											2016-01-11 21:46:36 +00:00
+								namespace ErrorCodes
 								{
 									extern const int CANNOT_COMPILE_CODE;
 									extern const int TOO_MUCH_ROWS;
 									extern const int EMPTY_DATA_PASSED;
 									extern const int CANNOT_MERGE_DIFFERENT_AGGREGATED_DATA_VARIANTS;
 								}
-												dbms: development [#CONV-2944].



											
										
										
											2011-09-26 07:25:22 +00:00
-												dbms: fixed possible leak [#CONV-2944].



											
										
										
											2013-02-16 18:59:05 +00:00
+								AggregatedDataVariants::~AggregatedDataVariants()
 								{
-												dbms: additional performance improvement [#METR-2944].



											
										
										
											2013-11-03 23:54:12 +00:00
+									if (aggregator && !aggregator->all_aggregates_has_trivial_destructor)
-												dbms: Aggregator: decomposed code to easier trying more aggregation methods; performance is suddenly improved up to 25%; fixed memory leak when exception while aggregating by KEYS_128 method [#METR-2944].

											
										
										
											2014-05-10 00:31:22 +00:00
+									{
 										try
 										{
-												dbms: fixed segfault in case of memory limit exceeded [#METR-11160].

											
										
										
											2014-05-19 19:41:56 +00:00
+											aggregator->destroyAllAggregateStates(*this);
-												dbms: Aggregator: decomposed code to easier trying more aggregation methods; performance is suddenly improved up to 25%; fixed memory leak when exception while aggregating by KEYS_128 method [#METR-2944].

											
										
										
											2014-05-10 00:31:22 +00:00
+										}
 										catch (...)
 										{
 											tryLogCurrentException(__PRETTY_FUNCTION__);
 										}
 									}
-												dbms: fixed possible leak [#CONV-2944].



											
										
										
											2013-02-16 18:59:05 +00:00
+								}
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2014-12-30 12:58:02 +00:00
+								void AggregatedDataVariants::convertToTwoLevel()
 								{
 									if (aggregator)
 										LOG_TRACE(aggregator->log, "Converting aggregation data to two-level.");
 									switch (type)
 									{
 									#define M(NAME) \
 										case Type::NAME: \
 											NAME ## _two_level.reset(new decltype(NAME ## _two_level)::element_type(*NAME)); \
 											NAME.reset(); \
 											type = Type::NAME ## _two_level; \
 											break;
 										APPLY_FOR_VARIANTS_CONVERTIBLE_TO_TWO_LEVEL(M)
 									#undef M
 										default:
 											throw Exception("Wrong data variant passed.", ErrorCodes::LOGICAL_ERROR);
 									}
 								}
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+								void Aggregator::Params::calculateColumnNumbers(const Block & block)
 								{
 									if (keys.empty() && !key_names.empty())
 										for (Names::const_iterator it = key_names.begin(); it != key_names.end(); ++it)
 											keys.push_back(block.getPositionByName(*it));
 									for (AggregateDescriptions::iterator it = aggregates.begin(); it != aggregates.end(); ++it)
 										if (it->arguments.empty() && !it->argument_names.empty())
 											for (Names::const_iterator jt = it->argument_names.begin(); jt != it->argument_names.end(); ++jt)
 												it->arguments.push_back(block.getPositionByName(*jt));
 								}
-												dbms: development of memory efficient distributed aggregation method [#METR-17536].

											
										
										
											2015-09-07 07:40:14 +00:00
+								void Aggregator::initialize(const Block & block)
-												dbms: development [#CONV-2944].



											
										
										
											2012-03-05 07:58:34 +00:00
+								{
-												Merge

											
										
										
											2015-04-16 14:27:56 +00:00
+									if (isCancelled())
 										return;
-												dbms: tiny modifications [#METR-2944].

											
										
										
											2015-01-08 18:52:48 +00:00
+									std::lock_guard<std::mutex> lock(mutex);
-												dbms: development [#CONV-2944].



											
										
										
											2012-03-05 07:58:34 +00:00
 									if (initialized)
 										return;
 									initialized = true;
-												dbms: probably fixed error in Aggregator [#CONV-2944].



											
										
										
											2013-02-13 19:24:19 +00:00
-												dbms: fixed error [#METR-19288].

											
										
										
											2015-12-07 20:08:00 +00:00
+									if (current_memory_tracker)
 										memory_usage_before_aggregation = current_memory_tracker->get();
-												dbms: external aggregation: development [#METR-17000].

											
										
										
											2015-11-30 19:57:46 +00:00
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+									aggregate_functions.resize(params.aggregates_size);
 									for (size_t i = 0; i < params.aggregates_size; ++i)
 										aggregate_functions[i] = params.aggregates[i].function.get();
-												dbms: probably fixed error in Aggregator [#CONV-2944].



											
										
										
											2013-02-13 19:24:19 +00:00
 									/// Инициализируем размеры состояний и смещения для агрегатных функций.
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+									offsets_of_aggregate_states.resize(params.aggregates_size);
-												dbms: probably fixed error in Aggregator [#CONV-2944].



											
										
										
											2013-02-13 19:24:19 +00:00
+									total_size_of_aggregate_states = 0;
-												dbms: additional performance improvement [#METR-2944].



											
										
										
											2013-11-03 23:54:12 +00:00
+									all_aggregates_has_trivial_destructor = true;
-												dbms: probably fixed error in Aggregator [#CONV-2944].



											
										
										
											2013-02-13 19:24:19 +00:00
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+									for (size_t i = 0; i < params.aggregates_size; ++i)
-												dbms: probably fixed error in Aggregator [#CONV-2944].



											
										
										
											2013-02-13 19:24:19 +00:00
+									{
 										offsets_of_aggregate_states[i] = total_size_of_aggregate_states;
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+										total_size_of_aggregate_states += params.aggregates[i].function->sizeOfData();
-												dbms: additional performance improvement [#METR-2944].



											
										
										
											2013-11-03 23:54:12 +00:00
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+										if (!params.aggregates[i].function->hasTrivialDestructor())
-												dbms: additional performance improvement [#METR-2944].



											
										
										
											2013-11-03 23:54:12 +00:00
+											all_aggregates_has_trivial_destructor = false;
-												dbms: probably fixed error in Aggregator [#CONV-2944].



											
										
										
											2013-02-13 19:24:19 +00:00
+									}
-												Merge

											
										
										
											2015-04-16 14:27:56 +00:00
+									if (isCancelled())
 										return;
-												dbms: probably fixed error in Aggregator [#CONV-2944].



											
										
										
											2013-02-13 19:24:19 +00:00
+									/** Всё остальное - только если передан непустой block.
 									  * (всё остальное не нужно в методе merge блоков с готовыми состояниями агрегатных функций).
 									  */
 									if (!block)
 										return;
-												dbms: improved performance on short queries [#METR-11571].

											
										
										
											2014-06-26 00:58:14 +00:00
-												dbms: development [#CONV-2944].



											
										
										
											2012-03-05 07:58:34 +00:00
+									/// Преобразуем имена столбцов в номера, если номера не заданы
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+									params.calculateColumnNumbers(block);
-												dbms: development [#CONV-2944].



											
										
										
											2012-03-05 07:58:34 +00:00
-												Merge

											
										
										
											2015-04-16 14:27:56 +00:00
+									if (isCancelled())
 										return;
-												dbms: development [#CONV-2944].



											
										
										
											2012-03-05 07:58:34 +00:00
+									/// Создадим пример блока, описывающего результат
 									if (!sample)
 									{
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+										for (size_t i = 0; i < params.keys_size; ++i)
-												dbms: development [#CONV-2944].



											
										
										
											2012-05-31 01:13:15 +00:00
+										{
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+											sample.insert(block.getByPosition(params.keys[i]).cloneEmpty());
-												dbms: fixed error with tuples of consts [#METR-18586].

											
										
										
											2015-10-28 21:21:18 +00:00
+											if (auto converted = sample.getByPosition(i).column->convertToFullColumnIfConst())
 												sample.getByPosition(i).column = converted;
-												dbms: development [#CONV-2944].



											
										
										
											2012-05-31 01:13:15 +00:00
+										}
-												dbms: development [#CONV-2944].



											
										
										
											2012-03-05 07:58:34 +00:00
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+										for (size_t i = 0; i < params.aggregates_size; ++i)
-												dbms: development [#CONV-2944].



											
										
										
											2012-03-05 07:58:34 +00:00
+										{
-												dbms: renamed ColumnWithNameAndType to ColumnWithTypeAndName for clarification [#METR-2944].

											
										
										
											2015-07-17 01:27:35 +00:00
+											ColumnWithTypeAndName col;
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+											col.name = params.aggregates[i].column_name;
-												dbms: probably fixed error with aggregate function serialization (incomplete) [#CONV-2944].



											
										
										
											2012-10-24 18:14:36 +00:00
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+											size_t arguments_size = params.aggregates[i].arguments.size();
-												dbms: probably fixed error with aggregate function serialization (incomplete) [#CONV-2944].



											
										
										
											2012-10-24 18:14:36 +00:00
+											DataTypes argument_types(arguments_size);
 											for (size_t j = 0; j < arguments_size; ++j)
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+												argument_types[j] = block.getByPosition(params.aggregates[i].arguments[j]).type;
-												dbms: Aggregator: decomposed code to easier trying more aggregation methods; performance is suddenly improved up to 25%; fixed memory leak when exception while aggregating by KEYS_128 method [#METR-2944].

											
										
										
											2014-05-10 00:31:22 +00:00
-												Using std::shared_ptr for data types [#METR-21503].

											
										
										
											2016-05-28 07:48:40 +00:00
+											col.type = std::make_shared<DataTypeAggregateFunction>(params.aggregates[i].function, argument_types, params.aggregates[i].parameters);
-												dbms: development [#METR-10894].

											
										
										
											2014-06-05 23:52:28 +00:00
+											col.column = col.type->createColumn();
-												dbms: development [#CONV-2944].



											
										
										
											2012-03-05 07:58:34 +00:00
-												Avoid copying ColumnWithTypeAndName [#METR-22173].

											
										
										
											2016-08-04 23:35:07 +00:00
+											sample.insert(std::move(col));
-												dbms: development [#CONV-2944].



											
										
										
											2012-03-05 07:58:34 +00:00
+										}
-												dbms: Aggregator: decomposed code to easier trying more aggregation methods; performance is suddenly improved up to 25%; fixed memory leak when exception while aggregating by KEYS_128 method [#METR-2944].

											
										
										
											2014-05-10 00:31:22 +00:00
+									}
-												dbms: development [#CONV-2944].



											
										
										
											2012-03-05 07:58:34 +00:00
+								}
-												dbms: fixed error in memory-efficient merging of aggregated states [#METR-17000].

											
										
										
											2015-12-09 02:56:18 +00:00
+								void Aggregator::setSampleBlock(const Block & block)
 								{
 									std::lock_guard<std::mutex> lock(mutex);
 									if (!sample)
 										sample = block.cloneEmpty();
 								}
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-10 02:30:03 +00:00
+								void Aggregator::compileIfPossible(AggregatedDataVariants::Type type)
 								{
 									std::lock_guard<std::mutex> lock(mutex);
 									if (compiled_if_possible)
 										return;
 									compiled_if_possible = true;
 									std::string method_typename;
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-13 01:57:22 +00:00
+									std::string method_typename_two_level;
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-10 02:30:03 +00:00
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-13 01:57:22 +00:00
+									if (false) {}
 								#define M(NAME) \
 									else if (type == AggregatedDataVariants::Type::NAME) \
 									{ \
 										method_typename = "decltype(AggregatedDataVariants::" #NAME ")::element_type"; \
 										method_typename_two_level = "decltype(AggregatedDataVariants::" #NAME "_two_level)::element_type"; \
 									}
 									APPLY_FOR_VARIANTS_CONVERTIBLE_TO_TWO_LEVEL(M)
 								#undef M
 								#define M(NAME) \
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-10 02:30:03 +00:00
+									else if (type == AggregatedDataVariants::Type::NAME) \
-												dbms: addition to prev. revision [#METR-2944].

											
										
										
											2015-01-10 02:34:38 +00:00
+										method_typename = "decltype(AggregatedDataVariants::" #NAME ")::element_type";
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-10 02:30:03 +00:00
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-13 01:57:22 +00:00
+									APPLY_FOR_VARIANTS_NOT_CONVERTIBLE_TO_TWO_LEVEL(M)
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-10 02:30:03 +00:00
+								#undef M
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-13 03:03:45 +00:00
+									else if (type == AggregatedDataVariants::Type::without_key) {}
 									else
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-10 02:30:03 +00:00
+										throw Exception("Unknown aggregated data variant.", ErrorCodes::UNKNOWN_AGGREGATED_DATA_VARIANT);
 									/// Список типов агрегатных функций.
 									std::stringstream aggregate_functions_typenames_str;
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+									for (size_t i = 0; i < params.aggregates_size; ++i)
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-10 02:30:03 +00:00
+									{
-												Fixed errors in clang (part 4) [#METR-2807].

											
										
										
											2015-01-21 04:23:22 +00:00
+										IAggregateFunction & func = *aggregate_functions[i];
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-10 02:30:03 +00:00
+										int status = 0;
-												Fixed errors in clang (part 4) [#METR-2807].

											
										
										
											2015-01-21 04:23:22 +00:00
+										char * type_name_ptr = abi::__cxa_demangle(typeid(func).name(), 0, 0, &status);
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-10 02:30:03 +00:00
+										std::string type_name = type_name_ptr;
 										free(type_name_ptr);
 										if (status)
-												Fixed errors in clang (part 4) [#METR-2807].

											
										
										
											2015-01-21 04:23:22 +00:00
+											throw Exception("Cannot compile code: cannot demangle name " + String(typeid(func).name())
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-13 01:57:22 +00:00
+												+ ", status: " + toString(status), ErrorCodes::CANNOT_COMPILE_CODE);
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-10 02:30:03 +00:00
 										aggregate_functions_typenames_str << ((i != 0) ? ", " : "") << type_name;
 									}
 									std::string aggregate_functions_typenames = aggregate_functions_typenames_str.str();
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-13 03:03:45 +00:00
+									std::stringstream key_str;
 									key_str << "Aggregate: ";
 									if (!method_typename.empty())
 										key_str << method_typename + ", ";
 									key_str << aggregate_functions_typenames;
 									std::string key = key_str.str();
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-10 02:30:03 +00:00
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-13 01:57:22 +00:00
+									auto get_code = [method_typename, method_typename_two_level, aggregate_functions_typenames]
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-10 02:30:03 +00:00
+									{
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-11 02:00:26 +00:00
+										/// Короткий кусок кода, представляющий собой явное инстанцирование шаблона.
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-10 02:30:03 +00:00
+										std::stringstream code;
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-18 01:18:39 +00:00
+										code <<		/// Нет явного включения заголовочного файла. Он подключается с помощью опции компилятора -include.
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-10 02:30:03 +00:00
+											"namespace DB\n"
 											"{\n"
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-13 01:57:22 +00:00
+											"\n";
 										/// Может быть до двух инстанцирований шаблона - для обычного и two_level вариантов.
 										auto append_code_for_specialization =
 											[&code, &aggregate_functions_typenames] (const std::string & method_typename, const std::string & suffix)
 										{
 											code <<
 												"template void Aggregator::executeSpecialized<\n"
 													"\t" << method_typename << ", TypeList<" << aggregate_functions_typenames << ">>(\n"
 													"\t" << method_typename << " &, Arena *, size_t, ConstColumnPlainPtrs &,\n"
 													"\tAggregateColumns &, const Sizes &, StringRefs &, bool, AggregateDataPtr) const;\n"
 												"\n"
 												"static void wrapper" << suffix << "(\n"
 													"\tconst Aggregator & aggregator,\n"
 													"\t" << method_typename << " & method,\n"
 													"\tArena * arena,\n"
 													"\tsize_t rows,\n"
 													"\tConstColumnPlainPtrs & key_columns,\n"
 													"\tAggregator::AggregateColumns & aggregate_columns,\n"
 													"\tconst Sizes & key_sizes,\n"
 													"\tStringRefs & keys,\n"
 													"\tbool no_more_keys,\n"
 													"\tAggregateDataPtr overflow_row)\n"
 												"{\n"
 													"\taggregator.executeSpecialized<\n"
 														"\t\t" << method_typename << ", TypeList<" << aggregate_functions_typenames << ">>(\n"
 														"\t\tmethod, arena, rows, key_columns, aggregate_columns, key_sizes, keys, no_more_keys, overflow_row);\n"
 												"}\n"
 												"\n"
-												Fixed errors in clang (part 4) [#METR-2807].

											
										
										
											2015-01-21 04:23:22 +00:00
+												"void * getPtr" << suffix << "() __attribute__((__visibility__(\"default\")));\n"
 												"void * getPtr" << suffix << "()\n"	/// Без этой обёртки непонятно, как достать нужный символ из скомпилированной библиотеки.
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-13 01:57:22 +00:00
+												"{\n"
-												Fixed errors in clang (part 4) [#METR-2807].

											
										
										
											2015-01-21 04:23:22 +00:00
+													"\treturn reinterpret_cast<void *>(&wrapper" << suffix << ");\n"
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-13 01:57:22 +00:00
+												"}\n";
 										};
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-13 03:03:45 +00:00
+										if (!method_typename.empty())
 											append_code_for_specialization(method_typename, "");
 										else
 										{
 											/// Для метода without_key.
 											code <<
 												"template void Aggregator::executeSpecializedWithoutKey<\n"
 													"\t" << "TypeList<" << aggregate_functions_typenames << ">>(\n"
 													"\tAggregatedDataWithoutKey &, size_t, AggregateColumns &) const;\n"
 												"\n"
 												"static void wrapper(\n"
 													"\tconst Aggregator & aggregator,\n"
 													"\tAggregatedDataWithoutKey & method,\n"
 													"\tsize_t rows,\n"
 													"\tAggregator::AggregateColumns & aggregate_columns)\n"
 												"{\n"
 													"\taggregator.executeSpecializedWithoutKey<\n"
 														"\t\tTypeList<" << aggregate_functions_typenames << ">>(\n"
 														"\t\tmethod, rows, aggregate_columns);\n"
 												"}\n"
 												"\n"
-												Fixed errors in clang (part 4) [#METR-2807].

											
										
										
											2015-01-21 04:23:22 +00:00
+												"void * getPtr() __attribute__((__visibility__(\"default\")));\n"
 												"void * getPtr()\n"
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-13 03:03:45 +00:00
+												"{\n"
-												Fixed errors in clang (part 4) [#METR-2807].

											
										
										
											2015-01-21 04:23:22 +00:00
+													"\treturn reinterpret_cast<void *>(&wrapper);\n"
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-13 03:03:45 +00:00
+												"}\n";
 										}
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-13 01:57:22 +00:00
 										if (!method_typename_two_level.empty())
 											append_code_for_specialization(method_typename_two_level, "TwoLevel");
 										else
 										{
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-13 03:03:45 +00:00
+											/// Заглушка.
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-13 01:57:22 +00:00
+											code <<
-												Fixed errors in clang (part 4) [#METR-2807].

											
										
										
											2015-01-21 04:23:22 +00:00
+												"void * getPtrTwoLevel() __attribute__((__visibility__(\"default\")));\n"
 												"void * getPtrTwoLevel()\n"
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-13 01:57:22 +00:00
+												"{\n"
 													"\treturn nullptr;\n"
 												"}\n";
 										}
 										code <<
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-10 02:30:03 +00:00
+											"}\n";
 										return code.str();
 									};
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-11 02:00:26 +00:00
+									auto compiled_data_owned_by_callback = compiled_data;
 									auto on_ready = [compiled_data_owned_by_callback] (SharedLibraryPtr & lib)
 									{
 										if (compiled_data_owned_by_callback.unique())	/// Aggregator уже уничтожен.
 											return;
 										compiled_data_owned_by_callback->compiled_aggregator = lib;
-												Fixed errors in clang (part 4) [#METR-2807].

											
										
										
											2015-01-21 04:23:22 +00:00
+										compiled_data_owned_by_callback->compiled_method_ptr = lib->get<void * (*) ()>("_ZN2DB6getPtrEv")();
 										compiled_data_owned_by_callback->compiled_two_level_method_ptr = lib->get<void * (*) ()>("_ZN2DB14getPtrTwoLevelEv")();
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-11 02:00:26 +00:00
+									};
 									/** Если библиотека уже была скомпилирована, то возвращается ненулевой SharedLibraryPtr.
 									  * Если библиотека не была скомпилирована, то увеличивается счётчик, и возвращается nullptr.
 									  * Если счётчик достигнул значения min_count_to_compile, то асинхронно (в отдельном потоке) запускается компиляция,
 									  *  по окончании которой вызывается колбэк on_ready.
 									  */
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+									SharedLibraryPtr lib = params.compiler->getOrCount(key, params.min_count_to_compile,
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-18 01:18:39 +00:00
+										"-include /usr/share/clickhouse/headers/dbms/include/DB/Interpreters/SpecializedAggregator.h",
 										get_code, on_ready);
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-10 02:30:03 +00:00
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-11 02:00:26 +00:00
+									/// Если результат уже готов.
 									if (lib)
 										on_ready(lib);
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-10 02:30:03 +00:00
+								}
-												dbms: improved performance of aggregation by many fields: lowered number of allocs; more direct memory layout; don't use temporary Fields; lowered memory consumption [#CONV-2944].



											
										
										
											2013-06-30 16:56:00 +00:00
+								AggregatedDataVariants::Type Aggregator::chooseAggregationMethod(const ConstColumnPlainPtrs & key_columns, Sizes & key_sizes)
-												dbms: development [#CONV-2944].



											
										
										
											2012-05-30 01:38:02 +00:00
+								{
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-13 01:57:22 +00:00
+									/** Возвращает обычные (не two-level) методы, так как обработка начинается с них.
 									  * Затем, в процессе работы, данные могут быть переконвертированы в two-level структуру, если их становится много.
 									  */
-												dbms: Aggregator: added specialization for many (up to 256 bit) fixed-size keys (up to 3x performance improvement) [#METR-2944].

											
										
										
											2015-02-22 05:53:16 +00:00
+									bool all_fixed = true;
-												dbms: development [#CONV-2944].



											
										
										
											2012-05-30 01:38:02 +00:00
+									size_t keys_bytes = 0;
-												dbms: added full support of GROUP BY arrays [#METR-13168].

											
										
										
											2015-10-04 06:10:48 +00:00
 									size_t num_array_keys = 0;
 									bool has_arrays_of_non_fixed_elems = false;
 									bool all_non_array_keys_are_fixed = true;
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+									key_sizes.resize(params.keys_size);
 									for (size_t j = 0; j < params.keys_size; ++j)
-												dbms: development [#CONV-2944].



											
										
										
											2012-05-30 01:38:02 +00:00
+									{
-												dbms: added full support of GROUP BY arrays [#METR-13168].

											
										
										
											2015-10-04 06:10:48 +00:00
+										if (key_columns[j]->isFixed())
 										{
 											key_sizes[j] = key_columns[j]->sizeOfField();
 											keys_bytes += key_sizes[j];
 										}
 										else
-												dbms: development [#CONV-2944].



											
										
										
											2012-05-30 01:38:02 +00:00
+										{
-												dbms: Aggregator: added specialization for many (up to 256 bit) fixed-size keys (up to 3x performance improvement) [#METR-2944].

											
										
										
											2015-02-22 05:53:16 +00:00
+											all_fixed = false;
-												dbms: added full support of GROUP BY arrays [#METR-13168].

											
										
										
											2015-10-04 06:10:48 +00:00
 											if (const ColumnArray * arr = typeid_cast<const ColumnArray *>(key_columns[j]))
 											{
 												++num_array_keys;
 												if (!arr->getData().isFixed())
 													has_arrays_of_non_fixed_elems = true;
 											}
 											else
 												all_non_array_keys_are_fixed = false;
-												dbms: development [#CONV-2944].



											
										
										
											2012-05-30 01:38:02 +00:00
+										}
 									}
 									/// Если ключей нет
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+									if (params.keys_size == 0)
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2014-12-30 10:16:23 +00:00
+										return AggregatedDataVariants::Type::without_key;
-												dbms: development [#CONV-2944].



											
										
										
											2012-05-30 01:38:02 +00:00
-												dbms: improved performance of aggregation by FixedString columns [#CONV-2944].



											
										
										
											2013-07-19 20:12:02 +00:00
+									/// Если есть один числовой ключ, который помещается в 64 бита
-												dbms: cleanup [#METR-19266]

											
										
										
											2016-08-18 15:58:46 +00:00
+									if (params.keys_size == 1 && key_columns[0]->isNumericNotNullable())
-												dbms: improved performance of aggregation by one numeric key (up to: 2x for UInt8, 5x for UInt16, 1.1x for UInt32, UInt64) [#METR-2944].

											
										
										
											2014-10-29 01:18:50 +00:00
+									{
 										size_t size_of_field = key_columns[0]->sizeOfField();
 										if (size_of_field == 1)
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2014-12-30 10:16:23 +00:00
+											return AggregatedDataVariants::Type::key8;
-												dbms: improved performance of aggregation by one numeric key (up to: 2x for UInt8, 5x for UInt16, 1.1x for UInt32, UInt64) [#METR-2944].

											
										
										
											2014-10-29 01:18:50 +00:00
+										if (size_of_field == 2)
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2014-12-30 10:16:23 +00:00
+											return AggregatedDataVariants::Type::key16;
-												dbms: improved performance of aggregation by one numeric key (up to: 2x for UInt8, 5x for UInt16, 1.1x for UInt32, UInt64) [#METR-2944].

											
										
										
											2014-10-29 01:18:50 +00:00
+										if (size_of_field == 4)
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2014-12-30 10:16:23 +00:00
+											return AggregatedDataVariants::Type::key32;
-												dbms: improved performance of aggregation by one numeric key (up to: 2x for UInt8, 5x for UInt16, 1.1x for UInt32, UInt64) [#METR-2944].

											
										
										
											2014-10-29 01:18:50 +00:00
+										if (size_of_field == 8)
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2014-12-30 10:16:23 +00:00
+											return AggregatedDataVariants::Type::key64;
-												dbms: improved performance of aggregation by one numeric key (up to: 2x for UInt8, 5x for UInt16, 1.1x for UInt32, UInt64) [#METR-2944].

											
										
										
											2014-10-29 01:18:50 +00:00
+										throw Exception("Logical error: numeric column has sizeOfField not in 1, 2, 4, 8.", ErrorCodes::LOGICAL_ERROR);
 									}
-												dbms: development [#CONV-2944].



											
										
										
											2012-05-30 01:38:02 +00:00
-												dbms: Aggregator: added specialization for many (up to 256 bit) fixed-size keys (up to 3x performance improvement) [#METR-2944].

											
										
										
											2015-02-22 05:53:16 +00:00
+									/// Если ключи помещаются в N бит, будем использовать хэш-таблицу по упакованным в N-бит ключам
 									if (all_fixed && keys_bytes <= 16)
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2014-12-30 10:16:23 +00:00
+										return AggregatedDataVariants::Type::keys128;
-												dbms: Aggregator: added specialization for many (up to 256 bit) fixed-size keys (up to 3x performance improvement) [#METR-2944].

											
										
										
											2015-02-22 05:53:16 +00:00
+									if (all_fixed && keys_bytes <= 32)
 										return AggregatedDataVariants::Type::keys256;
-												dbms: improved performance of aggregation by FixedString columns [#CONV-2944].



											
										
										
											2013-07-19 20:12:02 +00:00
-												dbms: development [#CONV-2944].



											
										
										
											2012-05-30 01:38:02 +00:00
+									/// Если есть один строковый ключ, то используем хэш-таблицу с ним
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+									if (params.keys_size == 1 && typeid_cast<const ColumnString *>(key_columns[0]))
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2014-12-30 10:16:23 +00:00
+										return AggregatedDataVariants::Type::key_string;
-												dbms: development [#CONV-2944].



											
										
										
											2012-05-30 01:38:02 +00:00
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+									if (params.keys_size == 1 && typeid_cast<const ColumnFixedString *>(key_columns[0]))
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2014-12-30 10:16:23 +00:00
+										return AggregatedDataVariants::Type::key_fixed_string;
-												dbms: Aggregator: decomposed code to easier trying more aggregation methods; performance is suddenly improved up to 25%; fixed memory leak when exception while aggregating by KEYS_128 method [#METR-2944].

											
										
										
											2014-05-10 00:31:22 +00:00
-												dbms: added full support of GROUP BY arrays [#METR-13168].

											
										
										
											2015-10-04 06:10:48 +00:00
+									/** Если есть массивы.
 									  * Если есть не более одного массива из элементов фиксированной длины, и остальные ключи фиксированной длины,
 									  *  то всё ещё можно использовать метод concat. Иначе - serialized.
 									  */
 									if (num_array_keys > 1 || has_arrays_of_non_fixed_elems || (num_array_keys == 1 && !all_non_array_keys_are_fixed))
 										return AggregatedDataVariants::Type::serialized;
-												dbms: added aggregation method 'concat' - performance improvement in generic case [#METR-2944].

											
										
										
											2015-02-22 16:09:16 +00:00
+									/// Иначе будем агрегировать по конкатенации ключей.
 									return AggregatedDataVariants::Type::concat;
 									/// NOTE AggregatedDataVariants::Type::hashed не используется.
-												dbms: development [#CONV-2944].



											
										
										
											2012-05-30 01:38:02 +00:00
+								}
-												dbms: fixed segfault in case of memory limit exceeded [#METR-11160].

											
										
										
											2014-05-19 19:41:56 +00:00
+								void Aggregator::createAggregateStates(AggregateDataPtr & aggregate_data) const
 								{
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+									for (size_t j = 0; j < params.aggregates_size; ++j)
-												dbms: fixed segfault in case of memory limit exceeded [#METR-11160].

											
										
										
											2014-05-19 19:41:56 +00:00
+									{
 										try
 										{
 											/** Может возникнуть исключение при нехватке памяти.
 											  * Для того, чтобы потом всё правильно уничтожилось, "откатываем" часть созданных состояний.
 											  * Код не очень удобный.
 											  */
 											aggregate_functions[j]->create(aggregate_data + offsets_of_aggregate_states[j]);
 										}
 										catch (...)
 										{
 											for (size_t rollback_j = 0; rollback_j < j; ++rollback_j)
-												dbms: Fixed error in prev. revision [#METR-11160].

											
										
										
											2014-05-20 19:30:39 +00:00
+												aggregate_functions[rollback_j]->destroy(aggregate_data + offsets_of_aggregate_states[rollback_j]);
-												dbms: fixed segfault in case of memory limit exceeded [#METR-11160].

											
										
										
											2014-05-19 19:41:56 +00:00
 											throw;
 										}
 									}
 								}
-												dbms: improved performance of aggregation by one numeric key (up to: 2x for UInt8, 5x for UInt16, 1.1x for UInt32, UInt64) [#METR-2944].

											
										
										
											2014-10-29 01:18:50 +00:00
+								/** Интересно - если убрать noinline, то gcc зачем-то инлайнит эту функцию, и производительность уменьшается (~10%).
 								  * (Возможно из-за того, что после инлайна этой функции, перестают инлайниться более внутренние функции.)
 								  * Инлайнить не имеет смысла, так как внутренний цикл находится целиком внутри этой функции.
 								  */
-												dbms: Aggregator: decomposed code to easier trying more aggregation methods; performance is suddenly improved up to 25%; fixed memory leak when exception while aggregating by KEYS_128 method [#METR-2944].

											
										
										
											2014-05-10 00:31:22 +00:00
+								template <typename Method>
-												dbms: improved performance of aggregation by one numeric key (up to: 2x for UInt8, 5x for UInt16, 1.1x for UInt32, UInt64) [#METR-2944].

											
										
										
											2014-10-29 01:18:50 +00:00
+								void NO_INLINE Aggregator::executeImpl(
-												dbms: Aggregator: decomposed code to easier trying more aggregation methods; performance is suddenly improved up to 25%; fixed memory leak when exception while aggregating by KEYS_128 method [#METR-2944].

											
										
										
											2014-05-10 00:31:22 +00:00
+									Method & method,
 									Arena * aggregates_pool,
 									size_t rows,
 									ConstColumnPlainPtrs & key_columns,
-												dbms: improved performance of Aggregator in non-compiled case [#METR-2944].

											
										
										
											2015-11-21 19:46:27 +00:00
+									AggregateFunctionInstruction * aggregate_instructions,
-												dbms: Aggregator: decomposed code to easier trying more aggregation methods; performance is suddenly improved up to 25%; fixed memory leak when exception while aggregating by KEYS_128 method [#METR-2944].

											
										
										
											2014-05-10 00:31:22 +00:00
+									const Sizes & key_sizes,
 									StringRefs & keys,
 									bool no_more_keys,
 									AggregateDataPtr overflow_row) const
 								{
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 06:49:32 +00:00
+									typename Method::State state;
 									state.init(key_columns);
-												dbms: Aggregator: decomposed code to easier trying more aggregation methods; performance is suddenly improved up to 25%; fixed memory leak when exception while aggregating by KEYS_128 method [#METR-2944].

											
										
										
											2014-05-10 00:31:22 +00:00
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2014-12-30 10:16:23 +00:00
+									if (!no_more_keys)
-												dbms: improved performance of Aggregator in non-compiled case [#METR-2944].

											
										
										
											2015-11-21 19:46:27 +00:00
+										executeImplCase<false>(method, state, aggregates_pool, rows, key_columns, aggregate_instructions, key_sizes, keys, overflow_row);
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2014-12-30 10:16:23 +00:00
+									else
-												dbms: improved performance of Aggregator in non-compiled case [#METR-2944].

											
										
										
											2015-11-21 19:46:27 +00:00
+										executeImplCase<true>(method, state, aggregates_pool, rows, key_columns, aggregate_instructions, key_sizes, keys, overflow_row);
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2014-12-30 10:16:23 +00:00
+								}
-												Fixed errors in clang (part 4) [#METR-2807].

											
										
										
											2015-01-21 04:23:22 +00:00
+								#ifndef __clang__
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2014-12-30 12:58:02 +00:00
+								#pragma GCC diagnostic push
 								#pragma GCC diagnostic ignored "-Wmaybe-uninitialized"
-												Fixed errors in clang (part 4) [#METR-2807].

											
										
										
											2015-01-21 04:23:22 +00:00
+								#endif
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2014-12-30 10:16:23 +00:00
 								template <bool no_more_keys, typename Method>
 								void NO_INLINE Aggregator::executeImplCase(
 									Method & method,
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 06:49:32 +00:00
+									typename Method::State & state,
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2014-12-30 10:16:23 +00:00
+									Arena * aggregates_pool,
 									size_t rows,
 									ConstColumnPlainPtrs & key_columns,
-												dbms: improved performance of Aggregator in non-compiled case [#METR-2944].

											
										
										
											2015-11-21 19:46:27 +00:00
+									AggregateFunctionInstruction * aggregate_instructions,
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2014-12-30 10:16:23 +00:00
+									const Sizes & key_sizes,
 									StringRefs & keys,
 									AggregateDataPtr overflow_row) const
 								{
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-13 01:57:22 +00:00
+									/// NOTE При редактировании этого кода, обратите также внимание на SpecializedAggregator.h.
-												dbms: Aggregator: decomposed code to easier trying more aggregation methods; performance is suddenly improved up to 25%; fixed memory leak when exception while aggregating by KEYS_128 method [#METR-2944].

											
										
										
											2014-05-10 00:31:22 +00:00
+									/// Для всех строчек.
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2014-12-30 12:58:02 +00:00
+									typename Method::iterator it;
 									typename Method::Key prev_key;
-												dbms: Aggregator: decomposed code to easier trying more aggregation methods; performance is suddenly improved up to 25%; fixed memory leak when exception while aggregating by KEYS_128 method [#METR-2944].

											
										
										
											2014-05-10 00:31:22 +00:00
+									for (size_t i = 0; i < rows; ++i)
 									{
 										bool inserted;			/// Вставили новый ключ, или такой ключ уже был?
 										bool overflow = false;	/// Новый ключ не поместился в хэш-таблицу из-за no_more_keys.
 										/// Получаем ключ для вставки в хэш-таблицу.
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+										typename Method::Key key = state.getKey(key_columns, params.keys_size, i, key_sizes, keys, *aggregates_pool);
-												dbms: Aggregator: decomposed code to easier trying more aggregation methods; performance is suddenly improved up to 25%; fixed memory leak when exception while aggregating by KEYS_128 method [#METR-2944].

											
										
										
											2014-05-10 00:31:22 +00:00
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2014-12-30 10:16:23 +00:00
+										if (!no_more_keys)	/// Вставляем.
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2014-12-30 12:58:02 +00:00
+										{
 											/// Оптимизация для часто повторяющихся ключей.
-												dbms: fixed error in prev. revision [#METR-2944].

											
										
										
											2015-02-22 18:02:54 +00:00
+											if (!Method::no_consecutive_keys_optimization)
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2014-12-30 12:58:02 +00:00
+											{
-												dbms: fixed error in prev. revision [#METR-2944].

											
										
										
											2015-02-22 18:02:54 +00:00
+												if (i != 0 && key == prev_key)
 												{
 													/// Добавляем значения в агрегатные функции.
 													AggregateDataPtr value = Method::getAggregateData(it->second);
-												dbms: improved performance of Aggregator in non-compiled case [#METR-2944].

											
										
										
											2015-11-21 19:46:27 +00:00
+													for (AggregateFunctionInstruction * inst = aggregate_instructions; inst->that; ++inst)
 														(*inst->func)(inst->that, value + inst->state_offset, inst->arguments, i);
-												dbms: fixed error in prev. revision [#METR-2944].

											
										
										
											2015-02-22 18:02:54 +00:00
 													method.onExistingKey(key, keys, *aggregates_pool);
 													continue;
 												}
 												else
 													prev_key = key;
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2014-12-30 12:58:02 +00:00
+											}
-												dbms: Aggregator: decomposed code to easier trying more aggregation methods; performance is suddenly improved up to 25%; fixed memory leak when exception while aggregating by KEYS_128 method [#METR-2944].

											
										
										
											2014-05-10 00:31:22 +00:00
+											method.data.emplace(key, it, inserted);
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2014-12-30 12:58:02 +00:00
+										}
-												dbms: Aggregator: decomposed code to easier trying more aggregation methods; performance is suddenly improved up to 25%; fixed memory leak when exception while aggregating by KEYS_128 method [#METR-2944].

											
										
										
											2014-05-10 00:31:22 +00:00
+										else
 										{
 											/// Будем добавлять только если ключ уже есть.
 											inserted = false;
 											it = method.data.find(key);
 											if (method.data.end() == it)
 												overflow = true;
 										}
 										/// Если ключ не поместился, и данные не надо агрегировать в отдельную строку, то делать нечего.
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2014-12-30 10:16:23 +00:00
+										if (no_more_keys && overflow && !overflow_row)
-												dbms: added aggregation method 'concat' - performance improvement in generic case [#METR-2944].

											
										
										
											2015-02-22 16:09:16 +00:00
+										{
 											method.onExistingKey(key, keys, *aggregates_pool);
-												dbms: Aggregator: decomposed code to easier trying more aggregation methods; performance is suddenly improved up to 25%; fixed memory leak when exception while aggregating by KEYS_128 method [#METR-2944].

											
										
										
											2014-05-10 00:31:22 +00:00
+											continue;
-												dbms: added aggregation method 'concat' - performance improvement in generic case [#METR-2944].

											
										
										
											2015-02-22 16:09:16 +00:00
+										}
-												dbms: Aggregator: decomposed code to easier trying more aggregation methods; performance is suddenly improved up to 25%; fixed memory leak when exception while aggregating by KEYS_128 method [#METR-2944].

											
										
										
											2014-05-10 00:31:22 +00:00
-												some grammar fixes. [#METR-2807]

											
										
										
											2014-08-12 09:35:15 +00:00
+										/// Если вставили новый ключ - инициализируем состояния агрегатных функций, и возможно, что-нибудь связанное с ключом.
-												dbms: Aggregator: decomposed code to easier trying more aggregation methods; performance is suddenly improved up to 25%; fixed memory leak when exception while aggregating by KEYS_128 method [#METR-2944].

											
										
										
											2014-05-10 00:31:22 +00:00
+										if (inserted)
 										{
 											AggregateDataPtr & aggregate_data = Method::getAggregateData(it->second);
-												dbms: fixed exception safety [#METR-15352].

											
										
										
											2015-03-07 01:05:06 +00:00
 											/// exception-safety - если не удалось выделить память или создать состояния, то не будут вызываться деструкторы.
 											aggregate_data = nullptr;
-												dbms: better exception safety [#METR-15530].

											
										
										
											2015-03-23 01:10:06 +00:00
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+											method.onNewKey(*it, params.keys_size, i, keys, *aggregates_pool);
-												dbms: better exception safety [#METR-15530].

											
										
										
											2015-03-23 01:10:06 +00:00
-												dbms: fixed exception safety [#METR-15352].

											
										
										
											2015-03-07 01:05:06 +00:00
+											AggregateDataPtr place = aggregates_pool->alloc(total_size_of_aggregate_states);
 											createAggregateStates(place);
 											aggregate_data = place;
-												dbms: Aggregator: decomposed code to easier trying more aggregation methods; performance is suddenly improved up to 25%; fixed memory leak when exception while aggregating by KEYS_128 method [#METR-2944].

											
										
										
											2014-05-10 00:31:22 +00:00
+										}
-												dbms: added aggregation method 'concat' - performance improvement in generic case [#METR-2944].

											
										
										
											2015-02-22 16:09:16 +00:00
+										else
 											method.onExistingKey(key, keys, *aggregates_pool);
-												dbms: Aggregator: decomposed code to easier trying more aggregation methods; performance is suddenly improved up to 25%; fixed memory leak when exception while aggregating by KEYS_128 method [#METR-2944].

											
										
										
											2014-05-10 00:31:22 +00:00
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2014-12-30 10:16:23 +00:00
+										AggregateDataPtr value = (!no_more_keys || !overflow) ? Method::getAggregateData(it->second) : overflow_row;
-												dbms: Aggregator: decomposed code to easier trying more aggregation methods; performance is suddenly improved up to 25%; fixed memory leak when exception while aggregating by KEYS_128 method [#METR-2944].

											
										
										
											2014-05-10 00:31:22 +00:00
 										/// Добавляем значения в агрегатные функции.
-												dbms: improved performance of Aggregator in non-compiled case [#METR-2944].

											
										
										
											2015-11-21 19:46:27 +00:00
+										for (AggregateFunctionInstruction * inst = aggregate_instructions; inst->that; ++inst)
 											(*inst->func)(inst->that, value + inst->state_offset, inst->arguments, i);
-												dbms: Aggregator: decomposed code to easier trying more aggregation methods; performance is suddenly improved up to 25%; fixed memory leak when exception while aggregating by KEYS_128 method [#METR-2944].

											
										
										
											2014-05-10 00:31:22 +00:00
+									}
 								}
-												Fixed errors in clang (part 4) [#METR-2807].

											
										
										
											2015-01-21 04:23:22 +00:00
+								#ifndef __clang__
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2014-12-30 12:58:02 +00:00
+								#pragma GCC diagnostic pop
-												Fixed errors in clang (part 4) [#METR-2807].

											
										
										
											2015-01-21 04:23:22 +00:00
+								#endif
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2014-12-30 11:27:58 +00:00
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-13 03:03:45 +00:00
+								void NO_INLINE Aggregator::executeWithoutKeyImpl(
 									AggregatedDataWithoutKey & res,
 									size_t rows,
-												dbms: improved performance of Aggregator in non-compiled case [#METR-2944].

											
										
										
											2015-11-21 19:46:27 +00:00
+									AggregateFunctionInstruction * aggregate_instructions) const
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-13 03:03:45 +00:00
+								{
 									/// Оптимизация в случае единственной агрегатной функции count.
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+									AggregateFunctionCount * agg_count = params.aggregates_size == 1
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-13 03:03:45 +00:00
+										? typeid_cast<AggregateFunctionCount *>(aggregate_functions[0])
 										: NULL;
 									if (agg_count)
 										agg_count->addDelta(res, rows);
 									else
 									{
 										for (size_t i = 0; i < rows; ++i)
 										{
 											/// Добавляем значения
-												dbms: improved performance of Aggregator in non-compiled case [#METR-2944].

											
										
										
											2015-11-21 19:46:27 +00:00
+											for (AggregateFunctionInstruction * inst = aggregate_instructions; inst->that; ++inst)
 												(*inst->func)(inst->that, res + inst->state_offset, inst->arguments, i);
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-13 03:03:45 +00:00
+										}
 									}
 								}
-												dbms: preparation [#METR-2944].

											
										
										
											2014-05-10 05:16:23 +00:00
+								bool Aggregator::executeOnBlock(Block & block, AggregatedDataVariants & result,
 									ConstColumnPlainPtrs & key_columns, AggregateColumns & aggregate_columns,
 									Sizes & key_sizes, StringRefs & key,
 									bool & no_more_keys)
 								{
 									initialize(block);
-												Merge

											
										
										
											2015-04-16 14:27:56 +00:00
+									if (isCancelled())
 										return true;
-												dbms: preparation [#METR-2944].

											
										
										
											2014-05-10 05:16:23 +00:00
+									/// result будет уничтожать состояния агрегатных функций в деструкторе
 									result.aggregator = this;
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+									for (size_t i = 0; i < params.aggregates_size; ++i)
 										aggregate_columns[i].resize(params.aggregates[i].arguments.size());
-												dbms: preparation [#METR-2944].

											
										
										
											2014-05-10 05:16:23 +00:00
-												dbms: allowed constant arguments of aggregate functions and keys [#METRIKASUPP-5388].

											
										
										
											2015-06-30 19:05:30 +00:00
+									/** Константные столбцы не поддерживаются напрямую при агрегации.
 									  * Чтобы они всё-равно работали, материализуем их.
 									  */
 									Columns materialized_columns;
-												dbms: preparation [#METR-2944].

											
										
										
											2014-05-10 05:16:23 +00:00
+									/// Запоминаем столбцы, с которыми будем работать
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+									for (size_t i = 0; i < params.keys_size; ++i)
-												dbms: improved performance of aggregation by one numeric key (up to: 2x for UInt8, 5x for UInt16, 1.1x for UInt32, UInt64) [#METR-2944].

											
										
										
											2014-10-29 01:18:50 +00:00
+									{
-												Using std::shared_ptr for columns [#METR-21503].

											
										
										
											2016-05-28 05:31:36 +00:00
+										key_columns[i] = block.getByPosition(params.keys[i]).column.get();
-												dbms: preparation [#METR-2944].

											
										
										
											2014-05-10 05:16:23 +00:00
-												dbms: fixed error with tuples of consts [#METR-18586].

											
										
										
											2015-10-28 21:21:18 +00:00
+										if (auto converted = key_columns[i]->convertToFullColumnIfConst())
-												dbms: allowed constant arguments of aggregate functions and keys [#METRIKASUPP-5388].

											
										
										
											2015-06-30 19:05:30 +00:00
+										{
-												dbms: fixed error with tuples of consts [#METR-18586].

											
										
										
											2015-10-28 21:21:18 +00:00
+											materialized_columns.push_back(converted);
-												dbms: allowed constant arguments of aggregate functions and keys [#METRIKASUPP-5388].

											
										
										
											2015-06-30 19:05:30 +00:00
+											key_columns[i] = materialized_columns.back().get();
 										}
-												dbms: improved performance of aggregation by one numeric key (up to: 2x for UInt8, 5x for UInt16, 1.1x for UInt32, UInt64) [#METR-2944].

											
										
										
											2014-10-29 01:18:50 +00:00
+									}
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+									AggregateFunctionInstructions aggregate_functions_instructions(params.aggregates_size + 1);
 									aggregate_functions_instructions[params.aggregates_size].that = nullptr;
-												dbms: improved performance of Aggregator in non-compiled case [#METR-2944].

											
										
										
											2015-11-21 19:46:27 +00:00
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+									for (size_t i = 0; i < params.aggregates_size; ++i)
-												dbms: preparation [#METR-2944].

											
										
										
											2014-05-10 05:16:23 +00:00
+									{
 										for (size_t j = 0; j < aggregate_columns[i].size(); ++j)
 										{
-												Using std::shared_ptr for columns [#METR-21503].

											
										
										
											2016-05-28 05:31:36 +00:00
+											aggregate_columns[i][j] = block.getByPosition(params.aggregates[i].arguments[j]).column.get();
-												dbms: preparation [#METR-2944].

											
										
										
											2014-05-10 05:16:23 +00:00
-												dbms: fixed error with tuples of consts [#METR-18586].

											
										
										
											2015-10-28 21:21:18 +00:00
+											if (auto converted = aggregate_columns[i][j]->convertToFullColumnIfConst())
-												dbms: allowed constant arguments of aggregate functions and keys [#METRIKASUPP-5388].

											
										
										
											2015-06-30 19:05:30 +00:00
+											{
-												dbms: fixed error with tuples of consts [#METR-18586].

											
										
										
											2015-10-28 21:21:18 +00:00
+												materialized_columns.push_back(converted);
-												dbms: allowed constant arguments of aggregate functions and keys [#METRIKASUPP-5388].

											
										
										
											2015-06-30 19:05:30 +00:00
+												aggregate_columns[i][j] = materialized_columns.back().get();
 											}
-												dbms: preparation [#METR-2944].

											
										
										
											2014-05-10 05:16:23 +00:00
+										}
-												dbms: improved performance of Aggregator in non-compiled case [#METR-2944].

											
										
										
											2015-11-21 19:46:27 +00:00
 										aggregate_functions_instructions[i].that = aggregate_functions[i];
 										aggregate_functions_instructions[i].func = aggregate_functions[i]->getAddressOfAddFunction();
 										aggregate_functions_instructions[i].state_offset = offsets_of_aggregate_states[i];
-												Another improvement for UBSan [#METR-2944].

											
										
										
											2016-07-31 06:36:39 +00:00
+										aggregate_functions_instructions[i].arguments = aggregate_columns[i].data();
-												dbms: preparation [#METR-2944].

											
										
										
											2014-05-10 05:16:23 +00:00
+									}
-												Merge

											
										
										
											2015-04-16 14:27:56 +00:00
+									if (isCancelled())
 										return true;
-												dbms: preparation [#METR-2944].

											
										
										
											2014-05-10 05:16:23 +00:00
+									size_t rows = block.rows();
 									/// Каким способом выполнять агрегацию?
 									if (result.empty())
 									{
 										result.init(chooseAggregationMethod(key_columns, key_sizes));
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+										result.keys_size = params.keys_size;
-												dbms: preparation [#METR-2944].

											
										
										
											2014-05-10 05:16:23 +00:00
+										result.key_sizes = key_sizes;
 										LOG_TRACE(log, "Aggregation method: " << result.getMethodName());
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-10 02:30:03 +00:00
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+										if (params.compiler)
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-10 02:30:03 +00:00
+											compileIfPossible(result.type);
-												dbms: preparation [#METR-2944].

											
										
										
											2014-05-10 05:16:23 +00:00
+									}
-												Merge

											
										
										
											2015-04-16 14:27:56 +00:00
+									if (isCancelled())
 										return true;
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+									if ((params.overflow_row || result.type == AggregatedDataVariants::Type::without_key) && !result.without_key)
-												dbms: preparation [#METR-2944].

											
										
										
											2014-05-10 05:16:23 +00:00
+									{
-												dbms: fixed exception safety [#METR-15352].

											
										
										
											2015-03-07 01:05:06 +00:00
+										AggregateDataPtr place = result.aggregates_pool->alloc(total_size_of_aggregate_states);
 										createAggregateStates(place);
 										result.without_key = place;
-												dbms: preparation [#METR-2944].

											
										
										
											2014-05-10 05:16:23 +00:00
+									}
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-13 03:03:45 +00:00
+									/// Выбираем один из методов агрегации и вызываем его.
 									/// Для случая, когда нет ключей (всё агегировать в одну строку).
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2014-12-30 10:16:23 +00:00
+									if (result.type == AggregatedDataVariants::Type::without_key)
-												dbms: preparation [#METR-2944].

											
										
										
											2014-05-10 05:16:23 +00:00
+									{
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-13 03:03:45 +00:00
+										/// Если есть динамически скомпилированный код.
 										if (compiled_data->compiled_method_ptr)
-												dbms: preparation [#METR-2944].

											
										
										
											2014-05-10 05:16:23 +00:00
+										{
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-13 03:03:45 +00:00
+											reinterpret_cast<
 												void (*)(const Aggregator &, AggregatedDataWithoutKey &, size_t, AggregateColumns &)>
 													(compiled_data->compiled_method_ptr)(*this, result.without_key, rows, aggregate_columns);
-												dbms: preparation [#METR-2944].

											
										
										
											2014-05-10 05:16:23 +00:00
+										}
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-13 03:03:45 +00:00
+										else
-												dbms: improved performance of Aggregator in non-compiled case [#METR-2944].

											
										
										
											2015-11-21 19:46:27 +00:00
+											executeWithoutKeyImpl(result.without_key, rows, &aggregate_functions_instructions[0]);
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-10 02:30:03 +00:00
+									}
 									else
 									{
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-13 03:03:45 +00:00
+										/// Сюда пишутся данные, не поместившиеся в max_rows_to_group_by при group_by_overflow_mode = any.
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+										AggregateDataPtr overflow_row_ptr = params.overflow_row ? result.without_key : nullptr;
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2014-12-30 10:16:23 +00:00
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-13 03:03:45 +00:00
+										bool is_two_level = result.isTwoLevel();
 										/// Скомпилированный код, для обычной структуры.
 										if (!is_two_level && compiled_data->compiled_method_ptr)
 										{
 										#define M(NAME, IS_TWO_LEVEL) \
 											else if (result.type == AggregatedDataVariants::Type::NAME) \
 												reinterpret_cast<void (*)( \
 													const Aggregator &, decltype(result.NAME)::element_type &, \
 													Arena *, size_t, ConstColumnPlainPtrs &, AggregateColumns &, \
 													const Sizes &, StringRefs &, bool, AggregateDataPtr)>(compiled_data->compiled_method_ptr) \
 												(*this, *result.NAME, result.aggregates_pool, rows, key_columns, aggregate_columns, \
 													result.key_sizes, key, no_more_keys, overflow_row_ptr);
 											if (false) {}
 											APPLY_FOR_AGGREGATED_VARIANTS(M)
 										#undef M
 										}
 										/// Скомпилированный код, для two-level структуры.
 										else if (is_two_level && compiled_data->compiled_two_level_method_ptr)
 										{
 										#define M(NAME) \
 											else if (result.type == AggregatedDataVariants::Type::NAME) \
 												reinterpret_cast<void (*)( \
 													const Aggregator &, decltype(result.NAME)::element_type &, \
 													Arena *, size_t, ConstColumnPlainPtrs &, AggregateColumns &, \
 													const Sizes &, StringRefs &, bool, AggregateDataPtr)>(compiled_data->compiled_two_level_method_ptr) \
 												(*this, *result.NAME, result.aggregates_pool, rows, key_columns, aggregate_columns, \
 													result.key_sizes, key, no_more_keys, overflow_row_ptr);
 											if (false) {}
 											APPLY_FOR_VARIANTS_TWO_LEVEL(M)
 										#undef M
 										}
 										/// Когда нет динамически скомпилированного кода.
 										else
 										{
 										#define M(NAME, IS_TWO_LEVEL) \
 											else if (result.type == AggregatedDataVariants::Type::NAME) \
-												dbms: improved performance of Aggregator in non-compiled case [#METR-2944].

											
										
										
											2015-11-21 19:46:27 +00:00
+												executeImpl(*result.NAME, result.aggregates_pool, rows, key_columns, &aggregate_functions_instructions[0], \
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-13 03:03:45 +00:00
+													result.key_sizes, key, no_more_keys, overflow_row_ptr);
 											if (false) {}
 											APPLY_FOR_AGGREGATED_VARIANTS(M)
 										#undef M
 										}
-												dbms: compiled aggregator: development [#METR-2944].

											
										
										
											2015-01-10 02:30:03 +00:00
+									}
-												dbms: preparation [#METR-2944].

											
										
										
											2014-05-10 05:16:23 +00:00
-												dbms: fixed error with WITH TOTALS and group_by_overflow_mode [#METR-14604].

											
										
										
											2015-01-15 19:29:37 +00:00
+									size_t result_size = result.sizeWithoutOverflowRow();
-												dbms: fixed error [#METR-19288].

											
										
										
											2015-12-07 20:08:00 +00:00
+									Int64 current_memory_usage = 0;
 									if (current_memory_tracker)
 										current_memory_usage = current_memory_tracker->get();
-												dbms: external aggregation: initial implementation [#METR-17000].

											
										
										
											2015-12-01 14:09:05 +00:00
+									auto result_size_bytes = current_memory_usage - memory_usage_before_aggregation;	/// Здесь учитываются все результаты в сумме, из разных потоков.
 									bool worth_convert_to_two_level
 										= (params.group_by_two_level_threshold && result_size >= params.group_by_two_level_threshold)
 										|| (params.group_by_two_level_threshold_bytes && result_size_bytes >= static_cast<Int64>(params.group_by_two_level_threshold_bytes));
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2014-12-30 12:58:02 +00:00
-												dbms: external aggregation: development [#METR-17000].

											
										
										
											2015-11-30 19:57:46 +00:00
+									/** Преобразование в двухуровневую структуру данных.
 									  * Она позволяет делать, в последующем, эффективный мердж - либо экономный по памяти, либо распараллеленный.
 									  */
-												dbms: external aggregation: initial implementation [#METR-17000].

											
										
										
											2015-12-01 14:09:05 +00:00
+									if (result.isConvertibleToTwoLevel() && worth_convert_to_two_level)
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2014-12-30 12:58:02 +00:00
+										result.convertToTwoLevel();
-												dbms: preparation [#METR-2944].

											
										
										
											2014-05-10 05:16:23 +00:00
+									/// Проверка ограничений.
-												dbms: using max_rows_to_group_by limit while merging aggregate states (incomplete) [#METR-18507].

											
										
										
											2015-10-22 01:44:33 +00:00
+									if (!checkLimits(result_size, no_more_keys))
 										return false;
-												dbms: external aggregation: development [#METR-17000].

											
										
										
											2015-11-30 19:57:46 +00:00
+									/** Сброс данных на диск, если потребляется слишком много оперативки.
 									  * Данные можно сбросить на диск только если используется двухуровневая структура агрегации.
 									  */
 									if (params.max_bytes_before_external_group_by
 										&& result.isTwoLevel()
-												dbms: external aggregation: initial implementation [#METR-17000].

											
										
										
											2015-12-01 14:09:05 +00:00
+										&& current_memory_usage > static_cast<Int64>(params.max_bytes_before_external_group_by)
 										&& worth_convert_to_two_level)
 									{
 										writeToTemporaryFile(result, result_size);
 									}
-												dbms: external aggregation: development [#METR-17000].

											
										
										
											2015-11-30 19:57:46 +00:00
-												dbms: using max_rows_to_group_by limit while merging aggregate states (incomplete) [#METR-18507].

											
										
										
											2015-10-22 01:44:33 +00:00
+									return true;
 								}
-												dbms: external aggregation: initial implementation [#METR-17000].

											
										
										
											2015-12-01 14:09:05 +00:00
+								void Aggregator::writeToTemporaryFile(AggregatedDataVariants & data_variants, size_t rows)
-												dbms: external aggregation: development [#METR-17000].

											
										
										
											2015-11-30 19:57:46 +00:00
+								{
-												dbms: external aggregation: initial implementation [#METR-17000].

											
										
										
											2015-12-01 14:09:05 +00:00
+									Stopwatch watch;
-												dbms: external aggregation: development [#METR-17000].

											
										
										
											2015-11-30 19:57:46 +00:00
+									auto file = std::make_unique<Poco::TemporaryFile>(params.tmp_path);
 									const std::string & path = file->path();
 									WriteBufferFromFile file_buf(path);
 									CompressedWriteBuffer compressed_buf(file_buf);
-												dbms: renamed Revision to ClickHouseRevision. Daemon to BaseDaemon

											
										
										
											2016-02-09 17:06:50 +00:00
+									NativeBlockOutputStream block_out(compressed_buf, ClickHouseRevision::get());
-												dbms: external aggregation: development [#METR-17000].

											
										
										
											2015-11-30 19:57:46 +00:00
-												dbms: external aggregation: initial implementation [#METR-17000].

											
										
										
											2015-12-01 14:09:05 +00:00
+									LOG_DEBUG(log, "Writing part of aggregation data into temporary file " << path << ".");
-												dbms: instrumenting external sort/aggregation [#METR-17000].

											
										
										
											2015-12-03 21:23:21 +00:00
+									ProfileEvents::increment(ProfileEvents::ExternalAggregationWritePart);
-												dbms: external aggregation: initial implementation [#METR-17000].

											
										
										
											2015-12-01 14:09:05 +00:00
-												dbms: external aggregation: development [#METR-17000].

											
										
										
											2015-11-30 19:57:46 +00:00
+									/// Сбрасываем только двухуровневые данные.
-												dbms: external aggregation: initial implementation [#METR-17000].

											
										
										
											2015-12-01 14:09:05 +00:00
+								#define M(NAME) \
-												dbms: external aggregation: development [#METR-17000].

											
										
										
											2015-11-30 19:57:46 +00:00
+									else if (data_variants.type == AggregatedDataVariants::Type::NAME) \
-												dbms: external aggregation: initial implementation [#METR-17000].

											
										
										
											2015-12-01 14:09:05 +00:00
+										writeToTemporaryFileImpl(data_variants, *data_variants.NAME, block_out, path);
-												dbms: external aggregation: development [#METR-17000].

											
										
										
											2015-11-30 19:57:46 +00:00
 									if (false) {}
 									APPLY_FOR_VARIANTS_TWO_LEVEL(M)
 								#undef M
 									else
 										throw Exception("Unknown aggregated data variant.", ErrorCodes::UNKNOWN_AGGREGATED_DATA_VARIANT);
-												dbms: external aggregation: initial implementation [#METR-17000].

											
										
										
											2015-12-01 14:09:05 +00:00
+									/// NOTE Вместо освобождения памяти и создания новых хэш-таблиц и арены, можно переиспользовать старые.
 									data_variants.init(data_variants.type);
-												Using std::shared_ptr for data types [#METR-21503].

											
										
										
											2016-05-28 10:15:36 +00:00
+									data_variants.aggregates_pools = Arenas(1, std::make_shared<Arena>());
-												dbms: external aggregation: initial implementation [#METR-17000].

											
										
										
											2015-12-01 14:09:05 +00:00
+									data_variants.aggregates_pool = data_variants.aggregates_pools.back().get();
 									block_out.flush();
 									compressed_buf.next();
 									file_buf.next();
 									double elapsed_seconds = watch.elapsedSeconds();
 									double compressed_bytes = file_buf.count();
 									double uncompressed_bytes = compressed_buf.count();
-												dbms: external aggregation: development [#METR-17000].

											
										
										
											2015-12-01 16:58:15 +00:00
+									{
 										std::lock_guard<std::mutex> lock(temporary_files.mutex);
 										temporary_files.files.emplace_back(std::move(file));
 										temporary_files.sum_size_uncompressed += uncompressed_bytes;
 										temporary_files.sum_size_compressed += compressed_bytes;
 									}
-												dbms: instrumenting external sort/aggregation [#METR-17000].

											
										
										
											2015-12-03 21:23:21 +00:00
+									ProfileEvents::increment(ProfileEvents::ExternalAggregationCompressedBytes, compressed_bytes);
 									ProfileEvents::increment(ProfileEvents::ExternalAggregationUncompressedBytes, uncompressed_bytes);
-												dbms: external aggregation: initial implementation [#METR-17000].

											
										
										
											2015-12-01 14:09:05 +00:00
+									LOG_TRACE(log, std::fixed << std::setprecision(3)
 										<< "Written part in " << elapsed_seconds << " sec., "
 										<< rows << " rows, "
 										<< (uncompressed_bytes / 1048576.0) << " MiB uncompressed, "
 										<< (compressed_bytes / 1048576.0) << " MiB compressed, "
 										<< (uncompressed_bytes / rows) << " uncompressed bytes per row, "
 										<< (compressed_bytes / rows) << " compressed bytes per row, "
 										<< "compression rate: " << (uncompressed_bytes / compressed_bytes)
 										<< " (" << (rows / elapsed_seconds) << " rows/sec., "
 										<< (uncompressed_bytes / elapsed_seconds / 1048576.0) << " MiB/sec. uncompressed, "
 										<< (compressed_bytes / elapsed_seconds / 1048576.0) << " MiB/sec. compressed)");
-												dbms: external aggregation: development [#METR-17000].

											
										
										
											2015-11-30 19:57:46 +00:00
+								}
-												dbms: fixed error [#METR-17000].

											
										
										
											2015-12-06 14:27:09 +00:00
+								template <typename Method>
 								Block Aggregator::convertOneBucketToBlock(
 									AggregatedDataVariants & data_variants,
 									Method & method,
 									bool final,
 									size_t bucket) const
 								{
 									Block block = prepareBlockAndFill(data_variants, final, method.data.impls[bucket].size(),
 										[bucket, &method, this] (
 											ColumnPlainPtrs & key_columns,
 											AggregateColumnsData & aggregate_columns,
 											ColumnPlainPtrs & final_aggregate_columns,
 											const Sizes & key_sizes,
 											bool final)
 										{
 											convertToBlockImpl(method, method.data.impls[bucket],
 												key_columns, aggregate_columns, final_aggregate_columns, key_sizes, final);
 										});
 									block.info.bucket_num = bucket;
 									return block;
 								}
-												dbms: external aggregation: development [#METR-17000].

											
										
										
											2015-11-30 19:57:46 +00:00
+								template <typename Method>
 								void Aggregator::writeToTemporaryFileImpl(
 									AggregatedDataVariants & data_variants,
 									Method & method,
 									IBlockOutputStream & out,
 									const String & path)
 								{
-												dbms: external aggregation: initial implementation [#METR-17000].

											
										
										
											2015-12-01 14:09:05 +00:00
+									size_t max_temporary_block_size_rows = 0;
 									size_t max_temporary_block_size_bytes = 0;
-												dbms: external aggregation: development [#METR-17000].

											
										
										
											2015-11-30 19:57:46 +00:00
 									for (size_t bucket = 0; bucket < Method::Data::NUM_BUCKETS; ++bucket)
 									{
-												dbms: fixed error [#METR-17000].

											
										
										
											2015-12-06 14:27:09 +00:00
+										Block block = convertOneBucketToBlock(data_variants, method, false, bucket);
-												dbms: external aggregation: development [#METR-17000].

											
										
										
											2015-11-30 19:57:46 +00:00
+										out.write(block);
-												dbms: external aggregation: initial implementation [#METR-17000].

											
										
										
											2015-12-01 14:09:05 +00:00
 										size_t block_size_rows = block.rowsInFirstColumn();
 										size_t block_size_bytes = block.bytes();
 										if (block_size_rows > max_temporary_block_size_rows)
 											max_temporary_block_size_rows = block.rowsInFirstColumn();
 										if (block_size_bytes > max_temporary_block_size_bytes)
 											max_temporary_block_size_bytes = block_size_bytes;
-												dbms: external aggregation: development [#METR-17000].

											
										
										
											2015-11-30 19:57:46 +00:00
+									}
-												dbms: external aggregation: development [#METR-17000].

											
										
										
											2015-12-01 16:58:15 +00:00
+									/// data_variants не будет уничтожать состояния агрегатных функций в деструкторе. Теперь состояниями владеют ColumnAggregateFunction.
 									data_variants.aggregator = nullptr;
-												dbms: external aggregation: initial implementation [#METR-17000].

											
										
										
											2015-12-01 14:09:05 +00:00
+									LOG_TRACE(log, std::fixed << std::setprecision(3)
 										<< "Max size of temporary block: " << max_temporary_block_size_rows << " rows, "
 										<< (max_temporary_block_size_bytes / 1048576.0) << " MiB.");
-												dbms: external aggregation: development [#METR-17000].

											
										
										
											2015-11-30 19:57:46 +00:00
+								}
-												dbms: using max_rows_to_group_by limit while merging aggregate states (incomplete) [#METR-18507].

											
										
										
											2015-10-22 01:44:33 +00:00
+								bool Aggregator::checkLimits(size_t result_size, bool & no_more_keys) const
 								{
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+									if (!no_more_keys && params.max_rows_to_group_by && result_size > params.max_rows_to_group_by)
-												dbms: preparation [#METR-2944].

											
										
										
											2014-05-10 05:16:23 +00:00
+									{
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+										if (params.group_by_overflow_mode == OverflowMode::THROW)
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2014-12-30 18:04:53 +00:00
+											throw Exception("Limit for rows to GROUP BY exceeded: has " + toString(result_size)
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+												+ " rows, maximum: " + toString(params.max_rows_to_group_by),
-												dbms: preparation [#METR-2944].

											
										
										
											2014-05-10 05:16:23 +00:00
+												ErrorCodes::TOO_MUCH_ROWS);
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+										else if (params.group_by_overflow_mode == OverflowMode::BREAK)
-												dbms: preparation [#METR-2944].

											
										
										
											2014-05-10 05:16:23 +00:00
+											return false;
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+										else if (params.group_by_overflow_mode == OverflowMode::ANY)
-												dbms: preparation [#METR-2944].

											
										
										
											2014-05-10 05:16:23 +00:00
+											no_more_keys = true;
 										else
 											throw Exception("Logical error: unknown overflow mode", ErrorCodes::LOGICAL_ERROR);
 									}
 									return true;
 								}
-												dbms: development [#CONV-2944].



											
										
										
											2011-09-26 07:25:22 +00:00
+								void Aggregator::execute(BlockInputStreamPtr stream, AggregatedDataVariants & result)
-												dbms: development.



											
										
										
											2011-09-19 01:42:16 +00:00
+								{
-												Merge

											
										
										
											2015-04-16 14:27:56 +00:00
+									if (isCancelled())
 										return;
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+									StringRefs key(params.keys_size);
 									ConstColumnPlainPtrs key_columns(params.keys_size);
 									AggregateColumns aggregate_columns(params.aggregates_size);
-												dbms: preparation [#METR-2944].

											
										
										
											2014-05-10 05:16:23 +00:00
+									Sizes key_sizes;
-												dbms: development.



											
										
										
											2011-09-19 01:42:16 +00:00
-												dbms: development of limits [#CONV-2944].



											
										
										
											2012-12-25 19:28:59 +00:00
+									/** Используется, если есть ограничение на максимальное количество строк при агрегации,
 									  *  и если group_by_overflow_mode == ANY.
 									  * В этом случае, новые ключи не добавляются в набор, а производится агрегация только по
 									  *  ключам, которые уже успели попасть в набор.
 									  */
 									bool no_more_keys = false;
-												dbms: Aggregator: more logging [#CONV-2944].



											
										
										
											2013-02-04 03:31:53 +00:00
+									LOG_TRACE(log, "Aggregating");
-												dbms: continuing improvement (incomplete) [#CONV-2944].



											
										
										
											2013-02-08 20:34:30 +00:00
-												dbms: Aggregator: more logging [#CONV-2944].



											
										
										
											2013-02-04 03:31:53 +00:00
+									Stopwatch watch;
 									size_t src_rows = 0;
 									size_t src_bytes = 0;
-												dbms: improvement [#CONV-2944].



											
										
										
											2013-02-09 01:02:52 +00:00
 									/// Читаем все данные
-												dbms: development.



											
										
										
											2011-09-19 01:42:16 +00:00
+									while (Block block = stream->read())
 									{
-												Merge

											
										
										
											2015-04-16 14:27:56 +00:00
+										if (isCancelled())
 											return;
-												dbms: Aggregator: more logging [#CONV-2944].



											
										
										
											2013-02-04 03:31:53 +00:00
+										src_rows += block.rows();
 										src_bytes += block.bytes();
-												dbms: development [#CONV-2944].



											
										
										
											2011-09-25 05:07:47 +00:00
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
+										if (!executeOnBlock(block, result,
 											key_columns, aggregate_columns, key_sizes, key,
 											no_more_keys))
 											break;
 									}
 									double elapsed_seconds = watch.elapsedSeconds();
 									size_t rows = result.size();
 									LOG_TRACE(log, std::fixed << std::setprecision(3)
 										<< "Aggregated. " << src_rows << " to " << rows << " rows (from " << src_bytes / 1048576.0 << " MiB)"
 										<< " in " << elapsed_seconds << " sec."
 										<< " (" << src_rows / elapsed_seconds << " rows/sec., " << src_bytes / elapsed_seconds / 1048576.0 << " MiB/sec.)");
 								}
 								/** Moves the contents of one hash table into the output columns and then releases the table's memory.
 								  *
 								  * With final == true the work is done by convertToBlockImplFinal (filling final_aggregate_columns),
 								  *  otherwise by convertToBlockImplNotFinal (filling aggregate_columns).
 								  * An empty table is left untouched.
 								  */
 								template <typename Method, typename Table>
 								void Aggregator::convertToBlockImpl(
 									Method & method,
 									Table & data,
 									ColumnPlainPtrs & key_columns,
 									AggregateColumnsData & aggregate_columns,
 									ColumnPlainPtrs & final_aggregate_columns,
 									const Sizes & key_sizes,
 									bool final) const
 								{
 									if (!data.empty())
 									{
 										if (!final)
 											convertToBlockImplNotFinal(method, data, key_columns, aggregate_columns, key_sizes);
 										else
 											convertToBlockImplFinal(method, data, key_columns, final_aggregate_columns, key_sizes);

 										/// In order to free the memory earlier.
 										data.clearAndShrink();
 									}
 								}
 								/** Writes finalized aggregation results from a hash table into the output columns.
 								  *
 								  * For every entry of `data` the key is inserted into key_columns, and the result of each aggregate
 								  *  function (via insertResultInto) is inserted into the corresponding final_aggregate_columns element.
 								  * After all entries have been processed, destroyImpl is called for the table.
 								  */
 								template <typename Method, typename Table>
 								void NO_INLINE Aggregator::convertToBlockImplFinal(
 									Method & method,
 									Table & data,
 									ColumnPlainPtrs & key_columns,
 									ColumnPlainPtrs & final_aggregate_columns,
 									const Sizes & key_sizes) const
 								{
 									for (const auto & entry : data)
 									{
 										method.insertKeyIntoColumns(entry, key_columns, params.keys_size, key_sizes);

 										/// Start of the memory holding the states of all aggregate functions for this key.
 										const auto & states = Method::getAggregateData(entry.second);

 										for (size_t func_idx = 0; func_idx < params.aggregates_size; ++func_idx)
 										{
 											aggregate_functions[func_idx]->insertResultInto(
 												states + offsets_of_aggregate_states[func_idx],
 												*final_aggregate_columns[func_idx]);
 										}
 									}

 									destroyImpl(method, data);		/// NOTE Could be done better.
 								}
 								/** Writes non-finalized aggregation states from a hash table into the output columns.
 								  *
 								  * For every entry of `data` the key is inserted into key_columns, and a pointer to the state of each
 								  *  aggregate function is appended to the corresponding aggregate_columns element.
 								  * The state pointer stored in the table entry is then reset to nullptr.
 								  */
 								template <typename Method, typename Table>
 								void NO_INLINE Aggregator::convertToBlockImplNotFinal(
 									Method & method,
 									Table & data,
 									ColumnPlainPtrs & key_columns,
 									AggregateColumnsData & aggregate_columns,
 									const Sizes & key_sizes) const
 								{
 									for (auto & entry : data)
 									{
 										method.insertKeyIntoColumns(entry, key_columns, params.keys_size, key_sizes);

 										auto & states = Method::getAggregateData(entry.second);

 										/// The destination vectors are reserved in advance, so push_back does not throw.
 										for (size_t func_idx = 0; func_idx < params.aggregates_size; ++func_idx)
 											aggregate_columns[func_idx]->push_back(states + offsets_of_aggregate_states[func_idx]);

 										/// The pointers were handed over to the columns; clear the one kept in the table entry.
 										states = nullptr;
 									}
 								}
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-02 03:16:28 +00:00
+								template <typename Filler>
 								Block Aggregator::prepareBlockAndFill(
 									AggregatedDataVariants & data_variants,
 									bool final,
 									size_t rows,
 								 	Filler && filler) const
-												dbms: development [#CONV-2944].



											
										
										
											2012-02-27 06:28:20 +00:00
+								{
-												dbms: Aggregator: fixed error [#CONV-2944].



											
										
										
											2013-09-16 05:33:49 +00:00
+									Block res = sample.cloneEmpty();
-												dbms: development [#CONV-2944].



											
										
										
											2012-05-10 07:47:13 +00:00
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+									ColumnPlainPtrs key_columns(params.keys_size);
 									AggregateColumnsData aggregate_columns(params.aggregates_size);
 									ColumnPlainPtrs final_aggregate_columns(params.aggregates_size);
-												dbms: improved performance for queries with large aggregation result [#CONV-2944].



											
										
										
											2013-02-03 18:08:52 +00:00
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+									for (size_t i = 0; i < params.keys_size; ++i)
-												dbms: improved performance of queries with large aggregation result [#CONV-2944].



											
										
										
											2013-02-03 18:39:09 +00:00
+									{
-												Using std::shared_ptr for columns [#METR-21503].

											
										
										
											2016-05-28 05:31:36 +00:00
+										key_columns[i] = res.getByPosition(i).column.get();
-												dbms: improved performance of queries with large aggregation result [#CONV-2944].



											
										
										
											2013-02-03 18:39:09 +00:00
+										key_columns[i]->reserve(rows);
 									}
-												dbms: improved performance for queries with large aggregation result [#CONV-2944].



											
										
										
											2013-02-03 18:08:52 +00:00
-												dbms: more safe [#METR-19278].

											
										
										
											2015-12-23 07:29:20 +00:00
+									for (size_t i = 0; i < params.aggregates_size; ++i)
-												dbms: improved performance of queries with large aggregation result [#CONV-2944].



											
										
										
											2013-02-03 18:39:09 +00:00
+									{
-												dbms: more safe [#METR-19278].

											
										
										
											2015-12-23 07:29:20 +00:00
+										if (!final)
-												Merge

											
										
										
											2014-05-26 16:11:20 +00:00
+										{
-												dbms: more safe [#METR-19278].

											
										
										
											2015-12-23 07:29:20 +00:00
+											/// Столбец ColumnAggregateFunction захватывает разделяемое владение ареной с состояниями агрегатных функций.
 											ColumnAggregateFunction & column_aggregate_func = static_cast<ColumnAggregateFunction &>(
 												*res.getByPosition(i + params.keys_size).column);
 											for (size_t j = 0; j < data_variants.aggregates_pools.size(); ++j)
 												column_aggregate_func.addArena(data_variants.aggregates_pools[j]);
 											aggregate_columns[i] = &column_aggregate_func.getData();
 											aggregate_columns[i]->reserve(rows);
 										}
 										else
 										{
 											ColumnWithTypeAndName & column = res.getByPosition(i + params.keys_size);
 											column.type = aggregate_functions[i]->getReturnType();
 											column.column = column.type->createColumn();
 											column.column->reserve(rows);
 											if (aggregate_functions[i]->isState())
-												dbms: fixed segfault in case of memory limit exceeded [#METR-11220].

											
										
										
											2014-05-22 18:58:41 +00:00
+											{
 												/// Столбец ColumnAggregateFunction захватывает разделяемое владение ареной с состояниями агрегатных функций.
-												dbms: more safe [#METR-19278].

											
										
										
											2015-12-23 07:29:20 +00:00
+												ColumnAggregateFunction & column_aggregate_func = static_cast<ColumnAggregateFunction &>(*column.column);
-												dbms: fixed segfault in case of memory limit exceeded [#METR-11220].

											
										
										
											2014-05-22 18:58:41 +00:00
 												for (size_t j = 0; j < data_variants.aggregates_pools.size(); ++j)
 													column_aggregate_func.addArena(data_variants.aggregates_pools[j]);
 											}
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-02 03:50:14 +00:00
-												Using std::shared_ptr for columns [#METR-21503].

											
										
										
											2016-05-28 05:31:36 +00:00
+											final_aggregate_columns[i] = column.column.get();
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-02 03:16:28 +00:00
+										}
 									}
-												dbms: development [#METR-10894].

											
										
										
											2014-06-05 19:52:13 +00:00
-												dbms: more safe [#METR-19278].

											
										
										
											2015-12-23 07:29:20 +00:00
+									filler(key_columns, aggregate_columns, final_aggregate_columns, data_variants.key_sizes, final);
 									/// Изменяем размер столбцов-констант в блоке.
 									size_t columns = res.columns();
 									for (size_t i = 0; i < columns; ++i)
 										if (res.getByPosition(i).column->isConst())
 											res.getByPosition(i).column = res.getByPosition(i).column->cut(0, rows);
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-02 03:16:28 +00:00
 									return res;
 								}
-												Merge

											
										
										
											2014-05-28 14:54:42 +00:00
-												dbms: fixed segfault in case of memory limit exceeded [#METR-11220].

											
										
										
											2014-05-22 18:58:41 +00:00
-												dbms: fixed error [#METR-17109].

											
										
										
											2015-11-09 18:45:55 +00:00
+								BlocksList Aggregator::prepareBlocksAndFillWithoutKey(AggregatedDataVariants & data_variants, bool final, bool is_overflows) const
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-02 03:16:28 +00:00
+								{
 									size_t rows = 1;
 									auto filler = [&data_variants, this](
 										ColumnPlainPtrs & key_columns,
 										AggregateColumnsData & aggregate_columns,
 										ColumnPlainPtrs & final_aggregate_columns,
 										const Sizes & key_sizes,
 										bool final)
 									{
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+										if (data_variants.type == AggregatedDataVariants::Type::without_key || params.overflow_row)
-												dbms: merged convertToBlock and finalize aggregation steps whenever possible [#METR-2944].



											
										
										
											2013-11-03 23:35:18 +00:00
+										{
-												dbms: fixed segfault in case of memory limit exceeded [#METR-11220].

											
										
										
											2014-05-22 18:58:41 +00:00
+											AggregatedDataWithoutKey & data = data_variants.without_key;
-												dbms: continuing improvement (incomplete) [#CONV-2944].



											
										
										
											2013-02-08 20:34:30 +00:00
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+											for (size_t i = 0; i < params.aggregates_size; ++i)
-												dbms: more safe [#METR-19278].

											
										
										
											2015-12-23 07:29:20 +00:00
+											{
-												Merge

											
										
										
											2014-05-28 14:54:42 +00:00
+												if (!final)
-												dbms: more safe [#METR-19278].

											
										
										
											2015-12-23 07:29:20 +00:00
+													aggregate_columns[i]->push_back(data + offsets_of_aggregate_states[i]);
-												dbms: fixed segfault in case of memory limit exceeded [#METR-11220].

											
										
										
											2014-05-22 18:58:41 +00:00
+												else
 													aggregate_functions[i]->insertResultInto(data + offsets_of_aggregate_states[i], *final_aggregate_columns[i]);
-												dbms: more safe [#METR-19278].

											
										
										
											2015-12-23 07:29:20 +00:00
+											}
 											if (!final)
 												data = nullptr;
-												dbms: fixed segfault in case of memory limit exceeded [#METR-11220].

											
										
										
											2014-05-22 18:58:41 +00:00
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+											if (params.overflow_row)
 												for (size_t i = 0; i < params.keys_size; ++i)
-												dbms: fixed segfault in case of memory limit exceeded [#METR-11220].

											
										
										
											2014-05-22 18:58:41 +00:00
+													key_columns[i]->insertDefault();
-												dbms: merged convertToBlock and finalize aggregation steps whenever possible [#METR-2944].



											
										
										
											2013-11-03 23:35:18 +00:00
+										}
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-02 03:16:28 +00:00
+									};
-												dbms: improved performance for queries with large aggregation result [#CONV-2944].



											
										
										
											2013-02-03 18:08:52 +00:00
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 03:18:49 +00:00
+									Block block = prepareBlockAndFill(data_variants, final, rows, filler);
-												dbms: fixed error [#METR-17109].

											
										
										
											2015-11-09 18:45:55 +00:00
 									if (is_overflows)
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 03:18:49 +00:00
+										block.info.is_overflows = true;
-												dbms: fixed errors [#METR-17000].

											
										
										
											2015-12-06 19:42:28 +00:00
+									if (final)
 										destroyWithoutKey(data_variants);
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-02 03:16:28 +00:00
+									BlocksList blocks;
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 03:18:49 +00:00
+									blocks.emplace_back(std::move(block));
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-02 03:16:28 +00:00
+									return blocks;
 								}
-												dbms: fixed segfault in case of memory limit exceeded [#METR-11220].

											
										
										
											2014-05-22 18:58:41 +00:00
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-02 03:16:28 +00:00
+								BlocksList Aggregator::prepareBlocksAndFillSingleLevel(AggregatedDataVariants & data_variants, bool final) const
 								{
-												dbms: fixed error with WITH TOTALS and group_by_overflow_mode [#METR-14604].

											
										
										
											2015-01-15 19:29:37 +00:00
+									size_t rows = data_variants.sizeWithoutOverflowRow();
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-02 03:16:28 +00:00
 									auto filler = [&data_variants, this](
 										ColumnPlainPtrs & key_columns,
 										AggregateColumnsData & aggregate_columns,
 										ColumnPlainPtrs & final_aggregate_columns,
 										const Sizes & key_sizes,
 										bool final)
 									{
-												dbms: fixed errors [#METR-17000].

											
										
										
											2015-12-06 19:42:28 +00:00
+									#define M(NAME) \
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2014-12-30 10:16:23 +00:00
+										else if (data_variants.type == AggregatedDataVariants::Type::NAME) \
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-02 03:16:28 +00:00
+											convertToBlockImpl(*data_variants.NAME, data_variants.NAME->data, \
 												key_columns, aggregate_columns, final_aggregate_columns, data_variants.key_sizes, final);
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2014-12-30 10:16:23 +00:00
 										if (false) {}
-												dbms: fixed errors [#METR-17000].

											
										
										
											2015-12-06 19:42:28 +00:00
+										APPLY_FOR_VARIANTS_SINGLE_LEVEL(M)
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2014-12-30 10:16:23 +00:00
+									#undef M
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-02 03:16:28 +00:00
+										else
-												dbms: fixed segfault in case of memory limit exceeded [#METR-11220].

											
										
										
											2014-05-22 18:58:41 +00:00
+											throw Exception("Unknown aggregated data variant.", ErrorCodes::UNKNOWN_AGGREGATED_DATA_VARIANT);
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-02 03:16:28 +00:00
+									};
 									BlocksList blocks;
 									blocks.emplace_back(prepareBlockAndFill(data_variants, final, rows, filler));
 									return blocks;
 								}
-												Removed useless code (experimental) [#METR-2944].

											
										
										
											2016-08-02 01:46:05 +00:00
+								BlocksList Aggregator::prepareBlocksAndFillTwoLevel(AggregatedDataVariants & data_variants, bool final, ThreadPool * thread_pool) const
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-02 03:16:28 +00:00
+								{
 								#define M(NAME) \
 									else if (data_variants.type == AggregatedDataVariants::Type::NAME) \
 										return prepareBlocksAndFillTwoLevelImpl(data_variants, *data_variants.NAME, final, thread_pool);
 									if (false) {}
 									APPLY_FOR_VARIANTS_TWO_LEVEL(M)
 								#undef M
 									else
 										throw Exception("Unknown aggregated data variant.", ErrorCodes::UNKNOWN_AGGREGATED_DATA_VARIANT);
 								}
 								template <typename Method>
 								BlocksList Aggregator::prepareBlocksAndFillTwoLevelImpl(
 									AggregatedDataVariants & data_variants,
 									Method & method,
 									bool final,
-												Removed useless code (experimental) [#METR-2944].

											
										
										
											2016-08-02 01:46:05 +00:00
+									ThreadPool * thread_pool) const
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-02 03:16:28 +00:00
+								{
 									auto converter = [&](size_t bucket, MemoryTracker * memory_tracker)
 									{
 										current_memory_tracker = memory_tracker;
-												dbms: fixed error [#METR-17000].

											
										
										
											2015-12-06 14:27:09 +00:00
+										return convertOneBucketToBlock(data_variants, method, final, bucket);
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-02 03:16:28 +00:00
+									};
 									/// packaged_task используются, чтобы исключения автоматически прокидывались в основной поток.
-												dbms: fixed error [#METR-15530].

											
										
										
											2015-03-19 05:15:38 +00:00
+									std::vector<std::packaged_task<Block()>> tasks(Method::Data::NUM_BUCKETS);
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-02 03:16:28 +00:00
-												dbms: fixed error with exception safety [#METR-15357].

											
										
										
											2015-03-16 19:24:57 +00:00
+									try
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-02 03:16:28 +00:00
+									{
-												dbms: fixed error with exception safety [#METR-15357].

											
										
										
											2015-03-16 19:24:57 +00:00
+										for (size_t bucket = 0; bucket < Method::Data::NUM_BUCKETS; ++bucket)
 										{
 											if (method.data.impls[bucket].empty())
 												continue;
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-02 03:16:28 +00:00
-												dbms: fixed error [#METR-15530].

											
										
										
											2015-03-19 05:15:38 +00:00
+											tasks[bucket] = std::packaged_task<Block()>(std::bind(converter, bucket, current_memory_tracker));
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-02 03:16:28 +00:00
-												dbms: fixed error with exception safety [#METR-15357].

											
										
										
											2015-03-16 19:24:57 +00:00
+											if (thread_pool)
 												thread_pool->schedule([bucket, &tasks] { tasks[bucket](); });
 											else
 												tasks[bucket]();
 										}
 									}
 									catch (...)
 									{
 										/// Если этого не делать, то в случае исключения, tasks уничтожится раньше завершения потоков, и будет плохо.
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-02 03:16:28 +00:00
+										if (thread_pool)
-												dbms: fixed error with exception safety [#METR-15357].

											
										
										
											2015-03-16 19:24:57 +00:00
+											thread_pool->wait();
 										throw;
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-02 03:16:28 +00:00
+									}
 									if (thread_pool)
 										thread_pool->wait();
 									BlocksList blocks;
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-02 03:50:14 +00:00
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-02 03:16:28 +00:00
+									for (auto & task : tasks)
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-02 03:50:14 +00:00
+									{
-												dbms: fixed error [#METR-15530].

											
										
										
											2015-03-19 05:15:38 +00:00
+										if (!task.valid())
 											continue;
-												dbms: more safe [#METR-19278].

											
										
										
											2015-12-23 07:29:20 +00:00
+										blocks.emplace_back(task.get_future().get());
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-02 03:50:14 +00:00
+									}
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-02 03:16:28 +00:00
 									return blocks;
 								}
-												dbms: fixed error [#METR-17000].

											
										
										
											2015-12-08 02:01:46 +00:00
+								BlocksList Aggregator::convertToBlocks(AggregatedDataVariants & data_variants, bool final, size_t max_threads) const
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-02 03:16:28 +00:00
+								{
-												Merge

											
										
										
											2015-04-16 14:27:56 +00:00
+									if (isCancelled())
 										return BlocksList();
-												dbms: fixed exception safety [#METR-15352].

											
										
										
											2015-03-07 01:05:06 +00:00
+									LOG_TRACE(log, "Converting aggregated data to blocks");
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-02 03:16:28 +00:00
 									Stopwatch watch;
 									BlocksList blocks;
 									/// В какой структуре данных агрегированы данные?
 									if (data_variants.empty())
 										return blocks;
-												Removed useless code (experimental) [#METR-2944].

											
										
										
											2016-08-02 01:46:05 +00:00
+									std::unique_ptr<ThreadPool> thread_pool;
-												dbms: fixed error with WITH TOTALS and group_by_overflow_mode [#METR-14604].

											
										
										
											2015-01-15 19:29:37 +00:00
+									if (max_threads > 1 && data_variants.sizeWithoutOverflowRow() > 100000	/// TODO Сделать настраиваемый порог.
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-02 03:50:14 +00:00
+										&& data_variants.isTwoLevel())						/// TODO Использовать общий тред-пул с функцией merge.
-												Removed useless code (experimental) [#METR-2944].

											
										
										
											2016-08-02 01:46:05 +00:00
+										thread_pool.reset(new ThreadPool(max_threads));
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-02 03:16:28 +00:00
-												dbms: more safe [#METR-19278].

											
										
										
											2015-12-23 07:29:20 +00:00
+									if (isCancelled())
 										return BlocksList();
-												Merge

											
										
										
											2015-04-16 14:27:56 +00:00
-												dbms: more safe [#METR-19278].

											
										
										
											2015-12-23 07:29:20 +00:00
+									if (data_variants.type == AggregatedDataVariants::Type::without_key || params.overflow_row)
 										blocks.splice(blocks.end(), prepareBlocksAndFillWithoutKey(
 											data_variants, final, data_variants.type != AggregatedDataVariants::Type::without_key));
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-02 03:16:28 +00:00
-												dbms: more safe [#METR-19278].

											
										
										
											2015-12-23 07:29:20 +00:00
+									if (isCancelled())
 										return BlocksList();
-												Merge

											
										
										
											2015-04-16 14:27:56 +00:00
-												dbms: more safe [#METR-19278].

											
										
										
											2015-12-23 07:29:20 +00:00
+									if (data_variants.type != AggregatedDataVariants::Type::without_key)
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-02 03:50:14 +00:00
+									{
-												dbms: more safe [#METR-19278].

											
										
										
											2015-12-23 07:29:20 +00:00
+										if (!data_variants.isTwoLevel())
 											blocks.splice(blocks.end(), prepareBlocksAndFillSingleLevel(data_variants, final));
 										else
 											blocks.splice(blocks.end(), prepareBlocksAndFillTwoLevel(data_variants, final, thread_pool.get()));
-												dbms: fixed segfault in case of memory limit exceeded [#METR-11220].

											
										
										
											2014-05-22 18:58:41 +00:00
+									}
-												clickhouse: totals mode: development. [#METR-9365]

											
										
										
											2014-02-26 11:44:54 +00:00
-												dbms: merged convertToBlock and finalize aggregation steps whenever possible [#METR-2944].



											
										
										
											2013-11-03 23:35:18 +00:00
+									if (!final)
 									{
-												dbms: more safe [#METR-19278].

											
										
										
											2015-12-23 07:29:20 +00:00
+										/// data_variants не будет уничтожать состояния агрегатных функций в деструкторе.
 										/// Теперь состояниями владеют ColumnAggregateFunction.
-												Improvement [#METR-2807].

											
										
										
											2014-04-08 07:31:51 +00:00
+										data_variants.aggregator = nullptr;
-												dbms: merged convertToBlock and finalize aggregation steps whenever possible [#METR-2944].



											
										
										
											2013-11-03 23:35:18 +00:00
+									}
-												dbms: fixed possible leak [#CONV-2944].



											
										
										
											2013-02-16 18:59:05 +00:00
-												Merge

											
										
										
											2015-04-16 14:27:56 +00:00
+									if (isCancelled())
 										return BlocksList();
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-02 03:16:28 +00:00
+									size_t rows = 0;
 									size_t bytes = 0;
 									for (const auto & block : blocks)
 									{
 										rows += block.rowsInFirstColumn();
 										bytes += block.bytes();
 									}
-												dbms: development [#CONV-2944].



											
										
										
											2012-02-27 06:28:20 +00:00
-												dbms: improved performance of queries with large aggregation result [#CONV-2944].



											
										
										
											2013-02-03 18:39:09 +00:00
+									double elapsed_seconds = watch.elapsedSeconds();
-												dbms: Aggregator: more logging [#CONV-2944].



											
										
										
											2013-02-04 03:31:53 +00:00
+									LOG_TRACE(log, std::fixed << std::setprecision(3)
-												dbms: tiny additions [#METR-14604].

											
										
										
											2015-01-16 21:01:41 +00:00
+										<< "Converted aggregated data to blocks. "
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-02 03:16:28 +00:00
+										<< rows << " rows, " << bytes / 1048576.0 << " MiB"
-												dbms: Aggregator: more logging [#CONV-2944].



											
										
										
											2013-02-04 03:31:53 +00:00
+										<< " in " << elapsed_seconds << " sec."
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-02 03:16:28 +00:00
+										<< " (" << rows / elapsed_seconds << " rows/sec., " << bytes / elapsed_seconds / 1048576.0 << " MiB/sec.)");
-												dbms: development [#CONV-2944].



											
										
										
											2012-05-31 00:33:42 +00:00
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-02 03:16:28 +00:00
+									return blocks;
-												dbms: development [#CONV-2944].



											
										
										
											2012-02-27 06:28:20 +00:00
+								}
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
+								template <typename Method, typename Table>
 								void NO_INLINE Aggregator::mergeDataImpl(
 									Table & table_dst,
 									Table & table_src) const
 								{
 									/** Transfers every entry of table_src into table_dst and then clears table_src.
 									  * A key that is new for table_dst receives the source mapped value as is.
 									  * For a key that already exists, the source states are merged into the destination states
 									  *  and then destroyed.
 									  * In both cases the source state pointer is reset to nullptr afterwards.
 									  */
 									for (auto src_it = table_src.begin(); src_it != table_src.end(); ++src_it)
 									{
 										decltype(src_it) dst_it;
 										bool is_new_key;
 										table_dst.emplace(src_it->first, dst_it, is_new_key, src_it.getHash());

 										if (is_new_key)
 										{
 											/// The destination entry takes over the source value.
 											dst_it->second = src_it->second;
 										}
 										else
 										{
 											/// Two separate passes: every merge is done before the first destroy.
 											for (size_t func = 0; func < params.aggregates_size; ++func)
 												aggregate_functions[func]->merge(
 													Method::getAggregateData(dst_it->second) + offsets_of_aggregate_states[func],
 													Method::getAggregateData(src_it->second) + offsets_of_aggregate_states[func]);

 											for (size_t func = 0; func < params.aggregates_size; ++func)
 												aggregate_functions[func]->destroy(
 													Method::getAggregateData(src_it->second) + offsets_of_aggregate_states[func]);
 										}

 										/// The source no longer refers to the states.
 										Method::getAggregateData(src_it->second) = nullptr;
 									}

 									table_src.clearAndShrink();
 								}
-												dbms: using max_rows_to_group_by limit while merging aggregate states (incomplete) [#METR-18507].

											
										
										
											2015-10-22 01:44:33 +00:00
+								template <typename Method, typename Table>
 								void NO_INLINE Aggregator::mergeDataNoMoreKeysImpl(
 									Table & table_dst,
 									AggregatedDataWithoutKey & overflows,
 									Table & table_src) const
 								{
 									/** Merges table_src into table_dst without adding new keys to table_dst.
 									  * States whose key is found in table_dst are merged into the matching entry;
 									  *  states of all other keys are merged into `overflows`.
 									  * Every source state is destroyed after merging, its pointer is reset to nullptr,
 									  *  and table_src is cleared at the end.
 									  */
 									for (auto src_it = table_src.begin(); src_it != table_src.end(); ++src_it)
 									{
 										decltype(src_it) dst_it = table_dst.find(src_it->first, src_it.getHash());

 										/// Choose where the states of this key are accumulated.
 										AggregateDataPtr target_data;
 										if (table_dst.end() == dst_it)
 											target_data = overflows;
 										else
 											target_data = Method::getAggregateData(dst_it->second);

 										for (size_t func = 0; func < params.aggregates_size; ++func)
 											aggregate_functions[func]->merge(
 												target_data + offsets_of_aggregate_states[func],
 												Method::getAggregateData(src_it->second) + offsets_of_aggregate_states[func]);

 										for (size_t func = 0; func < params.aggregates_size; ++func)
 											aggregate_functions[func]->destroy(
 												Method::getAggregateData(src_it->second) + offsets_of_aggregate_states[func]);

 										Method::getAggregateData(src_it->second) = nullptr;
 									}

 									table_src.clearAndShrink();
 								}
 								/** Merges table_src into table_dst for the keys that already exist in table_dst.
 								  * States of keys that are absent from table_dst are discarded (not merged anywhere).
 								  *
 								  * Every source state is destroyed here, whether it was merged or discarded:
 								  *  table_src is cleared at the end of this function and the caller resets
 								  *  the `aggregator` pointer of the source data, so nothing else would ever
 								  *  destroy the states of discarded keys.
 								  */
 								template <typename Method, typename Table>
 								void NO_INLINE Aggregator::mergeDataOnlyExistingKeysImpl(
 									Table & table_dst,
 									Table & table_src) const
 								{
 									for (auto it = table_src.begin(); it != table_src.end(); ++it)
 									{
 										decltype(it) res_it = table_dst.find(it->first, it.getHash());

 										if (table_dst.end() != res_it)
 										{
 											AggregateDataPtr res_data = Method::getAggregateData(res_it->second);

 											for (size_t i = 0; i < params.aggregates_size; ++i)
 												aggregate_functions[i]->merge(
 													res_data + offsets_of_aggregate_states[i],
 													Method::getAggregateData(it->second) + offsets_of_aggregate_states[i]);
 										}

 										/// Destroy the source state in both cases; previously the states of keys
 										///  missing from table_dst were skipped and never destroyed.
 										for (size_t i = 0; i < params.aggregates_size; ++i)
 											aggregate_functions[i]->destroy(
 												Method::getAggregateData(it->second) + offsets_of_aggregate_states[i]);

 										Method::getAggregateData(it->second) = nullptr;
 									}

 									table_src.clearAndShrink();
 								}
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
+								void NO_INLINE Aggregator::mergeWithoutKeyDataImpl(
 									ManyAggregatedDataVariants & non_empty_data) const
 								{
 									/** Merges the `without_key` states of all elements of non_empty_data into the first element.
 									  * The states of every other element are destroyed after merging
 									  *  and its `without_key` pointer is reset to nullptr.
 									  */
 									AggregatedDataVariantsPtr & merged = non_empty_data[0];

 									const size_t variants_count = non_empty_data.size();
 									for (size_t variant_idx = 1; variant_idx < variants_count; ++variant_idx)
 									{
 										AggregatedDataWithoutKey & dst_state = merged->without_key;
 										AggregatedDataWithoutKey & src_state = non_empty_data[variant_idx]->without_key;

 										for (size_t func = 0; func < params.aggregates_size; ++func)
 											aggregate_functions[func]->merge(
 												dst_state + offsets_of_aggregate_states[func],
 												src_state + offsets_of_aggregate_states[func]);

 										for (size_t func = 0; func < params.aggregates_size; ++func)
 											aggregate_functions[func]->destroy(src_state + offsets_of_aggregate_states[func]);

 										src_state = nullptr;
 									}
 								}
 								/** Merges the single-level hash tables of all elements of non_empty_data into the first element.
 								  * Before each merge checkLimits() is consulted with the current size of the result:
 								  *  if it returns false, merging stops; it may also set no_more_keys,
 								  *  after which new keys are no longer inserted into the result.
 								  */
 								template <typename Method>
 								void NO_INLINE Aggregator::mergeSingleLevelDataImpl(
 									ManyAggregatedDataVariants & non_empty_data) const
 								{
 									AggregatedDataVariantsPtr & merged = non_empty_data[0];
 									bool no_more_keys = false;

 									const size_t variants_count = non_empty_data.size();
 									for (size_t variant_idx = 1; variant_idx < variants_count; ++variant_idx)
 									{
 										if (!checkLimits(merged->sizeWithoutOverflowRow(), no_more_keys))
 											break;

 										AggregatedDataVariants & source = *non_empty_data[variant_idx];

 										if (no_more_keys)
 										{
 											if (merged->without_key)
 											{
 												/// States of new keys are accumulated in the `without_key` state of the result.
 												mergeDataNoMoreKeysImpl<Method>(
 													getDataVariant<Method>(*merged).data,
 													merged->without_key,
 													getDataVariant<Method>(source).data);
 											}
 											else
 											{
 												/// Only keys already present in the result are merged.
 												mergeDataOnlyExistingKeysImpl<Method>(
 													getDataVariant<Method>(*merged).data,
 													getDataVariant<Method>(source).data);
 											}
 										}
 										else
 										{
 											mergeDataImpl<Method>(
 												getDataVariant<Method>(*merged).data,
 												getDataVariant<Method>(source).data);
 										}

 										/// `source` will not destroy the aggregate function states in its destructor.
 										source.aggregator = nullptr;
 									}
 								}
-												dbms: more memory efficient merging aggregated states [#METR-17000].

											
										
										
											2015-12-06 16:22:01 +00:00
+								template <typename Method>
 								void NO_INLINE Aggregator::mergeBucketImpl(
 									ManyAggregatedDataVariants & data, Int32 bucket) const
 								{
 									/** Merges bucket number `bucket` of every element of `data`
 									  *  into the same bucket of the first element.
 									  */
 									AggregatedDataVariantsPtr & merged = data[0];

 									const size_t variants_count = data.size();
 									size_t variant_idx = 1;
 									while (variant_idx < variants_count)
 									{
 										AggregatedDataVariants & source = *data[variant_idx];

 										mergeDataImpl<Method>(
 											getDataVariant<Method>(*merged).data.impls[bucket],
 											getDataVariant<Method>(source).data.impls[bucket]);

 										++variant_idx;
 									}
 								}
 								/** Объединят вместе состояния агрегации, превращает их в блоки и выдаёт потоково.
 								  * Если состояния агрегации двухуровневые, то выдаёт блоки строго по порядку bucket_num.
 								  * (Это важно при распределённой обработке.)
 								  * При этом, может обрабатывать разные bucket-ы параллельно, используя до threads потоков.
 								  */
 								class MergingAndConvertingBlockInputStream : public IProfilingBlockInputStream
 								{
 								public:
 									/** На вход подаётся набор непустых множеств частично агрегированных данных,
 									  *  которые все либо являются одноуровневыми, либо являются двухуровневыми.
 									  */
-												dbms: fixed error [#METR-17000].

											
										
										
											2015-12-08 02:01:46 +00:00
+									MergingAndConvertingBlockInputStream(const Aggregator & aggregator_, ManyAggregatedDataVariants & data_, bool final_, size_t threads_)
-												dbms: more memory efficient merging aggregated states [#METR-17000].

											
										
										
											2015-12-06 16:22:01 +00:00
+										: aggregator(aggregator_), data(data_), final(final_), threads(threads_) {}
 									String getName() const override { return "MergingAndConverting"; }
 									String getID() const override
 									{
 										std::stringstream res;
 										res << this;
 										return res.str();
 									}
 								protected:
 									Block readImpl() override
 									{
 										if (data.empty())
 											return {};
 										if (current_bucket_num >= NUM_BUCKETS)
 											return {};
 										AggregatedDataVariantsPtr & first = data[0];
 										if (current_bucket_num == -1)
 										{
 											++current_bucket_num;
 											if (first->type == AggregatedDataVariants::Type::without_key || aggregator.params.overflow_row)
 											{
 												aggregator.mergeWithoutKeyDataImpl(data);
 												return aggregator.prepareBlocksAndFillWithoutKey(
 													*first, final, first->type != AggregatedDataVariants::Type::without_key).front();
 											}
 										}
 										if (!first->isTwoLevel())
 										{
 											if (current_bucket_num > 0)
 												return {};
-												dbms: fixed error [#METR-17000].

											
										
										
											2015-12-06 16:42:17 +00:00
+											if (first->type == AggregatedDataVariants::Type::without_key)
 												return {};
-												dbms: more memory efficient merging aggregated states [#METR-17000].

											
										
										
											2015-12-06 16:22:01 +00:00
+											++current_bucket_num;
 										#define M(NAME) \
 											else if (first->type == AggregatedDataVariants::Type::NAME) \
 												aggregator.mergeSingleLevelDataImpl<decltype(first->NAME)::element_type>(data);
 											if (false) {}
 											APPLY_FOR_VARIANTS_SINGLE_LEVEL(M)
 										#undef M
-												dbms: fixed error [#METR-17000].

											
										
										
											2015-12-06 16:42:17 +00:00
+											else
-												dbms: more memory efficient merging aggregated states [#METR-17000].

											
										
										
											2015-12-06 16:22:01 +00:00
+												throw Exception("Unknown aggregated data variant.", ErrorCodes::UNKNOWN_AGGREGATED_DATA_VARIANT);
 											return aggregator.prepareBlocksAndFillSingleLevel(*first, final).front();
 										}
 										else
 										{
 											if (!parallel_merge_data)
 											{
 												parallel_merge_data.reset(new ParallelMergeData(threads));
 												for (size_t i = 0; i < threads; ++i)
 													scheduleThreadForNextBucket();
 											}
 											Block res;
 											while (true)
 											{
 												std::unique_lock<std::mutex> lock(parallel_merge_data->mutex);
 												if (parallel_merge_data->exception)
 													std::rethrow_exception(parallel_merge_data->exception);
 												auto it = parallel_merge_data->ready_blocks.find(current_bucket_num);
 												if (it != parallel_merge_data->ready_blocks.end())
 												{
 													++current_bucket_num;
 													scheduleThreadForNextBucket();
-												dbms: Aggregator: fixes [#METR-19371].

											
										
										
											2015-12-11 01:11:59 +00:00
+													if (it->second)
-												dbms: more memory efficient merging aggregated states [#METR-17000].

											
										
										
											2015-12-06 16:22:01 +00:00
+													{
 														res.swap(it->second);
 														break;
 													}
 													else if (current_bucket_num >= NUM_BUCKETS)
 														break;
 												}
 												parallel_merge_data->condvar.wait(lock);
 											}
 											return res;
 										}
 									}
 								private:
-												dbms: fixed error [#METR-17000].

											
										
										
											2015-12-08 02:01:46 +00:00
+									const Aggregator & aggregator;
-												dbms: more memory efficient merging aggregated states [#METR-17000].

											
										
										
											2015-12-06 16:22:01 +00:00
+									ManyAggregatedDataVariants data;
 									bool final;
 									size_t threads;
 									Int32 current_bucket_num = -1;
 									Int32 max_scheduled_bucket_num = -1;
 									static constexpr Int32 NUM_BUCKETS = 256;
 									struct ParallelMergeData
 									{
-												Removed useless code (experimental) [#METR-2944].

											
										
										
											2016-08-02 01:46:05 +00:00
+										ThreadPool pool;
-												dbms: more memory efficient merging aggregated states [#METR-17000].

											
										
										
											2015-12-06 16:22:01 +00:00
+										std::map<Int32, Block> ready_blocks;
 										std::exception_ptr exception;
 										std::mutex mutex;
 										std::condition_variable condvar;
 										ParallelMergeData(size_t threads) : pool(threads) {}
-												dbms: better [#METR-19278].

											
										
										
											2015-12-23 07:35:36 +00:00
 										~ParallelMergeData()
 										{
 											LOG_TRACE(&Logger::get(__PRETTY_FUNCTION__), "Waiting for threads to finish");
 											pool.wait();
 										}
-												dbms: more memory efficient merging aggregated states [#METR-17000].

											
										
										
											2015-12-06 16:22:01 +00:00
+									};
 									std::unique_ptr<ParallelMergeData> parallel_merge_data;
 									void scheduleThreadForNextBucket()
 									{
 										++max_scheduled_bucket_num;
 										if (max_scheduled_bucket_num >= NUM_BUCKETS)
 											return;
 										parallel_merge_data->pool.schedule(std::bind(&MergingAndConvertingBlockInputStream::thread, this,
 											max_scheduled_bucket_num, current_memory_tracker));
 									}
 									void thread(Int32 bucket_num, MemoryTracker * memory_tracker)
 									{
 										current_memory_tracker = memory_tracker;
 										setThreadName("MergingAggregtd");
-												dbms: CurrentMetrics: development [#METR-19596].

											
										
										
											2016-01-21 01:47:28 +00:00
+										CurrentMetrics::Increment metric_increment{CurrentMetrics::QueryThread};
-												dbms: more memory efficient merging aggregated states [#METR-17000].

											
										
										
											2015-12-06 16:22:01 +00:00
 										try
 										{
 											/// TODO Возможно, поддержать no_more_keys
 											auto & merged_data = *data[0];
 											auto method = merged_data.type;
 											Block block;
 											if (false) {}
 										#define M(NAME) \
 											else if (method == AggregatedDataVariants::Type::NAME) \
 											{ \
 												aggregator.mergeBucketImpl<decltype(merged_data.NAME)::element_type>(data, bucket_num); \
 												block = aggregator.convertOneBucketToBlock(merged_data, *merged_data.NAME, final, bucket_num); \
 											}
 											APPLY_FOR_VARIANTS_TWO_LEVEL(M)
 										#undef M
 											std::lock_guard<std::mutex> lock(parallel_merge_data->mutex);
 											parallel_merge_data->ready_blocks[bucket_num] = std::move(block);
 										}
 										catch (...)
 										{
 											std::lock_guard<std::mutex> lock(parallel_merge_data->mutex);
-												dbms: better [#METR-19278].

											
										
										
											2015-12-23 07:06:34 +00:00
+											if (!parallel_merge_data->exception)
 												parallel_merge_data->exception = std::current_exception();
-												dbms: more memory efficient merging aggregated states [#METR-17000].

											
										
										
											2015-12-06 16:22:01 +00:00
+										}
 										parallel_merge_data->condvar.notify_all();
 									}
 								};
-												dbms: more safe [#METR-19278].

											
										
										
											2015-12-23 07:29:20 +00:00
+								std::unique_ptr<IBlockInputStream> Aggregator::mergeAndConvertToBlocks(
 									ManyAggregatedDataVariants & data_variants, bool final, size_t max_threads) const
 								{
 									/** Prepares the given partially aggregated data for merging and returns a stream
 									  *  that merges it and yields the result as blocks.
 									  *
 									  * Throws EMPTY_DATA_PASSED if data_variants is empty, and
 									  *  CANNOT_MERGE_DIFFERENT_AGGREGATED_DATA_VARIANTS if the non-empty variants have different types.
 									  * Returns a NullBlockInputStream if every variant is empty.
 									  */
 									if (data_variants.empty())
 										throw Exception("Empty data passed to Aggregator::mergeAndConvertToBlocks.", ErrorCodes::EMPTY_DATA_PASSED);

 									LOG_TRACE(log, "Merging aggregated data");

 									/// Only non-empty variants take part in the merge.
 									ManyAggregatedDataVariants non_empty_data;
 									non_empty_data.reserve(data_variants.size());
 									for (auto & candidate : data_variants)
 									{
 										if (candidate->empty())
 											continue;
 										non_empty_data.push_back(candidate);
 									}

 									if (non_empty_data.empty())
 										return std::make_unique<NullBlockInputStream>();

 									/// Sort the states by decreasing size to make the merge more efficient (all states are merged into the first one).
 									/// With a single element the sort has nothing to do.
 									std::sort(non_empty_data.begin(), non_empty_data.end(),
 										[](const AggregatedDataVariantsPtr & lhs, const AggregatedDataVariantsPtr & rhs)
 										{
 											return lhs->sizeWithoutOverflowRow() > rhs->sizeWithoutOverflowRow();
 										});

 									/// If at least one of the variants is two-level, convert all the others to two-level as well.
 									/// Note - it might be more optimal not to convert single-level variants before the merge, but to merge them separately at the end.
 									const bool has_at_least_one_two_level = std::any_of(non_empty_data.begin(), non_empty_data.end(),
 										[](const AggregatedDataVariantsPtr & variant) { return variant->isTwoLevel(); });

 									if (has_at_least_one_two_level)
 									{
 										for (auto & variant : non_empty_data)
 										{
 											if (variant->isTwoLevel())
 												continue;
 											variant->convertToTwoLevel();
 										}
 									}

 									AggregatedDataVariantsPtr & first = non_empty_data[0];

 									const size_t variants_count = non_empty_data.size();
 									for (size_t variant_idx = 1; variant_idx < variants_count; ++variant_idx)
 									{
 										AggregatedDataVariantsPtr & other = non_empty_data[variant_idx];

 										if (first->type != other->type)
 											throw Exception("Cannot merge different aggregated data variants.", ErrorCodes::CANNOT_MERGE_DIFFERENT_AGGREGATED_DATA_VARIANTS);

 										/** Elements from the other data sets may be moved into the first one.
 										  * Therefore it must own all the arenas of all the other sets.
 										  */
 										first->aggregates_pools.insert(first->aggregates_pools.end(),
 											other->aggregates_pools.begin(), other->aggregates_pools.end());
 									}

 									return std::make_unique<MergingAndConvertingBlockInputStream>(*this, non_empty_data, final, max_threads);
 								}
-												dbms: using 'max_rows_to_group_by' limit while merging aggregate states (in certain cases) [#METR-18507].

											
										
										
											2015-10-23 01:43:42 +00:00
+								template <bool no_more_keys, typename Method, typename Table>
 								void NO_INLINE Aggregator::mergeStreamsImplCase(
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
+									Block & block,
-												dbms: better exception safety [#METR-15530].

											
										
										
											2015-03-23 01:10:06 +00:00
+									const Sizes & key_sizes,
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 06:49:32 +00:00
+									Arena * aggregates_pool,
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
+									Method & method,
-												dbms: using 'max_rows_to_group_by' limit while merging aggregate states (in certain cases) [#METR-18507].

											
										
										
											2015-10-23 01:43:42 +00:00
+									Table & data,
 									AggregateDataPtr overflow_row) const
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
+								{
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+									ConstColumnPlainPtrs key_columns(params.keys_size);
 									AggregateColumnsData aggregate_columns(params.aggregates_size);
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
 									/// Запоминаем столбцы, с которыми будем работать
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+									for (size_t i = 0; i < params.keys_size; ++i)
-												Using std::shared_ptr for columns [#METR-21503].

											
										
										
											2016-05-28 05:31:36 +00:00
+										key_columns[i] = block.getByPosition(i).column.get();
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+									for (size_t i = 0; i < params.aggregates_size; ++i)
 										aggregate_columns[i] = &typeid_cast<ColumnAggregateFunction &>(*block.getByPosition(params.keys_size + i).column).getData();
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 06:49:32 +00:00
+									typename Method::State state;
 									state.init(key_columns);
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
 									/// Для всех строчек.
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+									StringRefs keys(params.keys_size);
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
+									size_t rows = block.rowsInFirstColumn();
 									for (size_t i = 0; i < rows; ++i)
 									{
 										typename Table::iterator it;
-												dbms: using 'max_rows_to_group_by' limit while merging aggregate states (in certain cases) [#METR-18507].

											
										
										
											2015-10-23 01:43:42 +00:00
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
+										bool inserted;			/// Вставили новый ключ, или такой ключ уже был?
-												dbms: using 'max_rows_to_group_by' limit while merging aggregate states (in certain cases) [#METR-18507].

											
										
										
											2015-10-23 01:43:42 +00:00
+										bool overflow = false;	/// Новый ключ не поместился в хэш-таблицу из-за no_more_keys.
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
 										/// Получаем ключ для вставки в хэш-таблицу.
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+										auto key = state.getKey(key_columns, params.keys_size, i, key_sizes, keys, *aggregates_pool);
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
-												dbms: using 'max_rows_to_group_by' limit while merging aggregate states (in certain cases) [#METR-18507].

											
										
										
											2015-10-23 01:43:42 +00:00
+										if (!no_more_keys)
 										{
 											data.emplace(key, it, inserted);
 										}
 										else
 										{
 											inserted = false;
 											it = data.find(key);
 											if (data.end() == it)
 												overflow = true;
 										}
 										/// Если ключ не поместился, и данные не надо агрегировать в отдельную строку, то делать нечего.
 										if (no_more_keys && overflow && !overflow_row)
 										{
 											method.onExistingKey(key, keys, *aggregates_pool);
 											continue;
 										}
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
-												dbms: using 'max_rows_to_group_by' limit while merging aggregate states (in certain cases) [#METR-18507].

											
										
										
											2015-10-23 01:43:42 +00:00
+										/// Если вставили новый ключ - инициализируем состояния агрегатных функций, и возможно, что-нибудь связанное с ключом.
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
+										if (inserted)
 										{
 											AggregateDataPtr & aggregate_data = Method::getAggregateData(it->second);
-												dbms: fixed exception safety [#METR-15352].

											
										
										
											2015-03-07 01:05:06 +00:00
+											aggregate_data = nullptr;
-												dbms: better exception safety [#METR-15530].

											
										
										
											2015-03-23 01:10:06 +00:00
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+											method.onNewKey(*it, params.keys_size, i, keys, *aggregates_pool);
-												dbms: better exception safety [#METR-15530].

											
										
										
											2015-03-23 01:10:06 +00:00
-												dbms: fixed exception safety [#METR-15352].

											
										
										
											2015-03-07 01:05:06 +00:00
+											AggregateDataPtr place = aggregates_pool->alloc(total_size_of_aggregate_states);
 											createAggregateStates(place);
 											aggregate_data = place;
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
+										}
-												dbms: added aggregation method 'concat' - performance improvement in generic case [#METR-2944].

											
										
										
											2015-02-22 16:09:16 +00:00
+										else
 											method.onExistingKey(key, keys, *aggregates_pool);
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
-												dbms: using 'max_rows_to_group_by' limit while merging aggregate states (in certain cases) [#METR-18507].

											
										
										
											2015-10-23 01:43:42 +00:00
+										AggregateDataPtr value = (!no_more_keys || !overflow) ? Method::getAggregateData(it->second) : overflow_row;
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
+										/// Мерджим состояния агрегатных функций.
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+										for (size_t j = 0; j < params.aggregates_size; ++j)
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
+											aggregate_functions[j]->merge(
-												dbms: using 'max_rows_to_group_by' limit while merging aggregate states (in certain cases) [#METR-18507].

											
										
										
											2015-10-23 01:43:42 +00:00
+												value + offsets_of_aggregate_states[j],
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
+												(*aggregate_columns[j])[i]);
 									}
-												dbms: slightly lowered memory usage of distributed aggregation [#METR-2944].

											
										
										
											2015-01-27 23:02:05 +00:00
 									/// Пораньше освобождаем память.
 									block.clear();
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
+								}
-												dbms: using 'max_rows_to_group_by' limit while merging aggregate states (in certain cases) [#METR-18507].

											
										
										
											2015-10-23 01:43:42 +00:00
+								template <typename Method, typename Table>
 								void NO_INLINE Aggregator::mergeStreamsImpl(
 									Block & block,
 									const Sizes & key_sizes,
 									Arena * aggregates_pool,
 									Method & method,
 									Table & data,
 									AggregateDataPtr overflow_row,
 									bool no_more_keys) const
 								{
 									if (!no_more_keys)
 										mergeStreamsImplCase<false>(block, key_sizes, aggregates_pool, method, data, overflow_row);
 									else
 										mergeStreamsImplCase<true>(block, key_sizes, aggregates_pool, method, data, overflow_row);
 								}
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
+								void NO_INLINE Aggregator::mergeWithoutKeyStreamsImpl(
 									Block & block,
 									AggregatedDataVariants & result) const
 								{
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+									AggregateColumnsData aggregate_columns(params.aggregates_size);
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
 									/// Запоминаем столбцы, с которыми будем работать
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+									for (size_t i = 0; i < params.aggregates_size; ++i)
 										aggregate_columns[i] = &typeid_cast<ColumnAggregateFunction &>(*block.getByPosition(params.keys_size + i).column).getData();
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
 									AggregatedDataWithoutKey & res = result.without_key;
 									if (!res)
 									{
-												dbms: fixed exception safety [#METR-15352].

											
										
										
											2015-03-07 01:05:06 +00:00
+										AggregateDataPtr place = result.aggregates_pool->alloc(total_size_of_aggregate_states);
 										createAggregateStates(place);
 										res = place;
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
+									}
 									/// Добавляем значения
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+									for (size_t i = 0; i < params.aggregates_size; ++i)
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
+										aggregate_functions[i]->merge(res + offsets_of_aggregate_states[i], (*aggregate_columns[i])[0]);
-												dbms: slightly lowered memory usage of distributed aggregation [#METR-2944].

											
										
										
											2015-01-27 23:02:05 +00:00
 									/// Пораньше освобождаем память.
 									block.clear();
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
+								}
 								void Aggregator::mergeStream(BlockInputStreamPtr stream, AggregatedDataVariants & result, size_t max_threads)
-												dbms: development [#CONV-2944].



											
										
										
											2012-05-30 01:38:02 +00:00
+								{
-												Merge

											
										
										
											2015-04-16 14:27:56 +00:00
+									if (isCancelled())
 										return;
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+									StringRefs key(params.keys_size);
 									ConstColumnPlainPtrs key_columns(params.keys_size);
-												dbms: development [#CONV-2944].



											
										
										
											2012-05-30 01:38:02 +00:00
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+									AggregateColumnsData aggregate_columns(params.aggregates_size);
-												dbms: development [#CONV-2944].



											
										
										
											2012-05-30 01:38:02 +00:00
-												dbms: fixed error in memory-efficient merging of aggregated states [#METR-17000].

											
										
										
											2015-12-09 02:56:18 +00:00
+									initialize({});
-												dbms: probably fixed error in Aggregator [#CONV-2944].



											
										
										
											2013-02-13 19:24:19 +00:00
-												Merge

											
										
										
											2015-04-16 14:27:56 +00:00
+									if (isCancelled())
 										return;
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 03:18:49 +00:00
+									/** Если на удалённых серверах использовался двухуровневый метод агрегации,
 									  *  то в блоках будет расположена информация о номере корзины.
 									  * Тогда вычисления можно будет распараллелить по корзинам.
 									  * Разложим блоки по указанным в них номерам корзин.
 									  */
 									using BucketToBlocks = std::map<Int32, BlocksList>;
 									BucketToBlocks bucket_to_blocks;
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+									/// Читаем все данные.
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
+									LOG_TRACE(log, "Reading blocks of partially aggregated data.");
 									size_t total_input_rows = 0;
 									size_t total_input_blocks = 0;
-												dbms: development [#CONV-2944].



											
										
										
											2012-05-30 01:38:02 +00:00
+									while (Block block = stream->read())
 									{
-												Merge

											
										
										
											2015-04-16 14:27:56 +00:00
+										if (isCancelled())
 											return;
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
+										total_input_rows += block.rowsInFirstColumn();
 										++total_input_blocks;
 										bucket_to_blocks[block.info.bucket_num].emplace_back(std::move(block));
 									}
 									LOG_TRACE(log, "Read " << total_input_blocks << " blocks of partially aggregated data, total " << total_input_rows << " rows.");
 									if (bucket_to_blocks.empty())
 										return;
-												dbms: fixed error in memory-efficient merging of aggregated states [#METR-17000].

											
										
										
											2015-12-09 02:56:18 +00:00
+									setSampleBlock(bucket_to_blocks.begin()->second.front());
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
 									/// Каким способом выполнять агрегацию?
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+									for (size_t i = 0; i < params.keys_size; ++i)
-												Using std::shared_ptr for columns [#METR-21503].

											
										
										
											2016-05-28 05:31:36 +00:00
+										key_columns[i] = sample.getByPosition(i).column.get();
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
 									Sizes key_sizes;
 									AggregatedDataVariants::Type method = chooseAggregationMethod(key_columns, key_sizes);
 									/** Минус единицей обозначается отсутствие информации о корзине
 									  * - в случае одноуровневой агрегации, а также для блоков с "переполнившимися" значениями.
 									  * Если есть хотя бы один блок с номером корзины больше нуля, значит была двухуровневая агрегация.
 									  */
-												dbms: fixed error with higher than usual memory usage [#METR-15530].

											
										
										
											2015-03-24 00:39:30 +00:00
+									auto max_bucket = bucket_to_blocks.rbegin()->first;
-												dbms: fixed error [#METR-15530].

											
										
										
											2015-03-19 05:15:38 +00:00
+									size_t has_two_level = max_bucket > 0;
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
 									if (has_two_level)
 									{
 									#define M(NAME) \
 										if (method == AggregatedDataVariants::Type::NAME) \
 											method = AggregatedDataVariants::Type::NAME ## _two_level;
-												dbms: improved performance on short queries [#METR-11571].

											
										
										
											2014-06-26 00:58:14 +00:00
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
+										APPLY_FOR_VARIANTS_CONVERTIBLE_TO_TWO_LEVEL(M)
-												dbms: improved performance on short queries [#METR-11571].

											
										
										
											2014-06-26 00:58:14 +00:00
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
+									#undef M
 									}
-												dbms: development [#CONV-2944].



											
										
										
											2012-05-30 01:38:02 +00:00
-												Merge

											
										
										
											2015-04-16 14:27:56 +00:00
+									if (isCancelled())
 										return;
-												dbms: better exception safety [#METR-15530].

											
										
										
											2015-03-23 01:10:06 +00:00
+									/// result будет уничтожать состояния агрегатных функций в деструкторе
 									result.aggregator = this;
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
+									result.init(method);
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+									result.keys_size = params.keys_size;
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
+									result.key_sizes = key_sizes;
-												dbms: development [#CONV-2944].



											
										
										
											2012-05-30 01:38:02 +00:00
-												dbms: fixed error [#METR-14604].

											
										
										
											2015-01-17 04:49:13 +00:00
+									bool has_blocks_with_unknown_bucket = bucket_to_blocks.count(-1);
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
+									/// Сначала параллельно мерджим для отдельных bucket-ов. Затем домердживаем данные, не распределённые по bucket-ам.
 									if (has_two_level)
 									{
-												dbms: using 'max_rows_to_group_by' limit while merging aggregate states (in certain cases) [#METR-18507].

											
										
										
											2015-10-23 01:43:42 +00:00
+										/** В этом случае, no_more_keys не поддерживается в связи с тем, что
 										  *  из разных потоков трудно обновлять общее состояние для "остальных" ключей (overflows).
 										  * То есть, ключей в итоге может оказаться существенно больше, чем max_rows_to_group_by.
 										  */
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
+										LOG_TRACE(log, "Merging partially aggregated two-level data.");
-												dbms: development [#CONV-2944].



											
										
										
											2012-05-30 01:38:02 +00:00
-												dbms: better exception safety [#METR-15530].

											
										
										
											2015-03-23 01:10:06 +00:00
+										auto merge_bucket = [&bucket_to_blocks, &result, &key_sizes, this](Int32 bucket, Arena * aggregates_pool, MemoryTracker * memory_tracker)
-												dbms: improved performance for small queries [#METR-8582].



											
										
										
											2013-12-16 02:32:00 +00:00
+										{
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
+											current_memory_tracker = memory_tracker;
-												dbms: development [#CONV-2944].



											
										
										
											2012-05-30 01:38:02 +00:00
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
+											for (Block & block : bucket_to_blocks[bucket])
-												dbms: development [#CONV-2944].



											
										
										
											2012-05-30 01:38:02 +00:00
+											{
-												Merge

											
										
										
											2015-04-16 14:27:56 +00:00
+												if (isCancelled())
 													return;
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
+											#define M(NAME) \
 												else if (result.type == AggregatedDataVariants::Type::NAME) \
-												dbms: using 'max_rows_to_group_by' limit while merging aggregate states (in certain cases) [#METR-18507].

											
										
										
											2015-10-23 01:43:42 +00:00
+													mergeStreamsImpl(block, key_sizes, aggregates_pool, *result.NAME, result.NAME->data.impls[bucket], nullptr, false);
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
 												if (false) {}
 													APPLY_FOR_VARIANTS_TWO_LEVEL(M)
 											#undef M
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 06:49:32 +00:00
+												else
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
+													throw Exception("Unknown aggregated data variant.", ErrorCodes::UNKNOWN_AGGREGATED_DATA_VARIANT);
-												dbms: development [#CONV-2944].



											
										
										
											2012-05-30 01:38:02 +00:00
+											}
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
+										};
-												dbms: development [#CONV-2944].



											
										
										
											2012-05-30 03:30:29 +00:00
-												Removed useless code (experimental) [#METR-2944].

											
										
										
											2016-08-02 01:46:05 +00:00
+										std::unique_ptr<ThreadPool> thread_pool;
-												dbms: fixed error with exception safety [#METR-15357].

											
										
										
											2015-03-16 19:24:57 +00:00
+										if (max_threads > 1 && total_input_rows > 100000	/// TODO Сделать настраиваемый порог.
 											&& has_two_level)
-												Removed useless code (experimental) [#METR-2944].

											
										
										
											2016-08-02 01:46:05 +00:00
+											thread_pool.reset(new ThreadPool(max_threads));
-												dbms: fixed error with exception safety [#METR-15357].

											
										
										
											2015-03-16 19:24:57 +00:00
-												dbms: better exception safety [#METR-15530].

											
										
										
											2015-03-23 01:10:06 +00:00
+										for (const auto & bucket_blocks : bucket_to_blocks)
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
+										{
-												dbms: better exception safety [#METR-15530].

											
										
										
											2015-03-23 01:10:06 +00:00
+											const auto bucket = bucket_blocks.first;
-												dbms: fixed error [#METR-14604].

											
										
										
											2015-01-17 04:49:13 +00:00
 											if (bucket == -1)
 												continue;
-												Using std::shared_ptr for data types [#METR-21503].

											
										
										
											2016-05-28 10:15:36 +00:00
+											result.aggregates_pools.push_back(std::make_shared<Arena>());
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 06:49:32 +00:00
+											Arena * aggregates_pool = result.aggregates_pools.back().get();
-												Removed useless code (experimental) [#METR-2944].

											
										
										
											2016-08-02 01:46:05 +00:00
+											auto task = std::bind(merge_bucket, bucket, aggregates_pool, current_memory_tracker);
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
 											if (thread_pool)
-												Removed useless code (experimental) [#METR-2944].

											
										
										
											2016-08-02 01:46:05 +00:00
+												thread_pool->schedule(task);
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
+											else
-												Removed useless code (experimental) [#METR-2944].

											
										
										
											2016-08-02 01:46:05 +00:00
+												task();
-												dbms: development [#CONV-2944].



											
										
										
											2012-05-30 01:38:02 +00:00
+										}
-												dbms: fixed error after adding 'WITH TOTALS' modifier [#CONV-7489].



											
										
										
											2013-05-06 11:45:28 +00:00
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
+										if (thread_pool)
 											thread_pool->wait();
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2014-12-30 10:16:23 +00:00
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
+										LOG_TRACE(log, "Merged partially aggregated two-level data.");
 									}
-												Merge

											
										
										
											2015-04-16 14:27:56 +00:00
+									if (isCancelled())
 									{
 										result.invalidate();
 										return;
 									}
-												dbms: fixed error [#METR-14604].

											
										
										
											2015-01-17 04:49:13 +00:00
+									if (has_blocks_with_unknown_bucket)
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
+									{
 										LOG_TRACE(log, "Merging partially aggregated single-level data.");
-												dbms: using 'max_rows_to_group_by' limit while merging aggregate states (in certain cases) [#METR-18507].

											
										
										
											2015-10-23 01:43:42 +00:00
+										bool no_more_keys = false;
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
+										BlocksList & blocks = bucket_to_blocks[-1];
 										for (Block & block : blocks)
 										{
-												Merge

											
										
										
											2015-04-16 14:27:56 +00:00
+											if (isCancelled())
 											{
 												result.invalidate();
 												return;
 											}
-												dbms: using 'max_rows_to_group_by' limit while merging aggregate states (in certain cases) [#METR-18507].

											
										
										
											2015-10-23 01:43:42 +00:00
+											if (!checkLimits(result.sizeWithoutOverflowRow(), no_more_keys))
 												break;
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
+											if (result.type == AggregatedDataVariants::Type::without_key || block.info.is_overflows)
 												mergeWithoutKeyStreamsImpl(block, result);
 										#define M(NAME, IS_TWO_LEVEL) \
 											else if (result.type == AggregatedDataVariants::Type::NAME) \
-												dbms: using 'max_rows_to_group_by' limit while merging aggregate states (in certain cases) [#METR-18507].

											
										
										
											2015-10-23 01:43:42 +00:00
+												mergeStreamsImpl(block, key_sizes, result.aggregates_pool, *result.NAME, result.NAME->data, result.without_key, no_more_keys);
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
 											APPLY_FOR_AGGREGATED_VARIANTS(M)
 										#undef M
 											else if (result.type != AggregatedDataVariants::Type::without_key)
 												throw Exception("Unknown aggregated data variant.", ErrorCodes::UNKNOWN_AGGREGATED_DATA_VARIANT);
 										}
 										LOG_TRACE(log, "Merged partially aggregated single-level data.");
 									}
 								}
-												dbms: added memory-efficient mode of distributed aggregation [#METR-17536].

											
										
										
											2015-07-30 23:41:02 +00:00
+								Block Aggregator::mergeBlocks(BlocksList & blocks, bool final)
 								{
 									if (blocks.empty())
 										return {};
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+									StringRefs key(params.keys_size);
 									ConstColumnPlainPtrs key_columns(params.keys_size);
-												dbms: added memory-efficient mode of distributed aggregation [#METR-17536].

											
										
										
											2015-07-30 23:41:02 +00:00
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+									AggregateColumnsData aggregate_columns(params.aggregates_size);
-												dbms: added memory-efficient mode of distributed aggregation [#METR-17536].

											
										
										
											2015-07-30 23:41:02 +00:00
-												dbms: fixed error in memory-efficient merging of aggregated states [#METR-17000].

											
										
										
											2015-12-09 02:56:18 +00:00
+									initialize({});
 									setSampleBlock(blocks.front());
-												dbms: added memory-efficient mode of distributed aggregation [#METR-17536].

											
										
										
											2015-07-30 23:41:02 +00:00
 									/// Каким способом выполнять агрегацию?
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+									for (size_t i = 0; i < params.keys_size; ++i)
-												Using std::shared_ptr for columns [#METR-21503].

											
										
										
											2016-05-28 05:31:36 +00:00
+										key_columns[i] = sample.getByPosition(i).column.get();
-												dbms: added memory-efficient mode of distributed aggregation [#METR-17536].

											
										
										
											2015-07-30 23:41:02 +00:00
 									Sizes key_sizes;
 									AggregatedDataVariants::Type method = chooseAggregationMethod(key_columns, key_sizes);
 									/// Временные данные для агрегации.
 									AggregatedDataVariants result;
 									/// result будет уничтожать состояния агрегатных функций в деструкторе
 									result.aggregator = this;
 									result.init(method);
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+									result.keys_size = params.keys_size;
-												dbms: added memory-efficient mode of distributed aggregation [#METR-17536].

											
										
										
											2015-07-30 23:41:02 +00:00
+									result.key_sizes = key_sizes;
-												dbms: Aggregator: fixes [#METR-19371].

											
										
										
											2015-12-11 00:34:00 +00:00
+									auto bucket_num = blocks.front().info.bucket_num;
 									LOG_TRACE(log, "Merging partially aggregated blocks (bucket = " << bucket_num << ").");
-												dbms: added memory-efficient mode of distributed aggregation [#METR-17536].

											
										
										
											2015-07-30 23:41:02 +00:00
 									for (Block & block : blocks)
 									{
 										if (result.type == AggregatedDataVariants::Type::without_key || block.info.is_overflows)
 											mergeWithoutKeyStreamsImpl(block, result);
 									#define M(NAME, IS_TWO_LEVEL) \
 										else if (result.type == AggregatedDataVariants::Type::NAME) \
-												dbms: using 'max_rows_to_group_by' limit while merging aggregate states (in certain cases) [#METR-18507].

											
										
										
											2015-10-23 01:43:42 +00:00
+											mergeStreamsImpl(block, key_sizes, result.aggregates_pool, *result.NAME, result.NAME->data, nullptr, false);
-												dbms: added memory-efficient mode of distributed aggregation [#METR-17536].

											
										
										
											2015-07-30 23:41:02 +00:00
 										APPLY_FOR_AGGREGATED_VARIANTS(M)
 									#undef M
 										else if (result.type != AggregatedDataVariants::Type::without_key)
 											throw Exception("Unknown aggregated data variant.", ErrorCodes::UNKNOWN_AGGREGATED_DATA_VARIANT);
 									}
-												dbms: memory efficient distributed aggregation: development [#METR-17536].

											
										
										
											2015-09-07 20:08:02 +00:00
+									BlocksList merged_blocks = convertToBlocks(result, final, 1);
-												dbms: added memory-efficient mode of distributed aggregation [#METR-17536].

											
										
										
											2015-07-30 23:41:02 +00:00
-												dbms: memory efficient distributed aggregation: development [#METR-17536].

											
										
										
											2015-09-07 20:08:02 +00:00
+									if (merged_blocks.size() > 1)
 									{
 										/** Может быть два блока. Один с is_overflows, другой - нет.
 										  * Если есть непустой блок не is_overflows, то удаляем блок с is_overflows.
 										  * Если есть пустой блок не is_overflows и блок с is_overflows, то удаляем пустой блок.
 										  *
 										  * Это делаем, потому что исходим из допущения, что в функцию передаются
 										  *  либо все блоки не is_overflows, либо все блоки is_overflows.
 										  */
 										bool has_nonempty_nonoverflows = false;
 										bool has_overflows = false;
 										for (const auto & block : merged_blocks)
 										{
-												dbms: fixed error [#METR-17536].

											
										
										
											2015-09-14 21:09:33 +00:00
+											if (block && block.rowsInFirstColumn() && !block.info.is_overflows)
-												dbms: memory efficient distributed aggregation: development [#METR-17536].

											
										
										
											2015-09-07 20:08:02 +00:00
+												has_nonempty_nonoverflows = true;
 											else if (block.info.is_overflows)
 												has_overflows = true;
 										}
 										if (has_nonempty_nonoverflows)
 										{
 											for (auto it = merged_blocks.begin(); it != merged_blocks.end(); ++it)
 											{
 												if (it->info.is_overflows)
 												{
 													merged_blocks.erase(it);
 													break;
 												}
 											}
 										}
 										else if (has_overflows)
 										{
 											for (auto it = merged_blocks.begin(); it != merged_blocks.end(); ++it)
 											{
-												dbms: fixed error [#METR-17536].

											
										
										
											2015-09-14 21:09:33 +00:00
+												if (!*it || it->rowsInFirstColumn() == 0)
-												dbms: memory efficient distributed aggregation: development [#METR-17536].

											
										
										
											2015-09-07 20:08:02 +00:00
+												{
 													merged_blocks.erase(it);
 													break;
 												}
 											}
 										}
 										if (merged_blocks.size() > 1)
 											throw Exception("Logical error: temporary result is not single-level", ErrorCodes::LOGICAL_ERROR);
 									}
-												dbms: added memory-efficient mode of distributed aggregation [#METR-17536].

											
										
										
											2015-07-30 23:41:02 +00:00
 									LOG_TRACE(log, "Merged partially aggregated blocks.");
-												dbms: memory efficient distributed aggregation: development [#METR-17536].

											
										
										
											2015-09-07 20:08:02 +00:00
+									if (merged_blocks.empty())
-												dbms: added memory-efficient mode of distributed aggregation [#METR-17536].

											
										
										
											2015-07-30 23:41:02 +00:00
+										return {};
-												dbms: Aggregator: fixes [#METR-19371].

											
										
										
											2015-12-11 00:34:00 +00:00
+									auto res = std::move(merged_blocks.front());
 									res.info.bucket_num = bucket_num;
 									return res;
-												dbms: added memory-efficient mode of distributed aggregation [#METR-17536].

											
										
										
											2015-07-30 23:41:02 +00:00
+								}
-												dbms: development of memory efficient distributed aggregation method [#METR-17536].

											
										
										
											2015-09-07 07:40:14 +00:00
+								template <typename Method>
 								void NO_INLINE Aggregator::convertBlockToTwoLevelImpl(
 									Method & method,
 									Arena * pool,
 									ConstColumnPlainPtrs & key_columns,
 									const Sizes & key_sizes,
 									StringRefs & keys,
 									const Block & source,
 									std::vector<Block> & destinations) const
 								{
 									typename Method::State state;
 									state.init(key_columns);
 									size_t rows = source.rowsInFirstColumn();
 									size_t columns = source.columns();
-												dbms: fixed error [#METR-17536].

											
										
										
											2015-09-10 01:58:37 +00:00
+									/// Для каждого номера корзины создадим фильтр, где будут отмечены строки, относящиеся к этой корзине.
 									std::vector<IColumn::Filter> filters(destinations.size());
-												dbms: development of memory efficient distributed aggregation method [#METR-17536].

											
										
										
											2015-09-07 07:40:14 +00:00
+									/// Для всех строчек.
 									for (size_t i = 0; i < rows; ++i)
 									{
 										/// Получаем ключ. Вычисляем на его основе номер корзины.
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+										typename Method::Key key = state.getKey(key_columns, params.keys_size, i, key_sizes, keys, *pool);
-												dbms: development of memory efficient distributed aggregation method [#METR-17536].

											
										
										
											2015-09-07 07:40:14 +00:00
 										auto hash = method.data.hash(key);
 										auto bucket = method.data.getBucketFromHash(hash);
 										/// Этот ключ нам больше не нужен.
 										method.onExistingKey(key, keys, *pool);
-												dbms: fixed error [#METR-17536].

											
										
										
											2015-09-10 01:58:37 +00:00
+										auto & filter = filters[bucket];
 										if (unlikely(filter.empty()))
 											filter.resize_fill(rows);
 										filter[i] = 1;
 									}
-												dbms: fixed excessive memory allocation when splitting single-level block in Aggregator [#METR-17000].

											
										
										
											2015-12-05 07:01:18 +00:00
+									ssize_t size_hint = ((source.rowsInFirstColumn() + method.data.NUM_BUCKETS - 1)
 										/ method.data.NUM_BUCKETS) * 1.1;	/// Число 1.1 выбрано наугад.
-												dbms: fixed error [#METR-17536].

											
										
										
											2015-09-10 01:58:37 +00:00
+									for (size_t bucket = 0, size = destinations.size(); bucket < size; ++bucket)
 									{
 										const auto & filter = filters[bucket];
 										if (filter.empty())
 											continue;
-												dbms: development of memory efficient distributed aggregation method [#METR-17536].

											
										
										
											2015-09-07 07:40:14 +00:00
+										Block & dst = destinations[bucket];
-												dbms: fixed error [#METR-17536].

											
										
										
											2015-09-10 01:58:37 +00:00
+										dst.info.bucket_num = bucket;
-												dbms: development of memory efficient distributed aggregation method [#METR-17536].

											
										
										
											2015-09-07 07:40:14 +00:00
 										for (size_t j = 0; j < columns; ++j)
-												dbms: fixed error [#METR-17536].

											
										
										
											2015-09-10 01:58:37 +00:00
+										{
 											const ColumnWithTypeAndName & src_col = source.unsafeGetByPosition(j);
-												dbms: fixed excessive memory allocation when splitting single-level block in Aggregator [#METR-17000].

											
										
										
											2015-12-05 07:01:18 +00:00
+											dst.insert({src_col.column->filter(filter, size_hint), src_col.type, src_col.name});
-												dbms: fixed error [#METR-17536].

											
										
										
											2015-09-10 01:58:37 +00:00
 											/** Вставленные в блок столбцы типа ColumnAggregateFunction будут владеть состояниями агрегатных функций
-												Get rid of Poco::SharedPtr [#METR-21503].

											
										
										
											2016-05-28 17:31:50 +00:00
+											  *  путём удержания shared_ptr-а на исходный столбец. См. ColumnAggregateFunction.h
-												dbms: fixed error [#METR-17536].

											
										
										
											2015-09-10 01:58:37 +00:00
+											  */
 										}
-												dbms: development of memory efficient distributed aggregation method [#METR-17536].

											
										
										
											2015-09-07 07:40:14 +00:00
+									}
 								}
 								std::vector<Block> Aggregator::convertBlockToTwoLevel(const Block & block)
 								{
 									if (!block)
 										return {};
-												dbms: fixed error in memory-efficient merging of aggregated states [#METR-17000].

											
										
										
											2015-12-09 02:56:18 +00:00
+									initialize({});
 									setSampleBlock(block);
-												dbms: fixed error [#METR-17536].

											
										
										
											2015-09-08 20:19:30 +00:00
-												dbms: development of memory efficient distributed aggregation method [#METR-17536].

											
										
										
											2015-09-07 07:40:14 +00:00
+									AggregatedDataVariants data;
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+									StringRefs key(params.keys_size);
 									ConstColumnPlainPtrs key_columns(params.keys_size);
-												dbms: development of memory efficient distributed aggregation method [#METR-17536].

											
										
										
											2015-09-07 07:40:14 +00:00
+									Sizes key_sizes;
 									/// Запоминаем столбцы, с которыми будем работать
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+									for (size_t i = 0; i < params.keys_size; ++i)
-												Using std::shared_ptr for columns [#METR-21503].

											
										
										
											2016-05-28 05:31:36 +00:00
+										key_columns[i] = block.getByPosition(i).column.get();
-												dbms: development of memory efficient distributed aggregation method [#METR-17536].

											
										
										
											2015-09-07 07:40:14 +00:00
 									AggregatedDataVariants::Type type = chooseAggregationMethod(key_columns, key_sizes);
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+									data.keys_size = params.keys_size;
-												dbms: fixed error [#METR-17536].

											
										
										
											2015-09-09 21:32:29 +00:00
+									data.key_sizes = key_sizes;
-												dbms: development of memory efficient distributed aggregation method [#METR-17536].

											
										
										
											2015-09-07 07:40:14 +00:00
 								#define M(NAME) \
 									else if (type == AggregatedDataVariants::Type::NAME) \
 										type = AggregatedDataVariants::Type::NAME ## _two_level;
 									if (false) {}
 									APPLY_FOR_VARIANTS_CONVERTIBLE_TO_TWO_LEVEL(M)
 								#undef M
 									else
 										throw Exception("Unknown aggregated data variant.", ErrorCodes::UNKNOWN_AGGREGATED_DATA_VARIANT);
 									data.init(type);
 									size_t num_buckets = 0;
 								#define M(NAME) \
 									else if (data.type == AggregatedDataVariants::Type::NAME) \
 										num_buckets = data.NAME->data.NUM_BUCKETS;
 									if (false) {}
 									APPLY_FOR_VARIANTS_TWO_LEVEL(M)
 								#undef M
 									else
 										throw Exception("Unknown aggregated data variant.", ErrorCodes::UNKNOWN_AGGREGATED_DATA_VARIANT);
 									std::vector<Block> splitted_blocks(num_buckets);
 								#define M(NAME) \
 									else if (data.type == AggregatedDataVariants::Type::NAME) \
 										convertBlockToTwoLevelImpl(*data.NAME, data.aggregates_pool, \
 											key_columns, data.key_sizes, key, block, splitted_blocks);
 									if (false) {}
 									APPLY_FOR_VARIANTS_TWO_LEVEL(M)
 								#undef M
 									else
 										throw Exception("Unknown aggregated data variant.", ErrorCodes::UNKNOWN_AGGREGATED_DATA_VARIANT);
 									return splitted_blocks;
 								}
-												dbms: fixed errors [#METR-17000].

											
										
										
											2015-12-06 19:42:28 +00:00
+								template <typename Method, typename Table>
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
+								void NO_INLINE Aggregator::destroyImpl(
-												dbms: fixed errors [#METR-17000].

											
										
										
											2015-12-06 19:42:28 +00:00
+									Method & method,
-												dbms: better [#METR-19278].

											
										
										
											2015-12-23 07:03:50 +00:00
+									Table & table) const
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
+								{
-												dbms: better [#METR-19278].

											
										
										
											2015-12-23 07:03:50 +00:00
+									for (auto elem : table)
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
+									{
-												dbms: fixed another error [#METR-19278].

											
										
										
											2015-12-23 05:06:32 +00:00
+										AggregateDataPtr & data = Method::getAggregateData(elem.second);
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
 										/** Если исключение (обычно нехватка памяти, кидается MemoryTracker-ом) возникло
 										  *  после вставки ключа в хэш-таблицу, но до создания всех состояний агрегатных функций,
 										  *  то data будет равен nullptr-у.
 										  */
 										if (nullptr == data)
 											continue;
-												dbms: development [#CONV-2944].



											
										
										
											2012-05-31 00:33:42 +00:00
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+										for (size_t i = 0; i < params.aggregates_size; ++i)
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-03 05:39:21 +00:00
+											if (!aggregate_functions[i]->isState())
 												aggregate_functions[i]->destroy(data + offsets_of_aggregate_states[i]);
-												dbms: fixed errors [#METR-17000].

											
										
										
											2015-12-06 19:42:28 +00:00
 										data = nullptr;
 									}
 								}
 								/** Destroys the aggregate function states stored in `result.without_key` and resets that pointer to nullptr.
 								  * Does nothing if the pointer is already nullptr.
 								  * States of functions for which isState() returns true are not destroyed here.
 								  */
 								void Aggregator::destroyWithoutKey(AggregatedDataVariants & result) const
 								{
 									AggregatedDataWithoutKey & place = result.without_key;

 									if (nullptr == place)
 										return;

 									for (size_t i = 0; i < params.aggregates_size; ++i)
 									{
 										if (aggregate_functions[i]->isState())
 											continue;

 										aggregate_functions[i]->destroy(place + offsets_of_aggregate_states[i]);
 									}

 									place = nullptr;
 								}
-												dbms: fixed segfault in case of memory limit exceeded [#METR-11160].

											
										
										
											2014-05-19 19:41:56 +00:00
+								void Aggregator::destroyAllAggregateStates(AggregatedDataVariants & result)
-												dbms: fixed possible leak [#CONV-2944].



											
										
										
											2013-02-16 18:59:05 +00:00
+								{
 									if (result.size() == 0)
 										return;
-												dbms: merged convertToBlock and finalize aggregation steps whenever possible [#METR-2944].



											
										
										
											2013-11-03 23:35:18 +00:00
+									LOG_TRACE(log, "Destroying aggregate states");
-												dbms: fixed possible leak [#CONV-2944].



											
										
										
											2013-02-16 18:59:05 +00:00
 									/// В какой структуре данных агрегированы данные?
-												dbms: Aggregator: preparation [#METR-17000].

											
										
										
											2015-11-30 16:57:05 +00:00
+									if (result.type == AggregatedDataVariants::Type::without_key || params.overflow_row)
-												dbms: fixed errors [#METR-17000].

											
										
										
											2015-12-06 19:42:28 +00:00
+										destroyWithoutKey(result);
-												dbms: fixed possible leak [#CONV-2944].



											
										
										
											2013-02-16 18:59:05 +00:00
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2014-12-30 10:16:23 +00:00
+								#define M(NAME, IS_TWO_LEVEL) \
 									else if (result.type == AggregatedDataVariants::Type::NAME) \
-												dbms: fixed errors [#METR-17000].

											
										
										
											2015-12-06 19:42:28 +00:00
+										destroyImpl(*result.NAME, result.NAME->data);
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2014-12-30 10:16:23 +00:00
 									if (false) {}
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2015-01-02 03:16:28 +00:00
+									APPLY_FOR_AGGREGATED_VARIANTS(M)
-												dbms: more scalable aggregator: development [#METR-2944].

											
										
										
											2014-12-30 10:16:23 +00:00
+								#undef M
 									else if (result.type != AggregatedDataVariants::Type::without_key)
-												dbms: Aggregator: decomposed code to easier trying more aggregation methods; performance is suddenly improved up to 25%; fixed memory leak when exception while aggregating by KEYS_128 method [#METR-2944].

											
										
										
											2014-05-10 00:31:22 +00:00
+										throw Exception("Unknown aggregated data variant.", ErrorCodes::UNKNOWN_AGGREGATED_DATA_VARIANT);
-												dbms: fixed possible leak [#CONV-2944].



											
										
										
											2013-02-16 18:59:05 +00:00
+								}
-												dbms: development of multi-queries [#CONV-2944].



											
										
										
											2013-05-03 10:20:53 +00:00
 								/** Builds a textual identifier of the aggregator from its parameters.
 								  *
 								  * The string lists the key positions (or the key names when no positions are set),
 								  *  followed by the column names of the aggregates, all separated by ", ".
 								  */
 								String Aggregator::getID() const
 								{
 									std::stringstream id;

 									if (!params.keys.empty())
 									{
 										id << "keys";
 										for (const auto & key_position : params.keys)
 											id << ", " << key_position;
 									}
 									else
 									{
 										id << "key_names";
 										for (const auto & key_name : params.key_names)
 											id << ", " << key_name;
 									}

 									id << ", aggregates";
 									for (size_t i = 0; i < params.aggregates_size; ++i)
 										id << ", " << params.aggregates[i].column_name;

 									return id.str();
 								}
-												Merge

											
										
										
											2015-04-16 14:27:56 +00:00
+								void Aggregator::setCancellationHook(const CancellationHook cancellation_hook)
 								{
 									isCancelled = cancellation_hook;
 								}
-												dbms: added memory-efficient mode of distributed aggregation [#METR-17536].

											
										
										
											2015-07-30 23:41:02 +00:00
-												dbms: development.



											
										
										
											2011-09-19 01:42:16 +00:00
+								}