#include #include #include #include namespace DB { Block MergeSortingBlockInputStream::readImpl() { /** Достаточно простой алгоритм: * - прочитать в оперативку все блоки; * - объединить их всех; */ if (has_been_read) return Block(); has_been_read = true; Blocks blocks; while (Block block = children.back()->read()) blocks.push_back(block); if (isCancelled()) return Block(); return merge(blocks); } Block MergeSortingBlockInputStream::merge(Blocks & blocks) { if (blocks.empty()) return Block(); if (blocks.size() == 1) return blocks[0]; Stopwatch watch; LOG_DEBUG(log, "Merge sorting"); CursorImpls cursors(blocks.size()); bool has_collation = false; size_t i = 0; for (Blocks::const_iterator it = blocks.begin(); it != blocks.end(); ++it, ++i) { if (!*it) continue; cursors[i] = SortCursorImpl(*it, description); has_collation |= cursors[i].has_collation; } Block merged; if (has_collation) merged = mergeImpl(blocks, cursors); else merged = mergeImpl(blocks, cursors); LOG_DEBUG(log, std::fixed << std::setprecision(2) << "Merge sorted " << blocks.size() << " blocks, " << merged.rows() << " rows" << " in " << watch.elapsedSeconds() << " sec., " << merged.rows() / watch.elapsedSeconds() << " rows/sec., " << merged.bytes() / 1000000.0 / watch.elapsedSeconds() << " MiB/sec."); return merged; } template Block MergeSortingBlockInputStream::mergeImpl(Blocks & blocks, CursorImpls & cursors) { Block merged = blocks[0].cloneEmpty(); size_t num_columns = blocks[0].columns(); typedef std::priority_queue Queue; Queue queue; for (size_t i = 0; i < cursors.size(); ++i) queue.push(TSortCursor(&cursors[i])); ColumnPlainPtrs merged_columns; for (size_t i = 0; i < num_columns; ++i) merged_columns.push_back(&*merged.getByPosition(i).column); /// Вынимаем строки в нужном порядке и кладём в merged. while (!queue.empty()) { TSortCursor current = queue.top(); queue.pop(); for (size_t i = 0; i < num_columns; ++i) merged_columns[i]->insertFrom(*current->all_columns[i], current->pos); if (!current->isLast()) { current->next(); queue.push(current); } } return merged; } }