ClickHouse/src/Common/ProgressIndication.cpp

263 lines
8.8 KiB
C++
Raw Normal View History

#include "ProgressIndication.h"
2021-09-15 15:45:43 +00:00
#include <cstddef>
#include <numeric>
#include <cmath>
#include <IO/WriteBufferFromFileDescriptor.h>
#include <base/types.h>
#include <Common/TerminalSize.h>
#include <Common/UnicodeBar.h>
#include "IO/WriteBufferFromString.h"
#include <Databases/DatabaseMemory.h>
2021-09-15 15:45:43 +00:00
namespace
{
/// Typed zero. It is used both as the UInt64 initial value for std::accumulate calls in this file
/// and as the map key under which calculateNewCoresNumber looks up the entry whose time()
/// gives the elapsed interval.
constexpr UInt64 ZERO = 0;
2021-09-17 15:00:13 +00:00
/// Estimates the number of busy cores between two snapshots of per-thread times.
///
/// The entry stored under key ZERO is treated specially: the difference of its time() between
/// `next` and `prev` is the length of the interval. For every other entry of `next`, the time
/// gained since `prev` (or its whole time, when the key is absent from `prev`) is summed up.
/// The sum is divided by the interval length, rounding up.
///
/// Returns ZERO when `next` has no ZERO entry or when the interval length is zero.
UInt64 calculateNewCoresNumber(DB::ThreadIdToTimeMap const & prev, DB::ThreadIdToTimeMap const& next)
{
    const auto next_total = next.find(ZERO);
    if (next_total == next.end())
        return ZERO;

    UInt64 busy_time = ZERO;
    for (auto const & [thread_id, times] : next)
    {
        /// The ZERO entry carries the interval itself, not the time of a thread.
        if (thread_id == ZERO)
            continue;

        auto delta = times.time();
        if (const auto before = prev.find(thread_id); before != prev.end())
            delta -= before->second.time();
        busy_time += delta;
    }

    const auto prev_total = prev.find(ZERO);
    const UInt64 interval_start = prev_total != prev.end() ? prev_total->second.time() : ZERO;
    const auto interval = next_total->second.time() - interval_start;
    if (interval == ZERO)
        return ZERO;

    /// Division rounded up.
    return (busy_time + interval - 1) / interval;
}
2021-09-15 15:45:43 +00:00
}
namespace DB
{
2021-04-17 22:02:06 +00:00
bool ProgressIndication::updateProgress(const Progress & value)
{
2021-04-16 14:37:46 +00:00
return progress.incrementPiecewiseAtomically(value);
}
/// Erases the progress line if one has been written.
/// Does nothing while written_progress_chars is zero; otherwise resets that counter and sends
/// a carriage return followed by CLEAR_TO_END_OF_LINE to std::cerr.
void ProgressIndication::clearProgressOutput()
{
    if (!written_progress_chars)
        return;

    written_progress_chars = 0;
    std::cerr << "\r" CLEAR_TO_END_OF_LINE;
}
void ProgressIndication::resetProgress()
2021-04-17 13:26:58 +00:00
{
watch.restart();
progress.reset();
show_progress_bar = false;
written_progress_chars = 0;
2021-05-14 08:35:51 +00:00
write_progress_on_update = false;
2021-09-17 15:00:13 +00:00
host_active_cores.clear();
2021-09-17 16:47:54 +00:00
thread_data.clear();
}
/// Stores `write_progress_on_update_` and installs a file-progress callback on `context`.
///
/// The callback converts each FileProgress to Progress and adds it to `progress`;
/// if write_progress_on_update is set at the time of the call, it also calls writeProgress().
/// The callback captures `this`, so it must not be invoked after this object is destroyed.
void ProgressIndication::setFileProgressCallback(ContextMutablePtr context, bool write_progress_on_update_)
{
    write_progress_on_update = write_progress_on_update_;

    context->setFileProgressCallback([this](const FileProgress & file_progress)
    {
        progress.incrementPiecewiseAtomically(Progress(file_progress));
        if (!write_progress_on_update)
            return;
        writeProgress();
    });
}
2021-09-15 15:45:43 +00:00
/// Makes sure `thread_id` has an entry in the thread map of `host`.
/// An existing entry is left untouched; a missing one is set to a value-initialized record.
void ProgressIndication::addThreadIdToList(String const & host, UInt64 thread_id)
{
    auto & host_threads = thread_data[host];
    if (!host_threads.contains(thread_id))
        host_threads[thread_id] = {};
}
2021-09-17 16:47:54 +00:00
/// Replaces the stored per-host thread data with `new_thread_data` and refreshes
/// the per-host core estimate.
///
/// For every host in `new_thread_data` the core estimate is computed by calculateNewCoresNumber
/// from the previously stored map and the new one. The new map is then moved into thread_data,
/// so the mapped values of `new_thread_data` are left in a moved-from state.
void ProgressIndication::updateThreadEventData(HostToThreadTimesMap & new_thread_data)
{
    for (auto & [host, fresh_times] : new_thread_data)
    {
        auto & stored_times = thread_data[host];
        host_active_cores[host] = calculateNewCoresNumber(stored_times, fresh_times);
        stored_times = std::move(fresh_times);
    }
}
2021-09-15 15:45:43 +00:00
size_t ProgressIndication::getUsedThreadsCount() const
{
2021-09-17 16:47:54 +00:00
return std::accumulate(thread_data.cbegin(), thread_data.cend(), 0,
2021-09-15 15:45:43 +00:00
[] (size_t acc, auto const & threads)
{
return acc + threads.second.size();
});
}
2021-09-15 15:45:43 +00:00
/// Returns the sum of the per-host core estimates stored in host_active_cores.
UInt64 ProgressIndication::getApproximateCoresNumber() const
{
    UInt64 total_cores = ZERO;
    for (auto const & host_and_cores : host_active_cores)
        total_cores += host_and_cores.second;
    return total_cores;
}
2021-09-17 16:47:54 +00:00
/// Returns the sum of memory_usage over every entry of every per-host map in thread_data.
UInt64 ProgressIndication::getMemoryUsage() const
{
    UInt64 total_memory = ZERO;
    for (auto const & host_data : thread_data)
    {
        /// Sum one host first, then add it to the overall total.
        UInt64 host_memory = ZERO;
        for (auto const & thread_entry : host_data.second)
            host_memory += thread_entry.second.memory_usage;
        total_memory += host_memory;
    }
    return total_memory;
}
/// Prints a one-line summary of the processed rows and bytes to std::cout.
/// Nothing is printed when fewer than 1000 rows were read. Per-second rates are appended
/// only when the stopwatch reports a non-zero elapsed time; otherwise ". " is written.
void ProgressIndication::writeFinalProgress()
{
    if (progress.read_rows < 1000)
        return;

    std::cout << "Processed " << formatReadableQuantity(progress.read_rows) << " rows, ";
    std::cout << formatReadableSizeWithDecimalSuffix(progress.read_bytes);

    const size_t elapsed_ns = watch.elapsed();
    if (!elapsed_ns)
    {
        std::cout << ". ";
        return;
    }

    std::cout << " (" << formatReadableQuantity(progress.read_rows * 1000000000.0 / elapsed_ns) << " rows/s., ";
    std::cout << formatReadableSizeWithDecimalSuffix(progress.read_bytes * 1000000000.0 / elapsed_ns) << "/s.)";
}
/// Renders one progress line and writes it to stderr.
///
/// The line consists of a rotating coloured indicator, the number of rows and bytes read so far,
/// optional per-second rates, an optional progress bar with a percentage, and an optional
/// hardware utilization message. Everything is collected in a single buffer and emitted at the end.
///
/// Member state touched: reads `progress`, `watch`, `print_hardware_utilization`;
/// updates `written_progress_chars` and may set `show_progress_bar`.
void ProgressIndication::writeProgress()
{
/// Output all progress bar commands to stderr at once to avoid flicker.
WriteBufferFromFileDescriptor message(STDERR_FILENO, 1024);
/// Call counter shared by all invocations (function-local static); it selects the indicator below.
static size_t increment = 0;
/// Eight arrows, each wrapped in an escape sequence that sets its colour and resets it afterwards.
static const char * indicators[8] = {
"\033[1;30m→\033[0m",
"\033[1;31m↘\033[0m",
"\033[1;32m↓\033[0m",
"\033[1;33m↙\033[0m",
"\033[1;34m←\033[0m",
"\033[1;35m↖\033[0m",
"\033[1;36m↑\033[0m",
"\033[1m↗\033[0m",
};
const char * indicator = indicators[increment % 8];
size_t terminal_width = getTerminalWidth();
if (!written_progress_chars)
{
/// If the current line is not empty, the progress must be output on the next line.
/// The trick is found here: https://www.vidarholen.net/contents/blog/?p=878
message << std::string(terminal_width, ' ');
}
message << '\r';
/// Remember how much was written before the visible text, so it can be excluded from the width below.
size_t prefix_size = message.count();
/// Prefer the raw byte counter when it is non-zero.
size_t read_bytes = progress.read_raw_bytes ? progress.read_raw_bytes : progress.read_bytes;
message << indicator << " Progress: ";
message
<< formatReadableQuantity(progress.read_rows) << " rows, "
<< formatReadableSizeWithDecimalSuffix(read_bytes);
auto elapsed_ns = watch.elapsed();
/// Rates are shown only for a non-zero elapsed time, which also avoids dividing by zero.
if (elapsed_ns)
message << " ("
<< formatReadableQuantity(progress.read_rows * 1000000000.0 / elapsed_ns) << " rows/s., "
<< formatReadableSizeWithDecimalSuffix(read_bytes * 1000000000.0 / elapsed_ns) << "/s.) ";
else
message << ". ";
/// NOTE(review): this leaves 2 of the indicator's bytes counted towards the width - confirm that matches the intended number of visible columns.
written_progress_chars = message.count() - prefix_size - (strlen(indicator) - 2); /// Don't count invisible output (escape sequences).
// If approximate cores number is known, display it.
auto cores_number = getApproximateCoresNumber();
/// Stays empty unless a core estimate exists and print_hardware_utilization is set.
std::string profiling_msg;
if (cores_number != 0 && print_hardware_utilization)
{
WriteBufferFromOwnString profiling_msg_builder;
// Calculated cores number may be not accurate
// so it's better to print min(threads, cores).
UInt64 threads_number = getUsedThreadsCount();
profiling_msg_builder << " Running " << threads_number << " threads on "
<< std::min(cores_number, threads_number) << " cores";
auto memory_usage = getMemoryUsage();
if (memory_usage != 0)
profiling_msg_builder << " with " << formatReadableSizeWithDecimalSuffix(memory_usage) << " RAM used.";
else
profiling_msg_builder << ".";
profiling_msg = profiling_msg_builder.str();
}
/// If the approximate number of rows to process is known, we can display a progress bar and percentage.
if (progress.total_rows_to_read || progress.total_raw_bytes_to_read)
{
/// Rows are used when the total number of rows is known, raw bytes otherwise.
/// max_count is at least the non-zero total selected here, so the division below cannot be by zero.
size_t current_count, max_count;
if (progress.total_rows_to_read)
{
current_count = progress.read_rows;
max_count = std::max(progress.read_rows, progress.total_rows_to_read);
}
else
{
current_count = progress.read_raw_bytes;
max_count = std::max(progress.read_raw_bytes, progress.total_raw_bytes_to_read);
}
/// To avoid flicker, display progress bar only if .5 seconds have passed since query execution start
/// and the query is less than halfway done.
if (elapsed_ns > 500000000)
{
/// Trigger to start displaying progress bar. If query is mostly done, don't display it.
/// The flag is only ever set here, never cleared in this function, so once shown the bar stays.
if (current_count * 2 < max_count)
show_progress_bar = true;
if (show_progress_bar)
{
/// Width left for the bar after the text already written, the percentage suffix and the profiling message.
ssize_t width_of_progress_bar = static_cast<ssize_t>(terminal_width) - written_progress_chars - strlen(" 99%") - profiling_msg.length();
if (width_of_progress_bar > 0)
{
std::string bar
= UnicodeBar::render(UnicodeBar::getWidth(current_count, 0, max_count, width_of_progress_bar));
message << "\033[0;32m" << bar << "\033[0m";
/// Pad with spaces when the rendered bar is shorter than the reserved width.
/// Presumably bar.size() / UNICODE_BAR_CHAR_SIZE converts the byte length into a character count - confirm.
if (width_of_progress_bar > static_cast<ssize_t>(bar.size() / UNICODE_BAR_CHAR_SIZE))
message << std::string(width_of_progress_bar - bar.size() / UNICODE_BAR_CHAR_SIZE, ' ');
}
}
}
/// Underestimate percentage a bit to avoid displaying 100%.
message << ' ' << (99 * current_count / max_count) << '%';
}
message << profiling_msg;
message << CLEAR_TO_END_OF_LINE;
++increment;
/// Presumably pushes the buffered line to the file descriptor - confirm against WriteBuffer::next().
message.next();
}
2021-04-17 22:02:06 +00:00
}