2020-10-10 18:23:54 +00:00
|
|
|
#include <Functions/FunctionFactory.h>
|
2021-05-17 07:30:42 +00:00
|
|
|
#include <Functions/IFunction.h>
|
2020-10-10 18:23:54 +00:00
|
|
|
#include <Functions/FunctionHelpers.h>
|
|
|
|
#include <Columns/ColumnString.h>
|
|
|
|
#include <Columns/ColumnVector.h>
|
2021-01-29 02:14:15 +00:00
|
|
|
#include <Common/NaNUtils.h>
|
2020-10-10 18:23:54 +00:00
|
|
|
#include <DataTypes/DataTypeString.h>
|
|
|
|
#include <IO/WriteBufferFromVector.h>
|
|
|
|
#include <IO/WriteHelpers.h>
|
|
|
|
|
|
|
|
|
|
|
|
namespace DB
|
|
|
|
{
|
|
|
|
|
|
|
|
namespace ErrorCodes
|
|
|
|
{
|
|
|
|
extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH;
|
|
|
|
extern const int ILLEGAL_TYPE_OF_ARGUMENT;
|
2020-10-10 22:03:03 +00:00
|
|
|
extern const int BAD_ARGUMENTS;
|
2020-10-10 18:23:54 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
namespace
|
|
|
|
{
|
|
|
|
|
2020-10-11 15:24:00 +00:00
|
|
|
/** Prints amount of seconds in form of:
|
|
|
|
* "1 year, 2 months, 12 days, 3 hours, 1 minute and 33 seconds".
|
|
|
|
* Maximum unit can be specified as a second argument: for example, you can specify "days",
|
|
|
|
* and it will avoid using years and months.
|
|
|
|
*
|
|
|
|
* The length of years and months (and even days in presence of time adjustments) are rough:
|
|
|
|
* year is just 365 days, month is 30.5 days, day is 86400 seconds.
|
|
|
|
*
|
|
|
|
* You may think that the choice of constants and the whole purpose of this function is very ignorant...
|
|
|
|
* And you're right. But actually it's made similar to a random Python library from the internet:
|
|
|
|
* https://github.com/jmoiron/humanize/blob/b37dc30ba61c2446eecb1a9d3e9ac8c9adf00f03/src/humanize/time.py#L462
|
|
|
|
*/
|
2020-10-10 18:23:54 +00:00
|
|
|
class FunctionFormatReadableTimeDelta : public IFunction
|
|
|
|
{
|
|
|
|
public:
|
|
|
|
static constexpr auto name = "formatReadableTimeDelta";
|
2021-06-01 12:20:52 +00:00
|
|
|
static FunctionPtr create(ContextPtr) { return std::make_shared<FunctionFormatReadableTimeDelta>(); }
|
2020-10-10 18:23:54 +00:00
|
|
|
|
|
|
|
String getName() const override { return name; }
|
|
|
|
|
|
|
|
bool isVariadic() const override { return true; }
|
|
|
|
|
2021-06-22 16:21:23 +00:00
|
|
|
bool isSuitableForShortCircuitArgumentsExecution(const DataTypesWithConstInfo & /*arguments*/) const override { return true; }
|
2021-04-29 14:48:26 +00:00
|
|
|
|
2020-10-10 18:23:54 +00:00
|
|
|
size_t getNumberOfArguments() const override { return 0; }
|
|
|
|
|
|
|
|
DataTypePtr getReturnTypeImpl(const DataTypes & arguments) const override
|
|
|
|
{
|
2020-10-11 19:43:04 +00:00
|
|
|
if (arguments.empty())
|
2023-01-23 21:13:58 +00:00
|
|
|
throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH,
|
|
|
|
"Number of arguments for function {} doesn't match: passed {}, should be at least 1.",
|
|
|
|
getName(), arguments.size());
|
2020-10-10 18:23:54 +00:00
|
|
|
|
|
|
|
if (arguments.size() > 2)
|
2023-01-23 21:13:58 +00:00
|
|
|
throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH,
|
|
|
|
"Number of arguments for function {} doesn't match: passed {}, should be at most 2.",
|
|
|
|
getName(), arguments.size());
|
2020-10-10 18:23:54 +00:00
|
|
|
|
|
|
|
const IDataType & type = *arguments[0];
|
|
|
|
|
|
|
|
if (!isNativeNumber(type))
|
2023-01-23 21:13:58 +00:00
|
|
|
throw Exception(ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT, "Cannot format {} as time delta", type.getName());
|
2020-10-10 18:23:54 +00:00
|
|
|
|
|
|
|
if (arguments.size() == 2)
|
|
|
|
{
|
|
|
|
const auto * maximum_unit_arg = arguments[1].get();
|
|
|
|
if (!isStringOrFixedString(maximum_unit_arg))
|
2023-01-23 21:13:58 +00:00
|
|
|
throw Exception(ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT, "Illegal type {} of argument maximum_unit of function {}",
|
|
|
|
maximum_unit_arg->getName(), getName());
|
2020-10-10 18:23:54 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
return std::make_shared<DataTypeString>();
|
|
|
|
}
|
|
|
|
|
|
|
|
ColumnNumbers getArgumentsThatAreAlwaysConstant() const override { return {1}; }
|
|
|
|
|
|
|
|
bool useDefaultImplementationForConstants() const override { return true; }
|
|
|
|
|
2020-10-10 22:03:03 +00:00
|
|
|
enum Unit
|
2020-10-10 18:23:54 +00:00
|
|
|
{
|
2020-10-10 22:03:03 +00:00
|
|
|
Seconds,
|
|
|
|
Minutes,
|
|
|
|
Hours,
|
|
|
|
Days,
|
|
|
|
Months,
|
|
|
|
Years
|
|
|
|
};
|
|
|
|
|
2020-11-17 13:24:45 +00:00
|
|
|
ColumnPtr executeImpl(const ColumnsWithTypeAndName & arguments, const DataTypePtr &, size_t input_rows_count) const override
|
2020-10-10 18:23:54 +00:00
|
|
|
{
|
2022-07-18 17:31:34 +00:00
|
|
|
std::string_view maximum_unit_str;
|
2020-10-14 12:51:53 +00:00
|
|
|
if (arguments.size() == 2)
|
2020-10-10 18:23:54 +00:00
|
|
|
{
|
2020-10-17 21:41:50 +00:00
|
|
|
const ColumnPtr & maximum_unit_column = arguments[1].column;
|
2020-10-10 22:03:03 +00:00
|
|
|
const ColumnConst * maximum_unit_const_col = checkAndGetColumnConstStringOrFixedString(maximum_unit_column.get());
|
|
|
|
if (maximum_unit_const_col)
|
2022-07-18 17:31:34 +00:00
|
|
|
maximum_unit_str = maximum_unit_const_col->getDataColumn().getDataAt(0).toView();
|
2020-10-10 18:23:54 +00:00
|
|
|
}
|
2020-10-10 22:03:03 +00:00
|
|
|
|
|
|
|
Unit max_unit;
|
2020-10-11 15:24:00 +00:00
|
|
|
|
|
|
|
/// Default means "use all available units".
|
2022-07-18 17:31:34 +00:00
|
|
|
if (maximum_unit_str.empty() || maximum_unit_str == "years")
|
2020-10-10 22:03:03 +00:00
|
|
|
max_unit = Years;
|
|
|
|
else if (maximum_unit_str == "months")
|
|
|
|
max_unit = Months;
|
|
|
|
else if (maximum_unit_str == "days")
|
|
|
|
max_unit = Days;
|
|
|
|
else if (maximum_unit_str == "hours")
|
|
|
|
max_unit = Hours;
|
|
|
|
else if (maximum_unit_str == "minutes")
|
|
|
|
max_unit = Minutes;
|
|
|
|
else if (maximum_unit_str == "seconds")
|
|
|
|
max_unit = Seconds;
|
2020-10-10 18:23:54 +00:00
|
|
|
else
|
2020-10-10 22:03:03 +00:00
|
|
|
throw Exception(ErrorCodes::BAD_ARGUMENTS,
|
|
|
|
"Unexpected value of maximum unit argument ({}) for function {}, the only allowed values are:"
|
|
|
|
" 'seconds', 'minutes', 'hours', 'days', 'months', 'years'.",
|
2022-07-19 11:17:33 +00:00
|
|
|
maximum_unit_str, getName());
|
2020-10-10 22:03:03 +00:00
|
|
|
|
|
|
|
auto col_to = ColumnString::create();
|
|
|
|
|
|
|
|
ColumnString::Chars & data_to = col_to->getChars();
|
|
|
|
ColumnString::Offsets & offsets_to = col_to->getOffsets();
|
|
|
|
offsets_to.resize(input_rows_count);
|
|
|
|
|
|
|
|
WriteBufferFromVector<ColumnString::Chars> buf_to(data_to);
|
|
|
|
|
|
|
|
for (size_t i = 0; i < input_rows_count; ++i)
|
2020-10-10 18:23:54 +00:00
|
|
|
{
|
2020-10-27 11:04:03 +00:00
|
|
|
/// Virtual call is Ok (negligible comparing to the rest of calculations).
|
2020-10-17 21:41:50 +00:00
|
|
|
Float64 value = arguments[0].column->getFloat64(i);
|
2020-10-11 15:24:00 +00:00
|
|
|
|
2021-01-29 02:14:15 +00:00
|
|
|
if (!isFinite(value))
|
2020-10-10 18:23:54 +00:00
|
|
|
{
|
2021-01-29 02:14:15 +00:00
|
|
|
/// Cannot decide what unit it is (years, month), just simply write inf or nan.
|
|
|
|
writeFloatText(value, buf_to);
|
2020-10-10 18:23:54 +00:00
|
|
|
}
|
2021-01-29 02:14:15 +00:00
|
|
|
else
|
2020-10-10 18:23:54 +00:00
|
|
|
{
|
2021-01-29 02:14:15 +00:00
|
|
|
bool is_negative = value < 0;
|
|
|
|
if (is_negative)
|
|
|
|
{
|
|
|
|
writeChar('-', buf_to);
|
|
|
|
value = -value;
|
|
|
|
}
|
|
|
|
|
|
|
|
/// To output separators between parts: ", " and " and ".
|
|
|
|
bool has_output = false;
|
|
|
|
|
|
|
|
switch (max_unit) /// A kind of Duff Device.
|
|
|
|
{
|
|
|
|
case Years: processUnit(365 * 24 * 3600, " year", 5, value, buf_to, has_output); [[fallthrough]];
|
2022-09-11 02:49:43 +00:00
|
|
|
case Months: processUnit(static_cast<UInt64>(30.5 * 24 * 3600), " month", 6, value, buf_to, has_output); [[fallthrough]];
|
2021-01-29 02:14:15 +00:00
|
|
|
case Days: processUnit(24 * 3600, " day", 4, value, buf_to, has_output); [[fallthrough]];
|
|
|
|
case Hours: processUnit(3600, " hour", 5, value, buf_to, has_output); [[fallthrough]];
|
|
|
|
case Minutes: processUnit(60, " minute", 7, value, buf_to, has_output); [[fallthrough]];
|
|
|
|
case Seconds: processUnit(1, " second", 7, value, buf_to, has_output);
|
|
|
|
}
|
2020-10-10 18:23:54 +00:00
|
|
|
}
|
2020-10-10 22:03:03 +00:00
|
|
|
|
|
|
|
writeChar(0, buf_to);
|
|
|
|
offsets_to[i] = buf_to.count();
|
2020-10-10 18:23:54 +00:00
|
|
|
}
|
|
|
|
|
2020-10-10 22:03:03 +00:00
|
|
|
buf_to.finalize();
|
2020-10-17 21:41:50 +00:00
|
|
|
return col_to;
|
2020-10-10 18:23:54 +00:00
|
|
|
}
|
|
|
|
|
2020-10-10 22:03:03 +00:00
|
|
|
static void processUnit(
|
|
|
|
UInt64 unit_size, const char * unit_name, size_t unit_name_size,
|
|
|
|
Float64 & value, WriteBuffer & buf_to, bool & has_output)
|
2020-10-10 18:23:54 +00:00
|
|
|
{
|
2020-10-10 22:03:03 +00:00
|
|
|
if (unlikely(value + 1.0 == value))
|
2020-10-10 18:23:54 +00:00
|
|
|
{
|
2020-10-11 15:24:00 +00:00
|
|
|
/// The case when value is too large so exact representation for subsequent smaller units is not possible.
|
2020-10-10 22:03:03 +00:00
|
|
|
writeText(std::floor(value / unit_size), buf_to);
|
|
|
|
buf_to.write(unit_name, unit_name_size);
|
|
|
|
writeChar('s', buf_to);
|
|
|
|
has_output = true;
|
|
|
|
value = 0;
|
|
|
|
return;
|
2020-10-10 18:23:54 +00:00
|
|
|
}
|
|
|
|
|
2022-09-11 03:38:59 +00:00
|
|
|
UInt64 num_units = static_cast<UInt64>(value / unit_size);
|
2020-10-10 22:03:03 +00:00
|
|
|
|
|
|
|
if (!num_units)
|
2020-10-10 18:23:54 +00:00
|
|
|
{
|
2020-10-11 15:24:00 +00:00
|
|
|
/// Zero units, no need to print. But if it's the last (seconds) and the only unit, print "0 seconds" nevertheless.
|
2020-10-10 22:03:03 +00:00
|
|
|
if (unit_size > 1 || has_output)
|
|
|
|
return;
|
|
|
|
}
|
2020-10-10 18:23:54 +00:00
|
|
|
|
2020-10-11 15:24:00 +00:00
|
|
|
/// Remaining value to print on next iteration.
|
2020-10-10 22:03:03 +00:00
|
|
|
value -= num_units * unit_size;
|
2020-10-10 18:23:54 +00:00
|
|
|
|
2020-10-10 22:03:03 +00:00
|
|
|
if (has_output)
|
|
|
|
{
|
2020-10-11 15:24:00 +00:00
|
|
|
/// Need delimiter between values. The last delimiter is " and ", all previous are comma.
|
2020-10-10 22:03:03 +00:00
|
|
|
if (value < 1)
|
|
|
|
writeCString(" and ", buf_to);
|
|
|
|
else
|
|
|
|
writeCString(", ", buf_to);
|
|
|
|
}
|
2020-10-10 18:23:54 +00:00
|
|
|
|
2020-10-10 22:03:03 +00:00
|
|
|
writeText(num_units, buf_to);
|
2020-10-11 15:24:00 +00:00
|
|
|
buf_to.write(unit_name, unit_name_size); /// If we just leave strlen(unit_name) here, clang-11 fails to make it compile-time.
|
|
|
|
|
|
|
|
/// How to pronounce: unit vs. units.
|
2020-10-10 22:03:03 +00:00
|
|
|
if (num_units != 1)
|
|
|
|
writeChar('s', buf_to);
|
2020-10-10 18:23:54 +00:00
|
|
|
|
2020-10-10 22:03:03 +00:00
|
|
|
has_output = true;
|
2020-10-10 18:23:54 +00:00
|
|
|
}
|
|
|
|
};
|
|
|
|
|
|
|
|
}
|
|
|
|
|
2022-07-04 07:01:39 +00:00
|
|
|
REGISTER_FUNCTION(FormatReadableTimeDelta)
|
2020-10-10 18:23:54 +00:00
|
|
|
{
|
|
|
|
factory.registerFunction<FunctionFormatReadableTimeDelta>();
|
|
|
|
}
|
|
|
|
|
|
|
|
}
|