2021-06-01 03:01:35 +00:00
|
|
|
#include <numeric>
|
|
|
|
|
|
|
|
#include <Columns/ColumnsNumber.h>
|
2022-10-19 09:13:02 +00:00
|
|
|
#include <Columns/ColumnsDateTime.h>
|
2021-06-01 03:01:35 +00:00
|
|
|
#include <Columns/ColumnTuple.h>
|
|
|
|
#include <DataTypes/DataTypeDate.h>
|
|
|
|
#include <DataTypes/DataTypeDateTime.h>
|
|
|
|
#include <DataTypes/DataTypesNumber.h>
|
|
|
|
#include <DataTypes/DataTypeTuple.h>
|
|
|
|
#include <Functions/extractTimeZoneFromFunctionArguments.h>
|
2020-01-14 03:08:54 +00:00
|
|
|
#include <Functions/FunctionFactory.h>
|
2021-06-01 03:01:35 +00:00
|
|
|
#include <Functions/FunctionHelpers.h>
|
2021-12-10 09:43:44 +00:00
|
|
|
#include <Functions/FunctionsTimeWindow.h>
|
2020-01-14 03:08:54 +00:00
|
|
|
|
2024-02-27 13:37:21 +00:00
|
|
|
|
2020-01-14 03:08:54 +00:00
|
|
|
namespace DB
|
|
|
|
{
|
2021-06-01 03:01:35 +00:00
|
|
|
|
2021-06-02 01:52:54 +00:00
|
|
|
namespace ErrorCodes
|
|
|
|
{
|
|
|
|
extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH;
|
|
|
|
extern const int ILLEGAL_COLUMN;
|
|
|
|
extern const int ILLEGAL_TYPE_OF_ARGUMENT;
|
|
|
|
extern const int ARGUMENT_OUT_OF_BOUND;
|
2022-02-09 07:28:15 +00:00
|
|
|
extern const int SYNTAX_ERROR;
|
2024-03-18 11:40:49 +00:00
|
|
|
extern const int BAD_ARGUMENTS;
|
2021-06-02 01:52:54 +00:00
|
|
|
}
|
|
|
|
|
2021-06-01 03:01:35 +00:00
|
|
|
namespace
|
|
|
|
{
|
|
|
|
|
2024-03-18 11:26:05 +00:00
|
|
|
std::tuple<IntervalKind::Kind, Int64>
|
|
|
|
dispatchForIntervalColumns(const ColumnWithTypeAndName & interval_column, const String & function_name)
|
|
|
|
{
|
|
|
|
const auto * interval_type = checkAndGetDataType<DataTypeInterval>(interval_column.type.get());
|
|
|
|
if (!interval_type)
|
|
|
|
throw Exception(ErrorCodes::ILLEGAL_COLUMN, "Illegal column {} of argument of function {}",
|
|
|
|
interval_column.name, function_name);
|
|
|
|
const auto * interval_column_const_int64 = checkAndGetColumnConst<ColumnInt64>(interval_column.column.get());
|
|
|
|
if (!interval_column_const_int64)
|
|
|
|
throw Exception(ErrorCodes::ILLEGAL_COLUMN, "Illegal column {} of argument of function {}",
|
|
|
|
interval_column.name, function_name);
|
|
|
|
Int64 num_units = interval_column_const_int64->getValue<Int64>();
|
|
|
|
if (num_units <= 0)
|
|
|
|
throw Exception(ErrorCodes::ARGUMENT_OUT_OF_BOUND, "Value for column {} of function {} must be positive",
|
|
|
|
interval_column.name, function_name);
|
|
|
|
|
|
|
|
return {interval_type->getKind(), num_units};
|
|
|
|
}
|
|
|
|
|
2024-03-18 11:58:03 +00:00
|
|
|
ColumnPtr executeWindowBound(const ColumnPtr & column, size_t index, const String & function_name)
|
2024-03-18 11:26:05 +00:00
|
|
|
{
|
2024-03-18 11:58:03 +00:00
|
|
|
chassert(index == 0 || index == 1);
|
2024-03-18 11:26:05 +00:00
|
|
|
if (const ColumnTuple * col_tuple = checkAndGetColumn<ColumnTuple>(column.get()); col_tuple)
|
2021-06-01 03:01:35 +00:00
|
|
|
{
|
2024-03-18 11:58:03 +00:00
|
|
|
if (index >= col_tuple->tupleSize() || !checkColumn<ColumnVector<UInt32>>(*col_tuple->getColumnPtr(index)))
|
2023-01-23 21:13:58 +00:00
|
|
|
throw Exception(ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT, "Illegal column for first argument of function {}. "
|
2024-03-18 11:26:05 +00:00
|
|
|
"Must be a Tuple(DataTime, DataTime)", function_name);
|
|
|
|
return col_tuple->getColumnPtr(index);
|
2021-06-01 03:01:35 +00:00
|
|
|
}
|
2024-03-18 11:26:05 +00:00
|
|
|
else
|
2021-06-01 03:01:35 +00:00
|
|
|
{
|
2024-03-18 11:26:05 +00:00
|
|
|
throw Exception(ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT, "Illegal column for first argument of function {}. "
|
|
|
|
"Must be Tuple", function_name);
|
2021-06-01 03:01:35 +00:00
|
|
|
}
|
2024-03-18 11:26:05 +00:00
|
|
|
}
|
2021-06-01 03:01:35 +00:00
|
|
|
|
2024-03-18 11:26:05 +00:00
|
|
|
void checkFirstArgument(const ColumnWithTypeAndName & argument, const String & function_name)
|
|
|
|
{
|
|
|
|
if (!isDateTime(argument.type))
|
|
|
|
throw Exception(ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT, "Illegal type {} of argument of function {}. "
|
|
|
|
"Should be a date with time", argument.type->getName(), function_name);
|
|
|
|
}
|
2021-06-01 03:01:35 +00:00
|
|
|
|
2024-03-18 11:26:05 +00:00
|
|
|
void checkIntervalArgument(const ColumnWithTypeAndName & argument, const String & function_name, IntervalKind & interval_kind, bool & result_type_is_date)
|
|
|
|
{
|
|
|
|
const auto * interval_type = checkAndGetDataType<DataTypeInterval>(argument.type.get());
|
|
|
|
if (!interval_type)
|
|
|
|
throw Exception(ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT, "Illegal type {} of argument of function {}. "
|
|
|
|
"Should be an interval of time", argument.type->getName(), function_name);
|
|
|
|
interval_kind = interval_type->getKind();
|
|
|
|
result_type_is_date = (interval_type->getKind() == IntervalKind::Kind::Year) || (interval_type->getKind() == IntervalKind::Kind::Quarter)
|
|
|
|
|| (interval_type->getKind() == IntervalKind::Kind::Month) || (interval_type->getKind() == IntervalKind::Kind::Week);
|
|
|
|
}
|
2021-06-01 03:01:35 +00:00
|
|
|
|
2024-03-18 11:26:05 +00:00
|
|
|
void checkIntervalArgument(const ColumnWithTypeAndName & argument, const String & function_name, bool & result_type_is_date)
|
|
|
|
{
|
|
|
|
IntervalKind interval_kind;
|
|
|
|
checkIntervalArgument(argument, function_name, interval_kind, result_type_is_date);
|
|
|
|
}
|
2021-06-01 03:01:35 +00:00
|
|
|
|
2024-03-18 11:26:05 +00:00
|
|
|
void checkTimeZoneArgument(
|
|
|
|
const ColumnWithTypeAndName & argument,
|
|
|
|
const String & function_name)
|
|
|
|
{
|
|
|
|
if (!WhichDataType(argument.type).isString())
|
|
|
|
throw Exception(ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT, "Illegal type {} of argument of function {}. "
|
|
|
|
"This argument is optional and must be a constant string with timezone name",
|
|
|
|
argument.type->getName(), function_name);
|
|
|
|
}
|
|
|
|
|
|
|
|
bool checkIntervalOrTimeZoneArgument(const ColumnWithTypeAndName & argument, const String & function_name, IntervalKind & interval_kind, bool & result_type_is_date)
|
|
|
|
{
|
|
|
|
if (WhichDataType(argument.type).isString())
|
2021-06-01 03:01:35 +00:00
|
|
|
{
|
2024-03-18 11:26:05 +00:00
|
|
|
checkTimeZoneArgument(argument, function_name);
|
|
|
|
return false;
|
2021-06-01 03:01:35 +00:00
|
|
|
}
|
2024-03-18 11:26:05 +00:00
|
|
|
checkIntervalArgument(argument, function_name, interval_kind, result_type_is_date);
|
|
|
|
return true;
|
2021-06-01 03:01:35 +00:00
|
|
|
}
|
|
|
|
|
2024-03-18 11:26:05 +00:00
|
|
|
template <TimeWindowFunctionName type>
|
|
|
|
struct TimeWindowImpl
|
|
|
|
{
|
|
|
|
static constexpr auto name = "UNKNOWN";
|
|
|
|
|
|
|
|
static DataTypePtr getReturnType(const ColumnsWithTypeAndName & arguments, const String & function_name);
|
|
|
|
|
|
|
|
static ColumnPtr dispatchForColumns(const ColumnsWithTypeAndName & arguments, const String & function_name);
|
|
|
|
};
|
|
|
|
|
|
|
|
template <TimeWindowFunctionName type>
|
|
|
|
class FunctionTimeWindow : public IFunction
|
|
|
|
{
|
|
|
|
public:
|
|
|
|
static constexpr auto name = TimeWindowImpl<type>::name;
|
|
|
|
static FunctionPtr create(ContextPtr) { return std::make_shared<FunctionTimeWindow>(); }
|
|
|
|
String getName() const override { return name; }
|
|
|
|
bool isVariadic() const override { return true; }
|
|
|
|
size_t getNumberOfArguments() const override { return 0; }
|
|
|
|
bool useDefaultImplementationForConstants() const override { return true; }
|
|
|
|
ColumnNumbers getArgumentsThatAreAlwaysConstant() const override { return {1, 2, 3}; }
|
|
|
|
bool isSuitableForShortCircuitArgumentsExecution(const DataTypesWithConstInfo &) const override { return true; }
|
|
|
|
|
|
|
|
DataTypePtr getReturnTypeImpl(const ColumnsWithTypeAndName & arguments) const override;
|
|
|
|
|
|
|
|
ColumnPtr executeImpl(const ColumnsWithTypeAndName & arguments, const DataTypePtr & /*result_type*/, size_t /*input_rows_count*/) const override;
|
|
|
|
};
|
|
|
|
|
|
|
|
using FunctionTumble = FunctionTimeWindow<TUMBLE>;
|
|
|
|
using FunctionTumbleStart = FunctionTimeWindow<TUMBLE_START>;
|
|
|
|
using FunctionTumbleEnd = FunctionTimeWindow<TUMBLE_END>;
|
|
|
|
using FunctionHop = FunctionTimeWindow<HOP>;
|
|
|
|
using FunctionWindowId = FunctionTimeWindow<WINDOW_ID>;
|
|
|
|
using FunctionHopStart = FunctionTimeWindow<HOP_START>;
|
|
|
|
using FunctionHopEnd = FunctionTimeWindow<HOP_END>;
|
|
|
|
|
|
|
|
|
2021-06-01 03:01:35 +00:00
|
|
|
template <>
|
2021-12-10 09:43:44 +00:00
|
|
|
struct TimeWindowImpl<TUMBLE>
|
2021-06-01 03:01:35 +00:00
|
|
|
{
|
2021-12-07 08:14:00 +00:00
|
|
|
static constexpr auto name = "tumble";
|
2021-06-01 03:01:35 +00:00
|
|
|
|
|
|
|
[[maybe_unused]] static DataTypePtr getReturnType(const ColumnsWithTypeAndName & arguments, const String & function_name)
|
|
|
|
{
|
|
|
|
bool result_type_is_date;
|
|
|
|
|
|
|
|
if (arguments.size() == 2)
|
|
|
|
{
|
|
|
|
checkFirstArgument(arguments.at(0), function_name);
|
|
|
|
checkIntervalArgument(arguments.at(1), function_name, result_type_is_date);
|
|
|
|
}
|
|
|
|
else if (arguments.size() == 3)
|
|
|
|
{
|
|
|
|
checkFirstArgument(arguments.at(0), function_name);
|
|
|
|
checkIntervalArgument(arguments.at(1), function_name, result_type_is_date);
|
|
|
|
checkTimeZoneArgument(arguments.at(2), function_name);
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
2023-01-23 21:13:58 +00:00
|
|
|
throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH,
|
|
|
|
"Number of arguments for function {} doesn't match: passed {}, should be 2 or 3",
|
|
|
|
function_name, arguments.size());
|
2021-06-01 03:01:35 +00:00
|
|
|
}
|
|
|
|
|
2021-11-27 14:46:43 +00:00
|
|
|
DataTypePtr data_type = nullptr;
|
2021-06-01 03:01:35 +00:00
|
|
|
if (result_type_is_date)
|
2021-11-27 14:46:43 +00:00
|
|
|
data_type = std::make_shared<DataTypeDate>();
|
2021-06-01 03:01:35 +00:00
|
|
|
else
|
2023-06-10 12:53:02 +00:00
|
|
|
data_type = std::make_shared<DataTypeDateTime>(extractTimeZoneNameFromFunctionArguments(arguments, 2, 0, false));
|
2021-06-01 03:01:35 +00:00
|
|
|
|
2021-11-27 14:46:43 +00:00
|
|
|
return std::make_shared<DataTypeTuple>(DataTypes{data_type, data_type});
|
2021-06-01 03:01:35 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
static ColumnPtr dispatchForColumns(const ColumnsWithTypeAndName & arguments, const String & function_name)
|
|
|
|
{
|
|
|
|
const auto & time_column = arguments[0];
|
|
|
|
const auto & interval_column = arguments[1];
|
|
|
|
const auto & from_datatype = *time_column.type.get();
|
|
|
|
const auto which_type = WhichDataType(from_datatype);
|
2022-10-19 09:13:02 +00:00
|
|
|
const auto * time_column_vec = checkAndGetColumn<ColumnDateTime>(time_column.column.get());
|
2021-06-01 03:01:35 +00:00
|
|
|
const DateLUTImpl & time_zone = extractTimeZoneFromFunctionArguments(arguments, 2, 0);
|
|
|
|
if (!which_type.isDateTime() || !time_column_vec)
|
2023-01-23 21:13:58 +00:00
|
|
|
throw Exception(ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT, "Illegal column {} of function {}. "
|
|
|
|
"Must contain dates or dates with time", time_column.name, function_name);
|
2021-06-01 03:01:35 +00:00
|
|
|
|
|
|
|
auto interval = dispatchForIntervalColumns(interval_column, function_name);
|
|
|
|
|
|
|
|
switch (std::get<0>(interval))
|
|
|
|
{
|
2024-02-27 13:37:21 +00:00
|
|
|
/// TODO: add proper support for fractional seconds
|
|
|
|
case IntervalKind::Kind::Second:
|
|
|
|
return executeTumble<UInt32, IntervalKind::Kind::Second>(*time_column_vec, std::get<1>(interval), time_zone);
|
|
|
|
case IntervalKind::Kind::Minute:
|
|
|
|
return executeTumble<UInt32, IntervalKind::Kind::Minute>(*time_column_vec, std::get<1>(interval), time_zone);
|
|
|
|
case IntervalKind::Kind::Hour:
|
|
|
|
return executeTumble<UInt32, IntervalKind::Kind::Hour>(*time_column_vec, std::get<1>(interval), time_zone);
|
|
|
|
case IntervalKind::Kind::Day:
|
|
|
|
return executeTumble<UInt32, IntervalKind::Kind::Day>(*time_column_vec, std::get<1>(interval), time_zone);
|
|
|
|
case IntervalKind::Kind::Week:
|
|
|
|
return executeTumble<UInt16, IntervalKind::Kind::Week>(*time_column_vec, std::get<1>(interval), time_zone);
|
|
|
|
case IntervalKind::Kind::Month:
|
|
|
|
return executeTumble<UInt16, IntervalKind::Kind::Month>(*time_column_vec, std::get<1>(interval), time_zone);
|
|
|
|
case IntervalKind::Kind::Quarter:
|
|
|
|
return executeTumble<UInt16, IntervalKind::Kind::Quarter>(*time_column_vec, std::get<1>(interval), time_zone);
|
|
|
|
case IntervalKind::Kind::Year:
|
|
|
|
return executeTumble<UInt16, IntervalKind::Kind::Year>(*time_column_vec, std::get<1>(interval), time_zone);
|
2022-02-09 07:28:15 +00:00
|
|
|
default:
|
2023-01-23 21:13:58 +00:00
|
|
|
throw Exception(ErrorCodes::SYNTAX_ERROR, "Fraction seconds are unsupported by windows yet");
|
2021-06-01 03:01:35 +00:00
|
|
|
}
|
2022-10-07 19:20:14 +00:00
|
|
|
UNREACHABLE();
|
2021-06-01 03:01:35 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
template <typename ToType, IntervalKind::Kind unit>
|
2022-10-19 09:13:02 +00:00
|
|
|
static ColumnPtr executeTumble(const ColumnDateTime & time_column, UInt64 num_units, const DateLUTImpl & time_zone)
|
2021-06-01 03:01:35 +00:00
|
|
|
{
|
|
|
|
const auto & time_data = time_column.getData();
|
|
|
|
size_t size = time_column.size();
|
|
|
|
auto start = ColumnVector<ToType>::create();
|
|
|
|
auto end = ColumnVector<ToType>::create();
|
|
|
|
auto & start_data = start->getData();
|
|
|
|
auto & end_data = end->getData();
|
|
|
|
start_data.resize(size);
|
|
|
|
end_data.resize(size);
|
|
|
|
for (size_t i = 0; i != size; ++i)
|
|
|
|
{
|
|
|
|
start_data[i] = ToStartOfTransform<unit>::execute(time_data[i], num_units, time_zone);
|
|
|
|
end_data[i] = AddTime<unit>::execute(start_data[i], num_units, time_zone);
|
|
|
|
}
|
|
|
|
MutableColumns result;
|
|
|
|
result.emplace_back(std::move(start));
|
|
|
|
result.emplace_back(std::move(end));
|
|
|
|
return ColumnTuple::create(std::move(result));
|
|
|
|
}
|
|
|
|
};
|
|
|
|
|
|
|
|
template <>
|
2021-12-10 09:43:44 +00:00
|
|
|
struct TimeWindowImpl<TUMBLE_START>
|
2021-06-01 03:01:35 +00:00
|
|
|
{
|
2021-12-07 08:14:00 +00:00
|
|
|
static constexpr auto name = "tumbleStart";
|
2021-06-01 03:01:35 +00:00
|
|
|
|
|
|
|
static DataTypePtr getReturnType(const ColumnsWithTypeAndName & arguments, const String & function_name)
|
|
|
|
{
|
|
|
|
if (arguments.size() == 1)
|
|
|
|
{
|
2021-11-27 14:46:43 +00:00
|
|
|
auto type = WhichDataType(arguments[0].type);
|
|
|
|
if (type.isTuple())
|
2021-11-26 18:03:41 +00:00
|
|
|
return std::static_pointer_cast<const DataTypeTuple>(arguments[0].type)->getElement(0);
|
2021-11-27 14:46:43 +00:00
|
|
|
else if (type.isUInt32())
|
2021-11-26 18:03:41 +00:00
|
|
|
return std::make_shared<DataTypeDateTime>();
|
|
|
|
else
|
2023-01-23 21:13:58 +00:00
|
|
|
throw Exception(ErrorCodes::ILLEGAL_COLUMN,
|
|
|
|
"Illegal type of first argument of function {} should be DateTime, Tuple or UInt32",
|
|
|
|
function_name);
|
2021-06-01 03:01:35 +00:00
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
2021-12-10 09:43:44 +00:00
|
|
|
return std::static_pointer_cast<const DataTypeTuple>(TimeWindowImpl<TUMBLE>::getReturnType(arguments, function_name))
|
2021-11-26 18:30:22 +00:00
|
|
|
->getElement(0);
|
2021-06-01 03:01:35 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
[[maybe_unused]] static ColumnPtr dispatchForColumns(const ColumnsWithTypeAndName & arguments, const String & function_name)
|
|
|
|
{
|
2021-12-04 12:30:04 +00:00
|
|
|
const auto & time_column = arguments[0];
|
|
|
|
const auto which_type = WhichDataType(time_column.type);
|
2021-11-27 14:46:43 +00:00
|
|
|
ColumnPtr result_column;
|
2021-12-04 12:30:04 +00:00
|
|
|
if (arguments.size() == 1)
|
|
|
|
{
|
|
|
|
if (which_type.isUInt32())
|
|
|
|
return time_column.column;
|
|
|
|
else //isTuple
|
|
|
|
result_column = time_column.column;
|
|
|
|
}
|
2021-06-01 03:01:35 +00:00
|
|
|
else
|
2021-12-10 09:43:44 +00:00
|
|
|
result_column = TimeWindowImpl<TUMBLE>::dispatchForColumns(arguments, function_name);
|
2021-11-27 14:46:43 +00:00
|
|
|
return executeWindowBound(result_column, 0, function_name);
|
2021-06-01 03:01:35 +00:00
|
|
|
}
|
|
|
|
};
|
|
|
|
|
|
|
|
template <>
|
2021-12-10 09:43:44 +00:00
|
|
|
struct TimeWindowImpl<TUMBLE_END>
|
2021-06-01 03:01:35 +00:00
|
|
|
{
|
2021-12-07 08:14:00 +00:00
|
|
|
static constexpr auto name = "tumbleEnd";
|
2021-06-01 03:01:35 +00:00
|
|
|
|
|
|
|
[[maybe_unused]] static DataTypePtr getReturnType(const ColumnsWithTypeAndName & arguments, const String & function_name)
|
|
|
|
{
|
2021-12-10 09:43:44 +00:00
|
|
|
return TimeWindowImpl<TUMBLE_START>::getReturnType(arguments, function_name);
|
2021-06-01 03:01:35 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
[[maybe_unused]] static ColumnPtr dispatchForColumns(const ColumnsWithTypeAndName & arguments, const String& function_name)
|
|
|
|
{
|
2021-12-04 12:30:04 +00:00
|
|
|
const auto & time_column = arguments[0];
|
|
|
|
const auto which_type = WhichDataType(time_column.type);
|
2021-11-27 14:46:43 +00:00
|
|
|
ColumnPtr result_column;
|
2021-12-04 12:30:04 +00:00
|
|
|
if (arguments.size() == 1)
|
|
|
|
{
|
|
|
|
if (which_type.isUInt32())
|
|
|
|
return time_column.column;
|
|
|
|
else //isTuple
|
|
|
|
result_column = time_column.column;
|
|
|
|
}
|
2021-06-01 03:01:35 +00:00
|
|
|
else
|
2021-12-10 09:43:44 +00:00
|
|
|
result_column = TimeWindowImpl<TUMBLE>::dispatchForColumns(arguments, function_name);
|
2021-11-27 14:46:43 +00:00
|
|
|
return executeWindowBound(result_column, 1, function_name);
|
2021-06-01 03:01:35 +00:00
|
|
|
}
|
|
|
|
};
|
|
|
|
|
|
|
|
template <>
|
2021-12-10 09:43:44 +00:00
|
|
|
struct TimeWindowImpl<HOP>
|
2021-06-01 03:01:35 +00:00
|
|
|
{
|
2021-12-07 08:14:00 +00:00
|
|
|
static constexpr auto name = "hop";
|
2021-06-01 03:01:35 +00:00
|
|
|
|
|
|
|
[[maybe_unused]] static DataTypePtr getReturnType(const ColumnsWithTypeAndName & arguments, const String & function_name)
|
|
|
|
{
|
|
|
|
bool result_type_is_date;
|
|
|
|
IntervalKind interval_kind_1;
|
|
|
|
IntervalKind interval_kind_2;
|
|
|
|
|
|
|
|
if (arguments.size() == 3)
|
|
|
|
{
|
|
|
|
checkFirstArgument(arguments.at(0), function_name);
|
|
|
|
checkIntervalArgument(arguments.at(1), function_name, interval_kind_1, result_type_is_date);
|
|
|
|
checkIntervalArgument(arguments.at(2), function_name, interval_kind_2, result_type_is_date);
|
|
|
|
}
|
|
|
|
else if (arguments.size() == 4)
|
|
|
|
{
|
|
|
|
checkFirstArgument(arguments.at(0), function_name);
|
|
|
|
checkIntervalArgument(arguments.at(1), function_name, interval_kind_1, result_type_is_date);
|
|
|
|
checkIntervalArgument(arguments.at(2), function_name, interval_kind_2, result_type_is_date);
|
|
|
|
checkTimeZoneArgument(arguments.at(3), function_name);
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
2023-01-23 21:13:58 +00:00
|
|
|
throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH,
|
|
|
|
"Number of arguments for function {} doesn't match: passed {}, should be 3 or 4",
|
|
|
|
function_name, arguments.size());
|
2021-06-01 03:01:35 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
if (interval_kind_1 != interval_kind_2)
|
2023-01-23 21:13:58 +00:00
|
|
|
throw Exception(ErrorCodes::ILLEGAL_COLUMN, "Illegal type of window and hop column of function {}, must be same",
|
|
|
|
function_name);
|
2021-06-01 03:01:35 +00:00
|
|
|
|
2021-11-27 14:46:43 +00:00
|
|
|
DataTypePtr data_type = nullptr;
|
2021-06-01 03:01:35 +00:00
|
|
|
if (result_type_is_date)
|
2021-11-27 14:46:43 +00:00
|
|
|
data_type = std::make_shared<DataTypeDate>();
|
2021-06-01 03:01:35 +00:00
|
|
|
else
|
2023-06-10 12:53:02 +00:00
|
|
|
data_type = std::make_shared<DataTypeDateTime>(extractTimeZoneNameFromFunctionArguments(arguments, 3, 0, false));
|
2021-11-27 14:46:43 +00:00
|
|
|
return std::make_shared<DataTypeTuple>(DataTypes{data_type, data_type});
|
2021-06-01 03:01:35 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
static ColumnPtr dispatchForColumns(const ColumnsWithTypeAndName & arguments, const String & function_name)
|
|
|
|
{
|
|
|
|
const auto & time_column = arguments[0];
|
|
|
|
const auto & hop_interval_column = arguments[1];
|
|
|
|
const auto & window_interval_column = arguments[2];
|
|
|
|
const auto & from_datatype = *time_column.type.get();
|
2022-10-19 09:13:02 +00:00
|
|
|
const auto * time_column_vec = checkAndGetColumn<ColumnDateTime>(time_column.column.get());
|
2021-06-01 03:01:35 +00:00
|
|
|
const DateLUTImpl & time_zone = extractTimeZoneFromFunctionArguments(arguments, 3, 0);
|
|
|
|
if (!WhichDataType(from_datatype).isDateTime() || !time_column_vec)
|
2023-01-23 21:13:58 +00:00
|
|
|
throw Exception(ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT, "Illegal column {} argument of function {}. "
|
|
|
|
"Must contain dates or dates with time", time_column.name, function_name);
|
2021-06-01 03:01:35 +00:00
|
|
|
|
|
|
|
auto hop_interval = dispatchForIntervalColumns(hop_interval_column, function_name);
|
|
|
|
auto window_interval = dispatchForIntervalColumns(window_interval_column, function_name);
|
|
|
|
|
|
|
|
if (std::get<1>(hop_interval) > std::get<1>(window_interval))
|
2023-01-23 21:13:58 +00:00
|
|
|
throw Exception(ErrorCodes::ARGUMENT_OUT_OF_BOUND,
|
|
|
|
"Value for hop interval of function {} must not larger than window interval", function_name);
|
2021-06-01 03:01:35 +00:00
|
|
|
|
|
|
|
switch (std::get<0>(window_interval))
|
|
|
|
{
|
2024-02-27 13:37:21 +00:00
|
|
|
/// TODO: add proper support for fractional seconds
|
|
|
|
case IntervalKind::Kind::Second:
|
|
|
|
return executeHop<UInt32, IntervalKind::Kind::Second>(
|
2021-06-01 03:01:35 +00:00
|
|
|
*time_column_vec, std::get<1>(hop_interval), std::get<1>(window_interval), time_zone);
|
2024-02-27 13:37:21 +00:00
|
|
|
case IntervalKind::Kind::Minute:
|
|
|
|
return executeHop<UInt32, IntervalKind::Kind::Minute>(
|
2021-06-01 03:01:35 +00:00
|
|
|
*time_column_vec, std::get<1>(hop_interval), std::get<1>(window_interval), time_zone);
|
2024-02-27 13:37:21 +00:00
|
|
|
case IntervalKind::Kind::Hour:
|
|
|
|
return executeHop<UInt32, IntervalKind::Kind::Hour>(
|
2021-06-01 03:01:35 +00:00
|
|
|
*time_column_vec, std::get<1>(hop_interval), std::get<1>(window_interval), time_zone);
|
2024-02-27 13:37:21 +00:00
|
|
|
case IntervalKind::Kind::Day:
|
|
|
|
return executeHop<UInt32, IntervalKind::Kind::Day>(
|
2021-06-01 03:01:35 +00:00
|
|
|
*time_column_vec, std::get<1>(hop_interval), std::get<1>(window_interval), time_zone);
|
2024-02-27 13:37:21 +00:00
|
|
|
case IntervalKind::Kind::Week:
|
|
|
|
return executeHop<UInt16, IntervalKind::Kind::Week>(
|
2021-06-01 03:01:35 +00:00
|
|
|
*time_column_vec, std::get<1>(hop_interval), std::get<1>(window_interval), time_zone);
|
2024-02-27 13:37:21 +00:00
|
|
|
case IntervalKind::Kind::Month:
|
|
|
|
return executeHop<UInt16, IntervalKind::Kind::Month>(
|
2021-06-01 03:01:35 +00:00
|
|
|
*time_column_vec, std::get<1>(hop_interval), std::get<1>(window_interval), time_zone);
|
2024-02-27 13:37:21 +00:00
|
|
|
case IntervalKind::Kind::Quarter:
|
|
|
|
return executeHop<UInt16, IntervalKind::Kind::Quarter>(
|
2021-06-01 03:01:35 +00:00
|
|
|
*time_column_vec, std::get<1>(hop_interval), std::get<1>(window_interval), time_zone);
|
2024-02-27 13:37:21 +00:00
|
|
|
case IntervalKind::Kind::Year:
|
|
|
|
return executeHop<UInt16, IntervalKind::Kind::Year>(
|
2021-06-01 03:01:35 +00:00
|
|
|
*time_column_vec, std::get<1>(hop_interval), std::get<1>(window_interval), time_zone);
|
2022-02-09 07:28:15 +00:00
|
|
|
default:
|
2023-01-23 21:13:58 +00:00
|
|
|
throw Exception(ErrorCodes::SYNTAX_ERROR, "Fraction seconds are unsupported by windows yet");
|
2021-06-01 03:01:35 +00:00
|
|
|
}
|
2022-10-07 19:20:14 +00:00
|
|
|
UNREACHABLE();
|
2021-06-01 03:01:35 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
template <typename ToType, IntervalKind::Kind kind>
|
|
|
|
static ColumnPtr
|
2022-10-19 09:13:02 +00:00
|
|
|
executeHop(const ColumnDateTime & time_column, UInt64 hop_num_units, UInt64 window_num_units, const DateLUTImpl & time_zone)
|
2021-06-01 03:01:35 +00:00
|
|
|
{
|
|
|
|
const auto & time_data = time_column.getData();
|
|
|
|
size_t size = time_column.size();
|
|
|
|
auto start = ColumnVector<ToType>::create();
|
|
|
|
auto end = ColumnVector<ToType>::create();
|
|
|
|
auto & start_data = start->getData();
|
|
|
|
auto & end_data = end->getData();
|
|
|
|
start_data.resize(size);
|
|
|
|
end_data.resize(size);
|
|
|
|
|
|
|
|
for (size_t i = 0; i < size; ++i)
|
|
|
|
{
|
|
|
|
ToType wstart = ToStartOfTransform<kind>::execute(time_data[i], hop_num_units, time_zone);
|
|
|
|
ToType wend = AddTime<kind>::execute(wstart, hop_num_units, time_zone);
|
2022-05-04 12:56:09 +00:00
|
|
|
wstart = AddTime<kind>::execute(wend, -window_num_units, time_zone);
|
2021-06-01 03:01:35 +00:00
|
|
|
ToType wend_latest;
|
|
|
|
|
2024-03-18 11:26:05 +00:00
|
|
|
if (wstart > wend)
|
|
|
|
throw Exception(ErrorCodes::BAD_ARGUMENTS, "Time overflow in function {}", name);
|
|
|
|
|
2021-06-01 03:01:35 +00:00
|
|
|
do
|
|
|
|
{
|
2021-11-27 14:46:43 +00:00
|
|
|
wend_latest = wend;
|
2022-05-04 12:56:09 +00:00
|
|
|
wend = AddTime<kind>::execute(wend, -hop_num_units, time_zone);
|
2021-11-27 14:46:43 +00:00
|
|
|
} while (wend > time_data[i]);
|
2021-06-01 03:01:35 +00:00
|
|
|
|
|
|
|
end_data[i] = wend_latest;
|
2022-05-04 12:56:09 +00:00
|
|
|
start_data[i] = AddTime<kind>::execute(wend_latest, -window_num_units, time_zone);
|
2021-06-01 03:01:35 +00:00
|
|
|
}
|
|
|
|
MutableColumns result;
|
|
|
|
result.emplace_back(std::move(start));
|
|
|
|
result.emplace_back(std::move(end));
|
|
|
|
return ColumnTuple::create(std::move(result));
|
|
|
|
}
|
|
|
|
};
|
|
|
|
|
|
|
|
template <>
|
2021-12-10 09:43:44 +00:00
|
|
|
struct TimeWindowImpl<WINDOW_ID>
|
2021-06-01 03:01:35 +00:00
|
|
|
{
|
2021-12-07 08:14:00 +00:00
|
|
|
static constexpr auto name = "windowID";
|
2021-06-01 03:01:35 +00:00
|
|
|
|
2024-03-18 11:26:05 +00:00
|
|
|
static DataTypePtr getReturnType(const ColumnsWithTypeAndName & arguments, const String & function_name)
|
2021-06-01 03:01:35 +00:00
|
|
|
{
|
|
|
|
bool result_type_is_date;
|
|
|
|
IntervalKind interval_kind_1;
|
|
|
|
IntervalKind interval_kind_2;
|
|
|
|
|
|
|
|
if (arguments.size() == 2)
|
|
|
|
{
|
|
|
|
checkFirstArgument(arguments.at(0), function_name);
|
|
|
|
checkIntervalArgument(arguments.at(1), function_name, interval_kind_1, result_type_is_date);
|
|
|
|
}
|
|
|
|
else if (arguments.size() == 3)
|
|
|
|
{
|
|
|
|
checkFirstArgument(arguments.at(0), function_name);
|
|
|
|
checkIntervalArgument(arguments.at(1), function_name, interval_kind_1, result_type_is_date);
|
|
|
|
if (checkIntervalOrTimeZoneArgument(arguments.at(2), function_name, interval_kind_2, result_type_is_date))
|
|
|
|
{
|
|
|
|
if (interval_kind_1 != interval_kind_2)
|
2023-01-23 21:13:58 +00:00
|
|
|
throw Exception(ErrorCodes::ILLEGAL_COLUMN, "Illegal type of window and hop column of function {}, must be same",
|
|
|
|
function_name);
|
2021-06-01 03:01:35 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
else if (arguments.size() == 4)
|
|
|
|
{
|
|
|
|
checkFirstArgument(arguments.at(0), function_name);
|
|
|
|
checkIntervalArgument(arguments.at(1), function_name, interval_kind_1, result_type_is_date);
|
|
|
|
checkIntervalArgument(arguments.at(2), function_name, interval_kind_2, result_type_is_date);
|
|
|
|
checkTimeZoneArgument(arguments.at(3), function_name);
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
2023-01-23 21:13:58 +00:00
|
|
|
throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH,
|
|
|
|
"Number of arguments for function {} doesn't match: passed {}, should be 2, 3 or 4",
|
|
|
|
function_name, arguments.size());
|
2021-06-01 03:01:35 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
if (result_type_is_date)
|
|
|
|
return std::make_shared<DataTypeUInt16>();
|
|
|
|
else
|
|
|
|
return std::make_shared<DataTypeUInt32>();
|
|
|
|
}
|
|
|
|
|
2024-03-18 11:26:05 +00:00
|
|
|
static ColumnPtr dispatchForHopColumns(const ColumnsWithTypeAndName & arguments, const String & function_name)
|
2021-06-01 03:01:35 +00:00
|
|
|
{
|
|
|
|
const auto & time_column = arguments[0];
|
|
|
|
const auto & hop_interval_column = arguments[1];
|
|
|
|
const auto & window_interval_column = arguments[2];
|
|
|
|
const auto & from_datatype = *time_column.type.get();
|
2022-10-19 09:13:02 +00:00
|
|
|
const auto * time_column_vec = checkAndGetColumn<ColumnDateTime>(time_column.column.get());
|
2021-06-01 03:01:35 +00:00
|
|
|
const DateLUTImpl & time_zone = extractTimeZoneFromFunctionArguments(arguments, 3, 0);
|
|
|
|
if (!WhichDataType(from_datatype).isDateTime() || !time_column_vec)
|
2023-01-23 21:13:58 +00:00
|
|
|
throw Exception(ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT, "Illegal column {} argument of function {}. "
|
|
|
|
"Must contain dates or dates with time", time_column.name, function_name);
|
2021-06-01 03:01:35 +00:00
|
|
|
|
|
|
|
auto hop_interval = dispatchForIntervalColumns(hop_interval_column, function_name);
|
|
|
|
auto window_interval = dispatchForIntervalColumns(window_interval_column, function_name);
|
|
|
|
|
|
|
|
if (std::get<1>(hop_interval) > std::get<1>(window_interval))
|
2023-01-23 21:13:58 +00:00
|
|
|
throw Exception(ErrorCodes::ARGUMENT_OUT_OF_BOUND,
|
|
|
|
"Value for hop interval of function {} must not larger than window interval", function_name);
|
2021-06-01 03:01:35 +00:00
|
|
|
|
|
|
|
switch (std::get<0>(window_interval))
|
|
|
|
{
|
2024-02-27 13:37:21 +00:00
|
|
|
/// TODO: add proper support for fractional seconds
|
|
|
|
case IntervalKind::Kind::Second:
|
|
|
|
return executeHopSlice<UInt32, IntervalKind::Kind::Second>(
|
2021-06-01 03:01:35 +00:00
|
|
|
*time_column_vec, std::get<1>(hop_interval), std::get<1>(window_interval), time_zone);
|
2024-02-27 13:37:21 +00:00
|
|
|
case IntervalKind::Kind::Minute:
|
|
|
|
return executeHopSlice<UInt32, IntervalKind::Kind::Minute>(
|
2021-06-01 03:01:35 +00:00
|
|
|
*time_column_vec, std::get<1>(hop_interval), std::get<1>(window_interval), time_zone);
|
2024-02-27 13:37:21 +00:00
|
|
|
case IntervalKind::Kind::Hour:
|
|
|
|
return executeHopSlice<UInt32, IntervalKind::Kind::Hour>(
|
2021-06-01 03:01:35 +00:00
|
|
|
*time_column_vec, std::get<1>(hop_interval), std::get<1>(window_interval), time_zone);
|
2024-02-27 13:37:21 +00:00
|
|
|
case IntervalKind::Kind::Day:
|
|
|
|
return executeHopSlice<UInt32, IntervalKind::Kind::Day>(
|
2021-06-01 03:01:35 +00:00
|
|
|
*time_column_vec, std::get<1>(hop_interval), std::get<1>(window_interval), time_zone);
|
2024-02-27 13:37:21 +00:00
|
|
|
case IntervalKind::Kind::Week:
|
|
|
|
return executeHopSlice<UInt16, IntervalKind::Kind::Week>(
|
2021-06-01 03:01:35 +00:00
|
|
|
*time_column_vec, std::get<1>(hop_interval), std::get<1>(window_interval), time_zone);
|
2024-02-27 13:37:21 +00:00
|
|
|
case IntervalKind::Kind::Month:
|
|
|
|
return executeHopSlice<UInt16, IntervalKind::Kind::Month>(
|
2021-06-01 03:01:35 +00:00
|
|
|
*time_column_vec, std::get<1>(hop_interval), std::get<1>(window_interval), time_zone);
|
2024-02-27 13:37:21 +00:00
|
|
|
case IntervalKind::Kind::Quarter:
|
|
|
|
return executeHopSlice<UInt16, IntervalKind::Kind::Quarter>(
|
2021-06-01 03:01:35 +00:00
|
|
|
*time_column_vec, std::get<1>(hop_interval), std::get<1>(window_interval), time_zone);
|
2024-02-27 13:37:21 +00:00
|
|
|
case IntervalKind::Kind::Year:
|
|
|
|
return executeHopSlice<UInt16, IntervalKind::Kind::Year>(
|
2021-06-01 03:01:35 +00:00
|
|
|
*time_column_vec, std::get<1>(hop_interval), std::get<1>(window_interval), time_zone);
|
2022-02-09 07:28:15 +00:00
|
|
|
default:
|
2023-01-23 21:13:58 +00:00
|
|
|
throw Exception(ErrorCodes::SYNTAX_ERROR, "Fraction seconds are unsupported by windows yet");
|
2021-06-01 03:01:35 +00:00
|
|
|
}
|
2022-10-07 19:20:14 +00:00
|
|
|
UNREACHABLE();
|
2021-06-01 03:01:35 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
template <typename ToType, IntervalKind::Kind kind>
|
|
|
|
static ColumnPtr
|
2022-10-19 09:13:02 +00:00
|
|
|
executeHopSlice(const ColumnDateTime & time_column, UInt64 hop_num_units, UInt64 window_num_units, const DateLUTImpl & time_zone)
|
2021-06-01 03:01:35 +00:00
|
|
|
{
|
|
|
|
Int64 gcd_num_units = std::gcd(hop_num_units, window_num_units);
|
|
|
|
|
|
|
|
const auto & time_data = time_column.getData();
|
|
|
|
size_t size = time_column.size();
|
|
|
|
|
|
|
|
auto end = ColumnVector<ToType>::create();
|
|
|
|
auto & end_data = end->getData();
|
|
|
|
end_data.resize(size);
|
|
|
|
for (size_t i = 0; i < size; ++i)
|
|
|
|
{
|
|
|
|
ToType wstart = ToStartOfTransform<kind>::execute(time_data[i], hop_num_units, time_zone);
|
|
|
|
ToType wend = AddTime<kind>::execute(wstart, hop_num_units, time_zone);
|
|
|
|
ToType wend_latest;
|
|
|
|
|
2024-03-18 11:26:05 +00:00
|
|
|
if (wstart > wend)
|
|
|
|
throw Exception(ErrorCodes::BAD_ARGUMENTS, "Time overflow in function {}", name);
|
|
|
|
|
2021-06-01 03:01:35 +00:00
|
|
|
do
|
|
|
|
{
|
2021-11-27 14:46:43 +00:00
|
|
|
wend_latest = wend;
|
2022-05-04 12:56:09 +00:00
|
|
|
wend = AddTime<kind>::execute(wend, -gcd_num_units, time_zone);
|
2021-11-27 14:46:43 +00:00
|
|
|
} while (wend > time_data[i]);
|
2021-06-01 03:01:35 +00:00
|
|
|
|
|
|
|
end_data[i] = wend_latest;
|
|
|
|
}
|
|
|
|
return end;
|
|
|
|
}
|
|
|
|
|
2024-03-18 11:26:05 +00:00
|
|
|
static ColumnPtr dispatchForTumbleColumns(const ColumnsWithTypeAndName & arguments, const String & function_name)
|
2021-06-01 03:01:35 +00:00
|
|
|
{
|
2021-12-10 09:43:44 +00:00
|
|
|
ColumnPtr column = TimeWindowImpl<TUMBLE>::dispatchForColumns(arguments, function_name);
|
2021-06-01 03:01:35 +00:00
|
|
|
return executeWindowBound(column, 1, function_name);
|
|
|
|
}
|
|
|
|
|
2024-03-18 11:26:05 +00:00
|
|
|
static ColumnPtr dispatchForColumns(const ColumnsWithTypeAndName & arguments, const String & function_name)
|
2021-06-01 03:01:35 +00:00
|
|
|
{
|
|
|
|
if (arguments.size() == 2)
|
|
|
|
return dispatchForTumbleColumns(arguments, function_name);
|
|
|
|
else
|
|
|
|
{
|
|
|
|
const auto & third_column = arguments[2];
|
|
|
|
if (arguments.size() == 3 && WhichDataType(third_column.type).isString())
|
|
|
|
return dispatchForTumbleColumns(arguments, function_name);
|
|
|
|
else
|
|
|
|
return dispatchForHopColumns(arguments, function_name);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
};
|
|
|
|
|
|
|
|
template <>
|
2021-12-10 09:43:44 +00:00
|
|
|
struct TimeWindowImpl<HOP_START>
|
2021-06-01 03:01:35 +00:00
|
|
|
{
|
2021-12-07 08:14:00 +00:00
|
|
|
static constexpr auto name = "hopStart";
|
2021-06-01 03:01:35 +00:00
|
|
|
|
|
|
|
static DataTypePtr getReturnType(const ColumnsWithTypeAndName & arguments, const String & function_name)
|
|
|
|
{
|
|
|
|
if (arguments.size() == 1)
|
|
|
|
{
|
2021-11-27 14:46:43 +00:00
|
|
|
auto type = WhichDataType(arguments[0].type);
|
|
|
|
if (type.isTuple())
|
2021-11-26 18:03:41 +00:00
|
|
|
return std::static_pointer_cast<const DataTypeTuple>(arguments[0].type)->getElement(0);
|
2021-11-27 14:46:43 +00:00
|
|
|
else if (type.isUInt32())
|
2021-11-26 18:03:41 +00:00
|
|
|
return std::make_shared<DataTypeDateTime>();
|
|
|
|
else
|
2023-01-23 21:13:58 +00:00
|
|
|
throw Exception(ErrorCodes::ILLEGAL_COLUMN,
|
|
|
|
"Illegal type of first argument of function {} should be DateTime, Tuple or UInt32",
|
|
|
|
function_name);
|
2021-06-01 03:01:35 +00:00
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
2021-12-10 09:43:44 +00:00
|
|
|
return std::static_pointer_cast<const DataTypeTuple>(TimeWindowImpl<HOP>::getReturnType(arguments, function_name))->getElement(0);
|
2021-06-01 03:01:35 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2024-03-18 11:26:05 +00:00
|
|
|
static ColumnPtr dispatchForColumns(const ColumnsWithTypeAndName & arguments, const String & function_name)
|
2021-06-01 03:01:35 +00:00
|
|
|
{
|
|
|
|
const auto & time_column = arguments[0];
|
|
|
|
const auto which_type = WhichDataType(time_column.type);
|
2021-11-27 14:46:43 +00:00
|
|
|
ColumnPtr result_column;
|
2021-06-01 03:01:35 +00:00
|
|
|
if (arguments.size() == 1)
|
|
|
|
{
|
|
|
|
if (which_type.isUInt32())
|
|
|
|
return time_column.column;
|
|
|
|
else //isTuple
|
2021-11-27 14:46:43 +00:00
|
|
|
result_column = time_column.column;
|
2021-06-01 03:01:35 +00:00
|
|
|
}
|
|
|
|
else
|
2021-12-10 09:43:44 +00:00
|
|
|
result_column = TimeWindowImpl<HOP>::dispatchForColumns(arguments, function_name);
|
2021-11-27 14:46:43 +00:00
|
|
|
return executeWindowBound(result_column, 0, function_name);
|
2021-06-01 03:01:35 +00:00
|
|
|
}
|
|
|
|
};
|
|
|
|
|
|
|
|
template <>
|
2021-12-10 09:43:44 +00:00
|
|
|
struct TimeWindowImpl<HOP_END>
|
2021-06-01 03:01:35 +00:00
|
|
|
{
|
2021-12-07 08:14:00 +00:00
|
|
|
static constexpr auto name = "hopEnd";
|
2021-06-01 03:01:35 +00:00
|
|
|
|
2024-03-18 11:26:05 +00:00
|
|
|
static DataTypePtr getReturnType(const ColumnsWithTypeAndName & arguments, const String & function_name)
|
2021-06-01 03:01:35 +00:00
|
|
|
{
|
2021-12-10 09:43:44 +00:00
|
|
|
return TimeWindowImpl<HOP_START>::getReturnType(arguments, function_name);
|
2021-06-01 03:01:35 +00:00
|
|
|
}
|
|
|
|
|
2024-03-18 11:26:05 +00:00
|
|
|
static ColumnPtr dispatchForColumns(const ColumnsWithTypeAndName & arguments, const String & function_name)
|
2021-06-01 03:01:35 +00:00
|
|
|
{
|
|
|
|
const auto & time_column = arguments[0];
|
|
|
|
const auto which_type = WhichDataType(time_column.type);
|
2021-11-27 14:46:43 +00:00
|
|
|
ColumnPtr result_column;
|
2021-06-01 03:01:35 +00:00
|
|
|
if (arguments.size() == 1)
|
|
|
|
{
|
|
|
|
if (which_type.isUInt32())
|
|
|
|
return time_column.column;
|
|
|
|
else //isTuple
|
2021-11-27 14:46:43 +00:00
|
|
|
result_column = time_column.column;
|
2021-06-01 03:01:35 +00:00
|
|
|
}
|
|
|
|
else
|
2021-12-10 09:43:44 +00:00
|
|
|
result_column = TimeWindowImpl<HOP>::dispatchForColumns(arguments, function_name);
|
2021-06-01 03:01:35 +00:00
|
|
|
|
2021-11-27 14:46:43 +00:00
|
|
|
return executeWindowBound(result_column, 1, function_name);
|
2021-06-01 03:01:35 +00:00
|
|
|
}
|
|
|
|
};
|
|
|
|
|
2021-12-10 09:59:50 +00:00
|
|
|
template <TimeWindowFunctionName type>
|
2021-12-10 09:43:44 +00:00
|
|
|
DataTypePtr FunctionTimeWindow<type>::getReturnTypeImpl(const ColumnsWithTypeAndName & arguments) const
|
2021-06-01 03:01:35 +00:00
|
|
|
{
|
2021-12-10 09:43:44 +00:00
|
|
|
return TimeWindowImpl<type>::getReturnType(arguments, name);
|
2021-06-01 03:01:35 +00:00
|
|
|
}
|
|
|
|
|
2021-12-10 09:59:50 +00:00
|
|
|
template <TimeWindowFunctionName type>
|
2021-12-10 09:43:44 +00:00
|
|
|
ColumnPtr FunctionTimeWindow<type>::executeImpl(const ColumnsWithTypeAndName & arguments, const DataTypePtr & /*result_type*/, size_t /*input_rows_count*/) const
|
2021-06-01 03:01:35 +00:00
|
|
|
{
|
2021-12-10 09:43:44 +00:00
|
|
|
return TimeWindowImpl<type>::dispatchForColumns(arguments, name);
|
2021-06-01 03:01:35 +00:00
|
|
|
}
|
|
|
|
|
2024-03-18 11:26:05 +00:00
|
|
|
}
|
|
|
|
|
2022-07-04 07:01:39 +00:00
|
|
|
REGISTER_FUNCTION(TimeWindow)
|
2020-01-14 03:08:54 +00:00
|
|
|
{
|
|
|
|
factory.registerFunction<FunctionTumble>();
|
|
|
|
factory.registerFunction<FunctionHop>();
|
|
|
|
factory.registerFunction<FunctionTumbleStart>();
|
|
|
|
factory.registerFunction<FunctionTumbleEnd>();
|
|
|
|
factory.registerFunction<FunctionHopStart>();
|
|
|
|
factory.registerFunction<FunctionHopEnd>();
|
2020-06-17 15:06:19 +00:00
|
|
|
factory.registerFunction<FunctionWindowId>();
|
2020-01-14 03:08:54 +00:00
|
|
|
}
|
2020-01-14 16:24:26 +00:00
|
|
|
}
|