2015-06-03 03:29:28 +00:00
|
|
|
#include <mutex>
|
2021-10-02 07:13:14 +00:00
|
|
|
#include <base/bit_cast.h>
|
2021-02-14 16:07:20 +00:00
|
|
|
|
2017-07-21 06:35:58 +00:00
|
|
|
#include <Columns/ColumnArray.h>
|
2017-04-01 09:19:00 +00:00
|
|
|
#include <Columns/ColumnConst.h>
|
2021-11-26 02:05:31 +00:00
|
|
|
#include <Columns/ColumnDecimal.h>
|
2023-03-31 15:15:23 +00:00
|
|
|
#include <Columns/ColumnNullable.h>
|
|
|
|
#include <Columns/ColumnString.h>
|
|
|
|
#include <Columns/ColumnsNumber.h>
|
|
|
|
#include <DataTypes/DataTypeArray.h>
|
|
|
|
#include <DataTypes/getLeastSupertype.h>
|
|
|
|
#include <Functions/FunctionFactory.h>
|
|
|
|
#include <Functions/FunctionHelpers.h>
|
|
|
|
#include <Functions/IFunction.h>
|
|
|
|
#include <Interpreters/castColumn.h>
|
|
|
|
#include <Interpreters/convertFieldToType.h>
|
|
|
|
#include <base/StringRef.h>
|
2017-04-01 09:19:00 +00:00
|
|
|
#include <Common/Arena.h>
|
2023-03-31 15:15:23 +00:00
|
|
|
#include <Common/FieldVisitorConvertToNumber.h>
|
|
|
|
#include <Common/FieldVisitorDump.h>
|
2017-04-01 09:19:00 +00:00
|
|
|
#include <Common/HashTable/HashMap.h>
|
2017-07-13 20:58:19 +00:00
|
|
|
#include <Common/typeid_cast.h>
|
2015-06-03 03:29:28 +00:00
|
|
|
|
|
|
|
|
|
|
|
namespace DB
|
|
|
|
{
|
2017-04-08 01:32:05 +00:00
|
|
|
namespace ErrorCodes
|
|
|
|
{
|
2020-02-25 18:02:41 +00:00
|
|
|
extern const int ILLEGAL_TYPE_OF_ARGUMENT;
|
2017-04-08 01:32:05 +00:00
|
|
|
extern const int BAD_ARGUMENTS;
|
2017-06-13 02:06:53 +00:00
|
|
|
extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH;
|
|
|
|
extern const int ILLEGAL_COLUMN;
|
2017-04-08 01:32:05 +00:00
|
|
|
}
|
|
|
|
|
2020-09-07 18:00:37 +00:00
|
|
|
namespace
|
|
|
|
{
|
2023-03-31 15:15:23 +00:00
|
|
|
/** transform(x, from_array, to_array[, default]) - convert x according to an explicitly passed match.
|
2015-06-03 03:29:28 +00:00
|
|
|
*/
|
2023-03-31 15:15:23 +00:00
|
|
|
/** transform(x, [from...], [to...], default)
|
2017-05-27 15:45:25 +00:00
|
|
|
* - converts the values according to the explicitly specified mapping.
|
2015-06-03 03:29:28 +00:00
|
|
|
*
|
2017-05-27 15:45:25 +00:00
|
|
|
* x - what to transform.
|
|
|
|
* from - a constant array of values for the transformation.
|
|
|
|
* to - a constant array of values into which values from `from` must be transformed.
|
|
|
|
* default - what value to use if x is not equal to any of the values in `from`.
|
|
|
|
* `from` and `to` - arrays of the same size.
|
2015-06-03 03:29:28 +00:00
|
|
|
*
|
2017-05-27 15:45:25 +00:00
|
|
|
* Types:
|
2015-06-03 03:29:28 +00:00
|
|
|
* transform(T, Array(T), Array(U), U) -> U
|
|
|
|
*
|
|
|
|
* transform(x, [from...], [to...])
|
2017-05-27 15:45:25 +00:00
|
|
|
* - if `default` is not specified, then for values of `x` for which there is no corresponding element in `from`, the unchanged value of `x` is returned.
|
2015-06-03 03:29:28 +00:00
|
|
|
*
|
2017-05-27 15:45:25 +00:00
|
|
|
* Types:
|
2015-06-03 03:29:28 +00:00
|
|
|
* transform(T, Array(T), Array(T)) -> T
|
|
|
|
*
|
2017-05-27 15:45:25 +00:00
|
|
|
* Note: the implementation is rather cumbersome.
|
2015-06-03 03:29:28 +00:00
|
|
|
*/
|
2023-03-31 15:15:23 +00:00
|
|
|
class FunctionTransform : public IFunction
|
2016-05-03 23:19:14 +00:00
|
|
|
{
|
2023-03-31 15:15:23 +00:00
|
|
|
public:
|
|
|
|
static constexpr auto name = "transform";
|
|
|
|
static FunctionPtr create(ContextPtr) { return std::make_shared<FunctionTransform>(); }
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2023-03-31 15:15:23 +00:00
|
|
|
String getName() const override { return name; }
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2023-03-31 15:15:23 +00:00
|
|
|
bool isVariadic() const override { return true; }
|
|
|
|
bool isSuitableForShortCircuitArgumentsExecution(const DataTypesWithConstInfo & /*arguments*/) const override { return true; }
|
|
|
|
size_t getNumberOfArguments() const override { return 0; }
|
|
|
|
bool useDefaultImplementationForConstants() const override { return false; }
|
|
|
|
bool useDefaultImplementationForNulls() const override { return false; }
|
|
|
|
bool useDefaultImplementationForNothing() const override { return false; }
|
|
|
|
ColumnNumbers getArgumentsThatAreAlwaysConstant() const override { return {1, 2}; }
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2023-03-31 15:15:23 +00:00
|
|
|
DataTypePtr getReturnTypeImpl(const DataTypes & arguments) const override
|
2015-06-03 03:29:28 +00:00
|
|
|
{
|
2023-03-31 15:15:23 +00:00
|
|
|
const auto args_size = arguments.size();
|
|
|
|
if (args_size != 3 && args_size != 4)
|
|
|
|
throw Exception(
|
|
|
|
ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH,
|
|
|
|
"Number of arguments for function {} doesn't match: "
|
|
|
|
"passed {}, should be 3 or 4",
|
|
|
|
getName(),
|
|
|
|
args_size);
|
|
|
|
|
|
|
|
const DataTypePtr & type_x = arguments[0];
|
|
|
|
const auto & type_x_nn = removeNullable(type_x);
|
|
|
|
|
|
|
|
if (!type_x_nn->isValueRepresentedByNumber() && !isString(type_x_nn) && !isNothing(type_x_nn))
|
|
|
|
throw Exception(
|
|
|
|
ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT,
|
|
|
|
"Unsupported type {} of first argument "
|
|
|
|
"of function {}, must be numeric type or Date/DateTime or String",
|
|
|
|
type_x->getName(),
|
|
|
|
getName());
|
|
|
|
|
|
|
|
const DataTypeArray * type_arr_from = checkAndGetDataType<DataTypeArray>(arguments[1].get());
|
|
|
|
|
|
|
|
if (!type_arr_from)
|
|
|
|
throw Exception(
|
|
|
|
ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT,
|
|
|
|
"Second argument of function {}, must be array of source values to transform from.",
|
|
|
|
getName());
|
|
|
|
|
|
|
|
const auto type_arr_from_nested = type_arr_from->getNestedType();
|
|
|
|
|
|
|
|
if ((type_x->isValueRepresentedByNumber() != type_arr_from_nested->isValueRepresentedByNumber())
|
|
|
|
|| (isString(type_x) != isString(type_arr_from_nested)))
|
2015-06-03 03:29:28 +00:00
|
|
|
{
|
2023-03-31 15:15:23 +00:00
|
|
|
throw Exception(
|
|
|
|
ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT,
|
|
|
|
"First argument and elements of array "
|
|
|
|
"of second argument of function {} must have compatible types: "
|
|
|
|
"both numeric or both strings.",
|
|
|
|
getName());
|
2015-06-03 03:29:28 +00:00
|
|
|
}
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2023-03-31 15:15:23 +00:00
|
|
|
const DataTypeArray * type_arr_to = checkAndGetDataType<DataTypeArray>(arguments[2].get());
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2023-03-31 15:15:23 +00:00
|
|
|
if (!type_arr_to)
|
|
|
|
throw Exception(
|
|
|
|
ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT,
|
|
|
|
"Third argument of function {}, must be array of destination values to transform to.",
|
|
|
|
getName());
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2023-03-31 15:15:23 +00:00
|
|
|
const DataTypePtr & type_arr_to_nested = type_arr_to->getNestedType();
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2023-03-31 15:15:23 +00:00
|
|
|
if (args_size == 3)
|
2015-06-03 03:29:28 +00:00
|
|
|
{
|
2023-03-31 15:15:23 +00:00
|
|
|
auto ret = tryGetLeastSupertype(DataTypes{type_arr_to_nested, type_x});
|
|
|
|
if (!ret)
|
|
|
|
throw Exception(
|
|
|
|
ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT,
|
|
|
|
"Function {} has signature: "
|
|
|
|
"transform(T, Array(T), Array(U), U) -> U; "
|
|
|
|
"or transform(T, Array(T), Array(T)) -> T; where T and U are types.",
|
|
|
|
getName());
|
|
|
|
return ret;
|
2015-06-03 03:29:28 +00:00
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
2023-03-31 15:15:23 +00:00
|
|
|
auto ret = tryGetLeastSupertype(DataTypes{type_arr_to_nested, arguments[3]});
|
|
|
|
if (!ret)
|
|
|
|
throw Exception(
|
|
|
|
ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT,
|
|
|
|
"Function {} have signature: "
|
|
|
|
"transform(T, Array(T), Array(U), U) -> U; "
|
|
|
|
"or transform(T, Array(T), Array(T)) -> T; where T and U are types.",
|
|
|
|
getName());
|
|
|
|
return ret;
|
2015-06-03 03:29:28 +00:00
|
|
|
}
|
|
|
|
}
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2023-03-31 15:15:23 +00:00
|
|
|
ColumnPtr
|
|
|
|
executeImpl(const ColumnsWithTypeAndName & arguments, const DataTypePtr & result_type, size_t input_rows_count) const override
|
2021-11-26 02:05:31 +00:00
|
|
|
{
|
2023-03-31 15:15:23 +00:00
|
|
|
initialize(arguments, result_type);
|
|
|
|
|
|
|
|
const auto * in = arguments.front().column.get();
|
|
|
|
|
|
|
|
if (isColumnConst(*in))
|
|
|
|
return executeConst(arguments, result_type, input_rows_count);
|
|
|
|
|
|
|
|
ColumnPtr default_non_const;
|
|
|
|
if (!cache.default_column && arguments.size() == 4)
|
|
|
|
default_non_const = castColumn(arguments[3], result_type);
|
|
|
|
|
|
|
|
auto column_result = result_type->createColumn();
|
|
|
|
if (!executeNum<ColumnVector<UInt8>>(in, *column_result, default_non_const)
|
|
|
|
&& !executeNum<ColumnVector<UInt16>>(in, *column_result, default_non_const)
|
|
|
|
&& !executeNum<ColumnVector<UInt32>>(in, *column_result, default_non_const)
|
|
|
|
&& !executeNum<ColumnVector<UInt64>>(in, *column_result, default_non_const)
|
|
|
|
&& !executeNum<ColumnVector<Int8>>(in, *column_result, default_non_const)
|
|
|
|
&& !executeNum<ColumnVector<Int16>>(in, *column_result, default_non_const)
|
|
|
|
&& !executeNum<ColumnVector<Int32>>(in, *column_result, default_non_const)
|
|
|
|
&& !executeNum<ColumnVector<Int64>>(in, *column_result, default_non_const)
|
|
|
|
&& !executeNum<ColumnVector<Float32>>(in, *column_result, default_non_const)
|
|
|
|
&& !executeNum<ColumnVector<Float64>>(in, *column_result, default_non_const)
|
|
|
|
&& !executeNum<ColumnDecimal<Decimal32>>(in, *column_result, default_non_const)
|
|
|
|
&& !executeNum<ColumnDecimal<Decimal64>>(in, *column_result, default_non_const)
|
|
|
|
&& !executeString(in, *column_result, default_non_const))
|
2021-11-26 02:05:31 +00:00
|
|
|
{
|
2023-03-31 15:15:23 +00:00
|
|
|
throw Exception(ErrorCodes::ILLEGAL_COLUMN, "Illegal column {} of first argument of function {}", in->getName(), getName());
|
2021-11-26 02:05:31 +00:00
|
|
|
}
|
2023-03-31 15:15:23 +00:00
|
|
|
return column_result;
|
2021-11-26 02:05:31 +00:00
|
|
|
}
|
|
|
|
|
2023-03-31 15:15:23 +00:00
|
|
|
private:
|
|
|
|
static ColumnPtr executeConst(const ColumnsWithTypeAndName & arguments, const DataTypePtr & result_type, size_t input_rows_count)
|
2015-06-03 03:29:28 +00:00
|
|
|
{
|
2023-03-31 15:15:23 +00:00
|
|
|
/// Materialize the input column and compute the function as usual.
|
2021-11-26 02:05:31 +00:00
|
|
|
|
2023-03-31 15:15:23 +00:00
|
|
|
ColumnsWithTypeAndName args = arguments;
|
|
|
|
args[0].column = args[0].column->cloneResized(input_rows_count)->convertToFullColumnIfConst();
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2023-03-31 15:15:23 +00:00
|
|
|
auto impl = FunctionToOverloadResolverAdaptor(std::make_shared<FunctionTransform>()).build(args);
|
2021-11-26 02:05:31 +00:00
|
|
|
|
2023-03-31 15:15:23 +00:00
|
|
|
return impl->execute(args, result_type, input_rows_count);
|
2021-11-26 02:05:31 +00:00
|
|
|
}
|
|
|
|
|
2023-03-31 15:15:23 +00:00
|
|
|
template <typename T>
|
|
|
|
bool executeNum(const IColumn * in_untyped, IColumn & column_result, const ColumnPtr default_non_const) const
|
2021-11-26 02:05:31 +00:00
|
|
|
{
|
2023-03-31 15:15:23 +00:00
|
|
|
const auto in = checkAndGetColumn<T>(in_untyped);
|
|
|
|
if (!in)
|
|
|
|
return false;
|
|
|
|
const auto & pod = in->getData();
|
|
|
|
const size_t size = pod.size();
|
|
|
|
const auto & table = *cache.table_num_to_idx;
|
2023-04-14 08:09:28 +00:00
|
|
|
column_result.reserve(size);
|
2023-03-31 15:15:23 +00:00
|
|
|
for (size_t i = 0; i < size; ++i)
|
2023-01-23 19:54:35 +00:00
|
|
|
{
|
2023-03-31 15:15:23 +00:00
|
|
|
const auto * it = table.find(bit_cast<UInt64>(pod[i]));
|
|
|
|
if (it)
|
|
|
|
column_result.insertFrom(*cache.to_columns, it->getMapped());
|
|
|
|
else if (cache.default_column)
|
|
|
|
column_result.insertFrom(*cache.default_column, 0);
|
|
|
|
else if (default_non_const)
|
2023-04-14 08:40:37 +00:00
|
|
|
column_result.insertFrom(*default_non_const, i);
|
2023-01-23 19:54:35 +00:00
|
|
|
else
|
2023-03-31 15:15:23 +00:00
|
|
|
column_result.insertFrom(*in, i);
|
2023-01-23 19:54:35 +00:00
|
|
|
}
|
2023-03-31 15:15:23 +00:00
|
|
|
return true;
|
2015-06-03 03:29:28 +00:00
|
|
|
}
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2023-03-31 15:15:23 +00:00
|
|
|
bool executeString(const IColumn * in_untyped, IColumn & column_result, const ColumnPtr default_non_const) const
|
2015-06-03 03:29:28 +00:00
|
|
|
{
|
2023-03-31 15:15:23 +00:00
|
|
|
const auto in = checkAndGetColumn<ColumnString>(in_untyped);
|
|
|
|
if (!in)
|
|
|
|
return false;
|
|
|
|
const auto & data = in->getChars();
|
|
|
|
const auto & offsets = in->getOffsets();
|
|
|
|
const size_t size = offsets.size();
|
|
|
|
const auto & table = *cache.table_string_to_idx;
|
2023-04-14 08:09:28 +00:00
|
|
|
column_result.reserve(size);
|
2023-03-31 15:15:23 +00:00
|
|
|
ColumnString::Offset current_offset = 0;
|
|
|
|
for (size_t i = 0; i < size; ++i)
|
2023-01-23 19:54:35 +00:00
|
|
|
{
|
2023-03-31 15:15:23 +00:00
|
|
|
const StringRef ref{&data[current_offset], offsets[i] - current_offset};
|
|
|
|
current_offset = offsets[i];
|
|
|
|
const auto * it = table.find(ref);
|
|
|
|
if (it)
|
|
|
|
column_result.insertFrom(*cache.to_columns, it->getMapped());
|
|
|
|
else if (cache.default_column)
|
|
|
|
column_result.insertFrom(*cache.default_column, 0);
|
|
|
|
else if (default_non_const)
|
|
|
|
column_result.insertFrom(*default_non_const, 0);
|
2023-01-23 19:54:35 +00:00
|
|
|
else
|
2023-03-31 15:15:23 +00:00
|
|
|
column_result.insertFrom(*in, i);
|
2023-01-23 19:54:35 +00:00
|
|
|
}
|
2023-03-31 15:15:23 +00:00
|
|
|
return true;
|
2015-06-03 03:29:28 +00:00
|
|
|
}
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2023-03-31 15:15:23 +00:00
|
|
|
/// Different versions of the hash tables to implement the mapping.
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2023-03-31 15:15:23 +00:00
|
|
|
struct Cache
|
2015-06-03 03:29:28 +00:00
|
|
|
{
|
2023-03-31 15:15:23 +00:00
|
|
|
using NumToIdx = HashMap<UInt64, size_t, HashCRC32<UInt64>>;
|
|
|
|
using StringToIdx = HashMap<StringRef, size_t, StringRefHash>;
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2023-03-31 15:15:23 +00:00
|
|
|
std::unique_ptr<NumToIdx> table_num_to_idx;
|
|
|
|
std::unique_ptr<StringToIdx> table_string_to_idx;
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2023-03-31 15:15:23 +00:00
|
|
|
ColumnPtr to_columns;
|
|
|
|
ColumnPtr default_column;
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2023-03-31 15:15:23 +00:00
|
|
|
Arena string_pool;
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2023-03-31 15:15:23 +00:00
|
|
|
std::atomic<bool> initialized{false};
|
|
|
|
std::mutex mutex;
|
|
|
|
};
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2023-03-31 15:15:23 +00:00
|
|
|
mutable Cache cache;
|
2017-04-01 07:20:54 +00:00
|
|
|
|
|
|
|
|
2023-03-31 15:15:23 +00:00
|
|
|
static UInt64 bitCastToUInt64(const Field & x)
|
2015-06-03 03:29:28 +00:00
|
|
|
{
|
2023-03-31 15:15:23 +00:00
|
|
|
switch (x.getType())
|
2015-06-03 03:29:28 +00:00
|
|
|
{
|
2023-03-31 15:15:23 +00:00
|
|
|
case Field::Types::UInt64:
|
|
|
|
return x.get<UInt64>();
|
|
|
|
case Field::Types::Int64:
|
|
|
|
return x.get<Int64>();
|
|
|
|
case Field::Types::Float64:
|
|
|
|
return std::bit_cast<UInt64>(x.get<Float64>());
|
|
|
|
case Field::Types::Bool:
|
|
|
|
return x.get<bool>();
|
|
|
|
case Field::Types::Decimal32:
|
|
|
|
return x.get<DecimalField<Decimal32>>().getValue();
|
|
|
|
case Field::Types::Decimal64:
|
|
|
|
return x.get<DecimalField<Decimal64>>().getValue();
|
|
|
|
default:
|
|
|
|
throw Exception(ErrorCodes::BAD_ARGUMENTS, "Unexpected type in function 'transform'");
|
2015-06-03 03:29:28 +00:00
|
|
|
}
|
|
|
|
}
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2023-03-31 15:15:23 +00:00
|
|
|
/// Can be called from different threads. It works only on the first call.
|
|
|
|
void initialize(const ColumnsWithTypeAndName & arguments, const DataTypePtr & result_type) const
|
2022-09-18 03:16:08 +00:00
|
|
|
{
|
2023-03-31 15:15:23 +00:00
|
|
|
const ColumnConst * array_from = checkAndGetColumnConst<ColumnArray>(arguments[1].column.get());
|
|
|
|
const ColumnConst * array_to = checkAndGetColumnConst<ColumnArray>(arguments[2].column.get());
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2023-03-31 15:15:23 +00:00
|
|
|
if (!array_from || !array_to)
|
|
|
|
throw Exception(
|
|
|
|
ErrorCodes::ILLEGAL_COLUMN, "Second and third arguments of function {} must be constant arrays.", getName());
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2023-03-31 15:15:23 +00:00
|
|
|
if (cache.initialized)
|
|
|
|
return;
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2023-03-31 15:15:23 +00:00
|
|
|
const auto & from = array_from->getValue<Array>();
|
|
|
|
const size_t size = from.size();
|
|
|
|
if (0 == size)
|
|
|
|
throw Exception(ErrorCodes::BAD_ARGUMENTS, "Empty arrays are illegal in function {}", getName());
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2023-03-31 15:15:23 +00:00
|
|
|
std::lock_guard lock(cache.mutex);
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2023-03-31 15:15:23 +00:00
|
|
|
if (cache.initialized)
|
|
|
|
return;
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2023-03-31 15:15:23 +00:00
|
|
|
const auto & to = array_to->getValue<Array>();
|
|
|
|
if (size != to.size())
|
|
|
|
throw Exception(
|
|
|
|
ErrorCodes::BAD_ARGUMENTS, "Second and third arguments of function {} must be arrays of same size", getName());
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2023-03-31 15:15:23 +00:00
|
|
|
/// Whether the default value is set.
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2023-03-31 15:15:23 +00:00
|
|
|
if (arguments.size() == 4)
|
2015-06-03 03:55:29 +00:00
|
|
|
{
|
2023-03-31 15:15:23 +00:00
|
|
|
const IColumn * default_col = arguments[3].column.get();
|
|
|
|
if (default_col && isColumnConst(*default_col))
|
|
|
|
{
|
|
|
|
auto default_column = result_type->createColumn();
|
|
|
|
if (!default_col->onlyNull())
|
|
|
|
{
|
|
|
|
Field f = convertFieldToType((*default_col)[0], *result_type);
|
|
|
|
default_column->insert(f);
|
|
|
|
}
|
|
|
|
else
|
|
|
|
default_column->insertDefault();
|
|
|
|
cache.default_column = std::move(default_column);
|
|
|
|
}
|
2015-06-03 03:29:28 +00:00
|
|
|
}
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2023-03-31 15:15:23 +00:00
|
|
|
/// Note: Doesn't check the duplicates in the `from` array.
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2023-03-31 15:15:23 +00:00
|
|
|
const IDataType & from_type = *arguments[0].type;
|
2021-02-14 16:07:20 +00:00
|
|
|
|
2023-03-31 15:15:23 +00:00
|
|
|
if (from[0].getType() != Field::Types::String)
|
2019-12-17 10:19:21 +00:00
|
|
|
{
|
2023-03-31 15:15:23 +00:00
|
|
|
cache.table_num_to_idx = std::make_unique<Cache::NumToIdx>();
|
|
|
|
auto & table = *cache.table_num_to_idx;
|
2021-02-14 16:07:20 +00:00
|
|
|
for (size_t i = 0; i < size; ++i)
|
|
|
|
{
|
|
|
|
Field key = convertFieldToType(from[i], from_type);
|
|
|
|
if (key.isNull())
|
|
|
|
continue;
|
|
|
|
|
2022-09-18 06:58:32 +00:00
|
|
|
/// Field may be of Float type, but for the purpose of bitwise equality we can treat them as UInt64
|
2023-03-31 15:15:23 +00:00
|
|
|
table[bitCastToUInt64(key)] = i;
|
2021-02-14 16:07:20 +00:00
|
|
|
}
|
2019-12-17 10:19:21 +00:00
|
|
|
}
|
2021-02-14 16:07:20 +00:00
|
|
|
else
|
2015-06-03 03:29:28 +00:00
|
|
|
{
|
2023-03-31 15:15:23 +00:00
|
|
|
cache.table_string_to_idx = std::make_unique<Cache::StringToIdx>();
|
|
|
|
auto & table = *cache.table_string_to_idx;
|
2021-02-14 16:07:20 +00:00
|
|
|
for (size_t i = 0; i < size; ++i)
|
|
|
|
{
|
|
|
|
const String & str_from = from[i].get<const String &>();
|
|
|
|
StringRef ref{cache.string_pool.insert(str_from.data(), str_from.size() + 1), str_from.size() + 1};
|
2023-03-31 15:15:23 +00:00
|
|
|
table[ref] = i;
|
2021-02-14 16:07:20 +00:00
|
|
|
}
|
2015-06-03 03:29:28 +00:00
|
|
|
}
|
2023-03-31 15:15:23 +00:00
|
|
|
|
|
|
|
auto to_columns = result_type->createColumn();
|
|
|
|
for (size_t i = 0; i < size; ++i)
|
2015-06-03 03:29:28 +00:00
|
|
|
{
|
2023-03-31 15:15:23 +00:00
|
|
|
Field to_value = convertFieldToType(to[i], *result_type);
|
|
|
|
to_columns->insert(to_value);
|
2015-06-03 03:29:28 +00:00
|
|
|
}
|
2023-03-31 15:15:23 +00:00
|
|
|
cache.to_columns = std::move(to_columns);
|
2017-04-01 07:20:54 +00:00
|
|
|
|
2023-03-31 15:15:23 +00:00
|
|
|
cache.initialized = true;
|
|
|
|
}
|
2015-06-03 03:29:28 +00:00
|
|
|
};
|
|
|
|
|
2020-09-07 18:00:37 +00:00
|
|
|
}
|
|
|
|
|
2022-07-04 07:01:39 +00:00
|
|
|
REGISTER_FUNCTION(Transform)
|
2018-12-02 02:52:49 +00:00
|
|
|
{
|
|
|
|
factory.registerFunction<FunctionTransform>();
|
|
|
|
}
|
|
|
|
|
2015-06-03 03:29:28 +00:00
|
|
|
}
|