mirror of
https://github.com/ClickHouse/ClickHouse.git
synced 2024-11-05 15:21:43 +00:00
1411 lines
54 KiB
C++
1411 lines
54 KiB
C++
#pragma once
|
||
|
||
#include <DB/IO/WriteBufferFromVector.h>
|
||
#include <DB/IO/ReadBufferFromString.h>
|
||
#include <DB/DataTypes/DataTypesNumberFixed.h>
|
||
#include <DB/DataTypes/DataTypeString.h>
|
||
#include <DB/DataTypes/DataTypeFixedString.h>
|
||
#include <DB/DataTypes/DataTypeDate.h>
|
||
#include <DB/DataTypes/DataTypeDateTime.h>
|
||
#include <DB/Columns/ColumnString.h>
|
||
#include <DB/Columns/ColumnFixedString.h>
|
||
#include <DB/Columns/ColumnConst.h>
|
||
#include <DB/Functions/IFunction.h>
|
||
#include <DB/Core/FieldVisitors.h>
|
||
#include <ext/range.hpp>
|
||
#include <type_traits>
|
||
|
||
|
||
namespace DB
|
||
{
|
||
|
||
/** Функции преобразования типов.
|
||
* toType - преобразование "естественным образом";
|
||
*/
|
||
|
||
|
||
/** Преобразование чисел друг в друга, дат/дат-с-временем в числа и наоборот: делается обычным присваиванием.
|
||
* (дата внутри хранится как количество дней с какого-то, дата-с-временем - как unix timestamp)
|
||
*/
|
||
template <typename FromDataType, typename ToDataType, typename Name>
|
||
struct ConvertImpl
|
||
{
|
||
typedef typename FromDataType::FieldType FromFieldType;
|
||
typedef typename ToDataType::FieldType ToFieldType;
|
||
|
||
static void execute(Block & block, const ColumnNumbers & arguments, size_t result)
|
||
{
|
||
if (const ColumnVector<FromFieldType> * col_from = typeid_cast<const ColumnVector<FromFieldType> *>(&*block.getByPosition(arguments[0]).column))
|
||
{
|
||
ColumnVector<ToFieldType> * col_to = new ColumnVector<ToFieldType>;
|
||
block.getByPosition(result).column = col_to;
|
||
|
||
const typename ColumnVector<FromFieldType>::Container_t & vec_from = col_from->getData();
|
||
typename ColumnVector<ToFieldType>::Container_t & vec_to = col_to->getData();
|
||
size_t size = vec_from.size();
|
||
vec_to.resize(size);
|
||
|
||
for (size_t i = 0; i < size; ++i)
|
||
vec_to[i] = vec_from[i];
|
||
}
|
||
else if (const ColumnConst<FromFieldType> * col_from = typeid_cast<const ColumnConst<FromFieldType> *>(&*block.getByPosition(arguments[0]).column))
|
||
{
|
||
block.getByPosition(result).column = new ColumnConst<ToFieldType>(col_from->size(), col_from->getData());
|
||
}
|
||
else
|
||
throw Exception("Illegal column " + block.getByPosition(arguments[0]).column->getName()
|
||
+ " of first argument of function " + Name::name,
|
||
ErrorCodes::ILLEGAL_COLUMN);
|
||
}
|
||
};
|
||
|
||
|
||
/** Преобразование даты в дату-с-временем: добавление нулевого времени.
|
||
*/
|
||
template <typename Name>
|
||
struct ConvertImpl<DataTypeDate, DataTypeDateTime, Name>
|
||
{
|
||
typedef DataTypeDate::FieldType FromFieldType;
|
||
typedef DataTypeDateTime::FieldType ToFieldType;
|
||
|
||
static void execute(Block & block, const ColumnNumbers & arguments, size_t result)
|
||
{
|
||
typedef DataTypeDate::FieldType FromFieldType;
|
||
const auto & date_lut = DateLUT::instance();
|
||
|
||
if (const ColumnVector<FromFieldType> * col_from = typeid_cast<const ColumnVector<FromFieldType> *>(&*block.getByPosition(arguments[0]).column))
|
||
{
|
||
ColumnVector<ToFieldType> * col_to = new ColumnVector<ToFieldType>;
|
||
block.getByPosition(result).column = col_to;
|
||
|
||
const typename ColumnVector<FromFieldType>::Container_t & vec_from = col_from->getData();
|
||
typename ColumnVector<ToFieldType>::Container_t & vec_to = col_to->getData();
|
||
size_t size = vec_from.size();
|
||
vec_to.resize(size);
|
||
|
||
for (size_t i = 0; i < size; ++i)
|
||
{
|
||
vec_to[i] = date_lut.fromDayNum(DayNum_t(vec_from[i]));
|
||
}
|
||
}
|
||
else if (const ColumnConst<FromFieldType> * col_from = typeid_cast<const ColumnConst<FromFieldType> *>(&*block.getByPosition(arguments[0]).column))
|
||
{
|
||
block.getByPosition(result).column = new ColumnConst<ToFieldType>(col_from->size(), date_lut.fromDayNum(DayNum_t(col_from->getData())));
|
||
}
|
||
else
|
||
throw Exception("Illegal column " + block.getByPosition(arguments[0]).column->getName()
|
||
+ " of first argument of function " + Name::name,
|
||
ErrorCodes::ILLEGAL_COLUMN);
|
||
}
|
||
};
|
||
|
||
/// Реализация функции toDate.
|
||
|
||
namespace details { namespace {
|
||
|
||
template<typename FromType, typename ToType, template <typename, typename> class Transformation>
|
||
class Transformer
|
||
{
|
||
private:
|
||
using Op = Transformation<FromType, ToType>;
|
||
|
||
public:
|
||
static void vector_vector(const PODArray<FromType> & vec_from, const ColumnString::Chars_t & data,
|
||
const ColumnString::Offsets_t & offsets, PODArray<ToType> & vec_to)
|
||
{
|
||
ColumnString::Offset_t prev_offset = 0;
|
||
|
||
for (size_t i = 0; i < vec_from.size(); ++i)
|
||
{
|
||
ColumnString::Offset_t cur_offset = offsets[i];
|
||
const std::string time_zone(reinterpret_cast<const char *>(&data[prev_offset]), cur_offset - prev_offset - 1);
|
||
const auto & remote_date_lut = DateLUT::instance(time_zone);
|
||
vec_to[i] = Op::execute(vec_from[i], remote_date_lut);
|
||
prev_offset = cur_offset;
|
||
}
|
||
}
|
||
|
||
static void vector_constant(const PODArray<FromType> & vec_from, const std::string & data,
|
||
PODArray<ToType> & vec_to)
|
||
{
|
||
const auto & remote_date_lut = DateLUT::instance(data);
|
||
for (size_t i = 0; i < vec_from.size(); ++i)
|
||
vec_to[i] = Op::execute(vec_from[i], remote_date_lut);
|
||
}
|
||
|
||
static void vector_constant(const PODArray<FromType> & vec_from, PODArray<ToType> & vec_to)
|
||
{
|
||
const auto & local_date_lut = DateLUT::instance();
|
||
for (size_t i = 0; i < vec_from.size(); ++i)
|
||
vec_to[i] = Op::execute(vec_from[i], local_date_lut);
|
||
}
|
||
|
||
static void constant_vector(const FromType & from, const ColumnString::Chars_t & data,
|
||
const ColumnString::Offsets_t & offsets, PODArray<ToType> & vec_to)
|
||
{
|
||
ColumnString::Offset_t prev_offset = 0;
|
||
|
||
for (size_t i = 0; i < offsets.size(); ++i)
|
||
{
|
||
ColumnString::Offset_t cur_offset = offsets[i];
|
||
const std::string time_zone(reinterpret_cast<const char *>(&data[prev_offset]), cur_offset - prev_offset - 1);
|
||
const auto & remote_date_lut = DateLUT::instance(time_zone);
|
||
vec_to[i] = Op::execute(from, remote_date_lut);
|
||
prev_offset = cur_offset;
|
||
}
|
||
}
|
||
|
||
static void constant_constant(const FromType & from, const std::string & data, ToType & to)
|
||
{
|
||
const auto & remote_date_lut = DateLUT::instance(data);
|
||
to = Op::execute(from, remote_date_lut);
|
||
}
|
||
|
||
static void constant_constant(const FromType & from, ToType & to)
|
||
{
|
||
const auto & local_date_lut = DateLUT::instance();
|
||
to = Op::execute(from, local_date_lut);
|
||
}
|
||
};
|
||
|
||
template <typename FromType, template <typename, typename> class Transformation, typename Name>
|
||
class ToDateConverter
|
||
{
|
||
private:
|
||
using FromFieldType = typename FromType::FieldType;
|
||
using ToFieldType = typename DataTypeDate::FieldType;
|
||
using Op = Transformer<FromFieldType, ToFieldType, Transformation>;
|
||
|
||
public:
|
||
static void execute(Block & block, const ColumnNumbers & arguments, size_t result)
|
||
{
|
||
const ColumnPtr source_col = block.getByPosition(arguments[0]).column;
|
||
const auto * sources = typeid_cast<const ColumnVector<FromFieldType> *>(&*source_col);
|
||
const auto * const_source = typeid_cast<const ColumnConst<FromFieldType> *>(&*source_col);
|
||
|
||
if (arguments.size() == 1)
|
||
{
|
||
if (sources)
|
||
{
|
||
auto * col_to = new ColumnVector<ToFieldType>;
|
||
block.getByPosition(result).column = col_to;
|
||
|
||
const auto & vec_from = sources->getData();
|
||
auto & vec_to = col_to->getData();
|
||
size_t size = vec_from.size();
|
||
vec_to.resize(size);
|
||
|
||
Op::vector_constant(vec_from, vec_to);
|
||
}
|
||
else if (const_source)
|
||
{
|
||
ToFieldType res;
|
||
Op::constant_constant(const_source->getData(), res);
|
||
block.getByPosition(result).column = new ColumnConst<ToFieldType>(const_source->size(), res);
|
||
}
|
||
else
|
||
throw Exception("Illegal column " + block.getByPosition(arguments[0]).column->getName()
|
||
+ " of argument of function " + Name::name,
|
||
ErrorCodes::ILLEGAL_COLUMN);
|
||
}
|
||
else if (arguments.size() == 2)
|
||
{
|
||
const ColumnPtr time_zone_col = block.getByPosition(arguments[1]).column;
|
||
const auto * time_zones = typeid_cast<const ColumnString *>(&*time_zone_col);
|
||
const auto * const_time_zone = typeid_cast<const ColumnConstString *>(&*time_zone_col);
|
||
|
||
if (sources)
|
||
{
|
||
auto * col_to = new ColumnVector<ToFieldType>;
|
||
block.getByPosition(result).column = col_to;
|
||
|
||
auto & vec_from = sources->getData();
|
||
auto & vec_to = col_to->getData();
|
||
vec_to.resize(vec_from.size());
|
||
|
||
if (time_zones)
|
||
Op::vector_vector(vec_from, time_zones->getChars(), time_zones->getOffsets(), vec_to);
|
||
else if (const_time_zone)
|
||
Op::vector_constant(vec_from, const_time_zone->getData(), vec_to);
|
||
else
|
||
throw Exception("Illegal column " + block.getByPosition(arguments[1]).column->getName()
|
||
+ " of second argument of function " + Name::name,
|
||
ErrorCodes::ILLEGAL_COLUMN);
|
||
}
|
||
else if (const_source)
|
||
{
|
||
if (time_zones)
|
||
{
|
||
auto * col_to = new ColumnVector<ToFieldType>;
|
||
block.getByPosition(result).column = col_to;
|
||
|
||
auto & vec_to = col_to->getData();
|
||
vec_to.resize(time_zones->getOffsets().size());
|
||
|
||
Op::constant_vector(const_source->getData(), time_zones->getChars(), time_zones->getOffsets(), vec_to);
|
||
}
|
||
else if (const_time_zone)
|
||
{
|
||
ToFieldType res;
|
||
Op::constant_constant(const_source->getData(), const_time_zone->getData(), res);
|
||
block.getByPosition(result).column = new ColumnConst<ToFieldType>(const_source->size(), res);
|
||
}
|
||
else
|
||
throw Exception("Illegal column " + block.getByPosition(arguments[1]).column->getName()
|
||
+ " of second argument of function " + Name::name,
|
||
ErrorCodes::ILLEGAL_COLUMN);
|
||
}
|
||
else
|
||
throw Exception("Illegal column " + block.getByPosition(arguments[0]).column->getName()
|
||
+ " of first argument of function " + Name::name,
|
||
ErrorCodes::ILLEGAL_COLUMN);
|
||
}
|
||
else
|
||
throw Exception("FunctionsConversion: Internal error", ErrorCodes::LOGICAL_ERROR);
|
||
}
|
||
};
|
||
|
||
template <typename FromType, typename ToType>
|
||
struct ToDateTransform
|
||
{
|
||
static inline ToType execute(const FromType & from, const DateLUTImpl & date_lut)
|
||
{
|
||
return date_lut.toDayNum(from);
|
||
}
|
||
};
|
||
|
||
template <typename FromType, typename ToType>
|
||
struct ToDateTransform32Or64
|
||
{
|
||
static inline ToType execute(const FromType & from, const DateLUTImpl & date_lut)
|
||
{
|
||
return (from < 0xFFFF) ? from : date_lut.toDayNum(from);
|
||
}
|
||
};
|
||
|
||
}}
|
||
|
||
/** Преобразование даты-с-временем в дату: отбрасывание времени.
|
||
*/
|
||
template <typename Name> struct ConvertImpl<DataTypeDateTime, DataTypeDate, Name> : details::ToDateConverter<DataTypeDateTime, details::ToDateTransform, Name> {};
|
||
|
||
/** Отдельный случай для преобразования (U)Int32 или (U)Int64 в Date.
|
||
* Если число меньше 65536, то оно понимается, как DayNum, а если больше или равно - как unix timestamp.
|
||
* Немного нелогично, что мы, по сути, помещаем две разные функции в одну.
|
||
* Но зато это позволяет поддержать распространённый случай,
|
||
* когда пользователь пишет toDate(UInt32), ожидая, что это - перевод unix timestamp в дату
|
||
* (иначе такое использование было бы распространённой ошибкой).
|
||
*/
|
||
template <typename Name> struct ConvertImpl<DataTypeUInt32, DataTypeDate, Name> : details::ToDateConverter<DataTypeUInt32, details::ToDateTransform32Or64, Name> {};
|
||
template <typename Name> struct ConvertImpl<DataTypeUInt64, DataTypeDate, Name> : details::ToDateConverter<DataTypeUInt64, details::ToDateTransform32Or64, Name> {};
|
||
template <typename Name> struct ConvertImpl<DataTypeInt32, DataTypeDate, Name> : details::ToDateConverter<DataTypeInt32, details::ToDateTransform32Or64, Name> {};
|
||
template <typename Name> struct ConvertImpl<DataTypeInt64, DataTypeDate, Name> : details::ToDateConverter<DataTypeInt64, details::ToDateTransform32Or64, Name> {};
|
||
|
||
/** Преобразование чисел, дат, дат-с-временем в строки: через форматирование.
|
||
*/
|
||
template <typename DataType> void formatImpl(typename DataType::FieldType x, WriteBuffer & wb) { writeText(x, wb); }
|
||
template <> inline void formatImpl<DataTypeDate>(DataTypeDate::FieldType x, WriteBuffer & wb) { writeDateText(DayNum_t(x), wb); }
|
||
template <> inline void formatImpl<DataTypeDateTime>(DataTypeDateTime::FieldType x, WriteBuffer & wb) { writeDateTimeText(x, wb); }
|
||
|
||
template <typename FromDataType, typename Name>
|
||
struct ConvertImpl<FromDataType, DataTypeString, Name>
|
||
{
|
||
typedef typename FromDataType::FieldType FromFieldType;
|
||
|
||
static void execute(Block & block, const ColumnNumbers & arguments, size_t result)
|
||
{
|
||
if (const ColumnVector<FromFieldType> * col_from = typeid_cast<const ColumnVector<FromFieldType> *>(&*block.getByPosition(arguments[0]).column))
|
||
{
|
||
ColumnString * col_to = new ColumnString;
|
||
block.getByPosition(result).column = col_to;
|
||
|
||
const typename ColumnVector<FromFieldType>::Container_t & vec_from = col_from->getData();
|
||
ColumnString::Chars_t & data_to = col_to->getChars();
|
||
ColumnString::Offsets_t & offsets_to = col_to->getOffsets();
|
||
size_t size = vec_from.size();
|
||
data_to.resize(size * 2);
|
||
offsets_to.resize(size);
|
||
|
||
WriteBufferFromVector<ColumnString::Chars_t> write_buffer(data_to);
|
||
|
||
for (size_t i = 0; i < size; ++i)
|
||
{
|
||
formatImpl<FromDataType>(vec_from[i], write_buffer);
|
||
writeChar(0, write_buffer);
|
||
offsets_to[i] = write_buffer.count();
|
||
}
|
||
data_to.resize(write_buffer.count());
|
||
}
|
||
else if (const ColumnConst<FromFieldType> * col_from = typeid_cast<const ColumnConst<FromFieldType> *>(&*block.getByPosition(arguments[0]).column))
|
||
{
|
||
std::vector<char> buf;
|
||
WriteBufferFromVector<std::vector<char> > write_buffer(buf);
|
||
formatImpl<FromDataType>(col_from->getData(), write_buffer);
|
||
block.getByPosition(result).column = new ColumnConstString(col_from->size(), std::string(&buf[0], write_buffer.count()));
|
||
}
|
||
else
|
||
throw Exception("Illegal column " + block.getByPosition(arguments[0]).column->getName()
|
||
+ " of first argument of function " + Name::name,
|
||
ErrorCodes::ILLEGAL_COLUMN);
|
||
}
|
||
};
|
||
|
||
namespace details { namespace {
|
||
|
||
/** Пусть source_timestamp представляет дату и время в исходном часовом поясе соответствующем
|
||
* объекту from_date_lut. Эта функция возвращает timestamp представлящий те же дату и время
|
||
* в часовом поясе соответствующем объекту to_date_lut.
|
||
*/
|
||
time_t convertTimestamp(time_t source_timestamp, const DateLUTImpl & from_date_lut, const DateLUTImpl & to_date_lut)
|
||
{
|
||
if (&from_date_lut == &to_date_lut)
|
||
return source_timestamp;
|
||
else
|
||
{
|
||
const auto & values = from_date_lut.getValues(source_timestamp);
|
||
return to_date_lut.makeDateTime(values.year, values.month, values.day_of_month,
|
||
from_date_lut.toHourInaccurate(source_timestamp),
|
||
from_date_lut.toMinuteInaccurate(source_timestamp),
|
||
from_date_lut.toSecondInaccurate(source_timestamp));
|
||
}
|
||
}
|
||
|
||
/** Функции для преобразования даты + времени в строку.
|
||
*/
|
||
struct DateTimeToStringConverter
|
||
{
|
||
using FromFieldType = typename DataTypeDateTime::FieldType;
|
||
|
||
static void vector_vector(const PODArray<FromFieldType> & vec_from, const ColumnString::Chars_t & data,
|
||
const ColumnString::Offsets_t & offsets, ColumnString & vec_to)
|
||
{
|
||
const auto & local_date_lut = DateLUT::instance();
|
||
|
||
ColumnString::Chars_t & data_to = vec_to.getChars();
|
||
ColumnString::Offsets_t & offsets_to = vec_to.getOffsets();
|
||
size_t size = vec_from.size();
|
||
data_to.resize(size * 2);
|
||
offsets_to.resize(size);
|
||
|
||
WriteBufferFromVector<ColumnString::Chars_t> write_buffer(data_to);
|
||
|
||
ColumnString::Offset_t prev_offset = 0;
|
||
|
||
for (size_t i = 0; i < size; ++i)
|
||
{
|
||
ColumnString::Offset_t cur_offset = offsets[i];
|
||
const std::string time_zone(reinterpret_cast<const char *>(&data[prev_offset]), cur_offset - prev_offset - 1);
|
||
const auto & remote_date_lut = DateLUT::instance(time_zone);
|
||
|
||
auto ti = convertTimestamp(vec_from[i], remote_date_lut, local_date_lut);
|
||
formatImpl<DataTypeDateTime>(ti, write_buffer);
|
||
writeChar(0, write_buffer);
|
||
offsets_to[i] = write_buffer.count();
|
||
|
||
prev_offset = cur_offset;
|
||
}
|
||
data_to.resize(write_buffer.count());
|
||
}
|
||
|
||
static void vector_constant(const PODArray<FromFieldType> & vec_from, const std::string & data,
|
||
ColumnString & vec_to)
|
||
{
|
||
const auto & local_date_lut = DateLUT::instance();
|
||
const auto & remote_date_lut = DateLUT::instance(data);
|
||
|
||
ColumnString::Chars_t & data_to = vec_to.getChars();
|
||
ColumnString::Offsets_t & offsets_to = vec_to.getOffsets();
|
||
size_t size = vec_from.size();
|
||
data_to.resize(size * 2);
|
||
offsets_to.resize(size);
|
||
|
||
WriteBufferFromVector<ColumnString::Chars_t> write_buffer(data_to);
|
||
|
||
for (size_t i = 0; i < size; ++i)
|
||
{
|
||
auto ti = convertTimestamp(vec_from[i], remote_date_lut, local_date_lut);
|
||
formatImpl<DataTypeDateTime>(ti, write_buffer);
|
||
writeChar(0, write_buffer);
|
||
offsets_to[i] = write_buffer.count();
|
||
}
|
||
data_to.resize(write_buffer.count());
|
||
}
|
||
|
||
static void vector_constant(const PODArray<FromFieldType> & vec_from, ColumnString & vec_to)
|
||
{
|
||
ColumnString::Chars_t & data_to = vec_to.getChars();
|
||
ColumnString::Offsets_t & offsets_to = vec_to.getOffsets();
|
||
size_t size = vec_from.size();
|
||
data_to.resize(size * 2);
|
||
offsets_to.resize(size);
|
||
|
||
WriteBufferFromVector<ColumnString::Chars_t> write_buffer(data_to);
|
||
|
||
for (size_t i = 0; i < size; ++i)
|
||
{
|
||
formatImpl<DataTypeDateTime>(vec_from[i], write_buffer);
|
||
writeChar(0, write_buffer);
|
||
offsets_to[i] = write_buffer.count();
|
||
}
|
||
data_to.resize(write_buffer.count());
|
||
}
|
||
|
||
static void constant_vector(FromFieldType from, const ColumnString::Chars_t & data,
|
||
const ColumnString::Offsets_t & offsets,
|
||
ColumnString & vec_to)
|
||
{
|
||
const auto & local_date_lut = DateLUT::instance();
|
||
|
||
ColumnString::Chars_t & data_to = vec_to.getChars();
|
||
ColumnString::Offsets_t & offsets_to = vec_to.getOffsets();
|
||
size_t size = offsets.size();
|
||
data_to.resize(size * 2);
|
||
offsets_to.resize(size);
|
||
|
||
WriteBufferFromVector<ColumnString::Chars_t> write_buffer(data_to);
|
||
|
||
ColumnString::Offset_t prev_offset = 0;
|
||
|
||
for (size_t i = 0; i < size; ++i)
|
||
{
|
||
ColumnString::Offset_t cur_offset = offsets[i];
|
||
const std::string time_zone(reinterpret_cast<const char *>(&data[prev_offset]), cur_offset - prev_offset - 1);
|
||
const auto & remote_date_lut = DateLUT::instance(time_zone);
|
||
|
||
auto ti = convertTimestamp(from, remote_date_lut, local_date_lut);
|
||
formatImpl<DataTypeDateTime>(ti, write_buffer);
|
||
writeChar(0, write_buffer);
|
||
offsets_to[i] = write_buffer.count();
|
||
|
||
prev_offset = cur_offset;
|
||
}
|
||
data_to.resize(write_buffer.count());
|
||
}
|
||
|
||
static void constant_constant(FromFieldType from, const std::string & data, std::string & to)
|
||
{
|
||
const auto & local_date_lut = DateLUT::instance();
|
||
const auto & remote_date_lut = DateLUT::instance(data);
|
||
|
||
std::vector<char> buf;
|
||
WriteBufferFromVector<std::vector<char> > write_buffer(buf);
|
||
auto ti = convertTimestamp(from, remote_date_lut, local_date_lut);
|
||
formatImpl<DataTypeDateTime>(ti, write_buffer);
|
||
to = std::string(&buf[0], write_buffer.count());
|
||
}
|
||
|
||
static void constant_constant(FromFieldType from, std::string & to)
|
||
{
|
||
std::vector<char> buf;
|
||
WriteBufferFromVector<std::vector<char> > write_buffer(buf);
|
||
formatImpl<DataTypeDateTime>(from, write_buffer);
|
||
to = std::string(&buf[0], write_buffer.count());
|
||
}
|
||
};
|
||
|
||
}}
|
||
|
||
template<typename Name>
|
||
struct ConvertImpl<DataTypeDateTime, DataTypeString, Name>
|
||
{
|
||
using Op = details::DateTimeToStringConverter;
|
||
using FromFieldType = Op::FromFieldType;
|
||
|
||
static void execute(Block & block, const ColumnNumbers & arguments, size_t result)
|
||
{
|
||
const ColumnPtr source_col = block.getByPosition(arguments[0]).column;
|
||
const auto * sources = typeid_cast<const ColumnVector<FromFieldType> *>(&*source_col);
|
||
const auto * const_source = typeid_cast<const ColumnConst<FromFieldType> *>(&*source_col);
|
||
|
||
if (arguments.size() == 1)
|
||
{
|
||
if (sources)
|
||
{
|
||
ColumnString * col_to = new ColumnString;
|
||
block.getByPosition(result).column = col_to;
|
||
|
||
auto & vec_from = sources->getData();
|
||
auto & vec_to = *col_to;
|
||
|
||
Op::vector_constant(vec_from, vec_to);
|
||
}
|
||
else if (const_source)
|
||
{
|
||
std::string res;
|
||
Op::constant_constant(const_source->getData(), res);
|
||
block.getByPosition(result).column = new ColumnConstString(const_source->size(), res);
|
||
}
|
||
else
|
||
{
|
||
throw Exception("Illegal column " + block.getByPosition(arguments[0]).column->getName()
|
||
+ " of first argument of function " + Name::name,
|
||
ErrorCodes::ILLEGAL_COLUMN);
|
||
}
|
||
}
|
||
else if (arguments.size() == 2)
|
||
{
|
||
const ColumnPtr time_zone_col = block.getByPosition(arguments[1]).column;
|
||
const auto * time_zones = typeid_cast<const ColumnString *>(&*time_zone_col);
|
||
const auto * const_time_zone = typeid_cast<const ColumnConstString *>(&*time_zone_col);
|
||
|
||
if (sources)
|
||
{
|
||
ColumnString * col_to = new ColumnString;
|
||
block.getByPosition(result).column = col_to;
|
||
|
||
auto & vec_from = sources->getData();
|
||
auto & vec_to = *col_to;
|
||
|
||
if (time_zones)
|
||
Op::vector_vector(vec_from, time_zones->getChars(), time_zones->getOffsets(), vec_to);
|
||
else if (const_time_zone)
|
||
Op::vector_constant(vec_from, const_time_zone->getData(), vec_to);
|
||
else
|
||
throw Exception("Illegal column " + block.getByPosition(arguments[1]).column->getName()
|
||
+ " of second argument of function " + Name::name,
|
||
ErrorCodes::ILLEGAL_COLUMN);
|
||
}
|
||
else if (const_source)
|
||
{
|
||
if (time_zones)
|
||
{
|
||
ColumnString * col_to = new ColumnString;
|
||
block.getByPosition(result).column = col_to;
|
||
auto & vec_to = *col_to;
|
||
|
||
Op::constant_vector(const_source->getData(), time_zones->getChars(), time_zones->getOffsets(), vec_to);
|
||
}
|
||
else if (const_time_zone)
|
||
{
|
||
std::string res;
|
||
Op::constant_constant(const_source->getData(), const_time_zone->getData(), res);
|
||
block.getByPosition(result).column = new ColumnConstString(const_source->size(), res);
|
||
}
|
||
else
|
||
throw Exception("Illegal column " + block.getByPosition(arguments[1]).column->getName()
|
||
+ " of second argument of function " + Name::name,
|
||
ErrorCodes::ILLEGAL_COLUMN);
|
||
}
|
||
else
|
||
throw Exception("Illegal column " + block.getByPosition(arguments[0]).column->getName()
|
||
+ " of first argument of function " + Name::name,
|
||
ErrorCodes::ILLEGAL_COLUMN);
|
||
}
|
||
else
|
||
throw Exception("Internal error.", ErrorCodes::LOGICAL_ERROR);
|
||
}
|
||
};
|
||
|
||
/** Преобразование строк в числа, даты, даты-с-временем: через парсинг.
|
||
*/
|
||
template <typename DataType> void parseImpl(typename DataType::FieldType & x, ReadBuffer & rb) { readText(x,rb); }
|
||
|
||
template <> inline void parseImpl<DataTypeDate>(DataTypeDate::FieldType & x, ReadBuffer & rb)
|
||
{
|
||
DayNum_t tmp(0);
|
||
readDateText(tmp, rb);
|
||
x = tmp;
|
||
}
|
||
|
||
template <> inline void parseImpl<DataTypeDateTime>(DataTypeDateTime::FieldType & x, ReadBuffer & rb)
|
||
{
|
||
time_t tmp = 0;
|
||
readDateTimeText(tmp, rb);
|
||
x = tmp;
|
||
}
|
||
|
||
template <typename ToDataType, typename Name>
|
||
struct ConvertImpl<DataTypeString, ToDataType, Name>
|
||
{
|
||
typedef typename ToDataType::FieldType ToFieldType;
|
||
|
||
static void execute(Block & block, const ColumnNumbers & arguments, size_t result)
|
||
{
|
||
if (const ColumnString * col_from = typeid_cast<const ColumnString *>(&*block.getByPosition(arguments[0]).column))
|
||
{
|
||
ColumnVector<ToFieldType> * col_to = new ColumnVector<ToFieldType>;
|
||
block.getByPosition(result).column = col_to;
|
||
|
||
const ColumnString::Chars_t & data_from = col_from->getChars();
|
||
typename ColumnVector<ToFieldType>::Container_t & vec_to = col_to->getData();
|
||
size_t size = col_from->size();
|
||
vec_to.resize(size);
|
||
|
||
ReadBuffer read_buffer(const_cast<char *>(reinterpret_cast<const char *>(&data_from[0])), data_from.size(), 0);
|
||
|
||
char zero = 0;
|
||
for (size_t i = 0; i < size; ++i)
|
||
{
|
||
parseImpl<ToDataType>(vec_to[i], read_buffer);
|
||
readChar(zero, read_buffer);
|
||
if (zero != 0)
|
||
throw Exception("Cannot parse from string.", ErrorCodes::CANNOT_PARSE_NUMBER);
|
||
}
|
||
}
|
||
else if (const ColumnConstString * col_from = typeid_cast<const ColumnConstString *>(&*block.getByPosition(arguments[0]).column))
|
||
{
|
||
const String & s = col_from->getData();
|
||
ReadBufferFromString read_buffer(s);
|
||
ToFieldType x = 0;
|
||
parseImpl<ToDataType>(x, read_buffer);
|
||
block.getByPosition(result).column = new ColumnConst<ToFieldType>(col_from->size(), x);
|
||
}
|
||
else
|
||
throw Exception("Illegal column " + block.getByPosition(arguments[0]).column->getName()
|
||
+ " of first argument of function " + Name::name,
|
||
ErrorCodes::ILLEGAL_COLUMN);
|
||
}
|
||
};
|
||
|
||
namespace details { namespace {
|
||
|
||
/** Функции для преобразования строк в timestamp.
|
||
*/
|
||
struct StringToTimestampConverter
|
||
{
|
||
using ToFieldType = typename DataTypeInt32::FieldType;
|
||
|
||
static void vector_vector(const ColumnString::Chars_t & vec_from, const ColumnString::Chars_t & data,
|
||
const ColumnString::Offsets_t & offsets, PODArray<ToFieldType> & vec_to)
|
||
{
|
||
const auto & local_date_lut = DateLUT::instance();
|
||
ReadBuffer read_buffer(const_cast<char *>(reinterpret_cast<const char *>(&vec_from[0])), vec_from.size(), 0);
|
||
|
||
ColumnString::Offset_t prev_offset = 0;
|
||
|
||
char zero = 0;
|
||
for (size_t i = 0; i < vec_to.size(); ++i)
|
||
{
|
||
DataTypeDateTime::FieldType x = 0;
|
||
parseImpl<DataTypeDateTime>(x, read_buffer);
|
||
|
||
ColumnString::Offset_t cur_offset = offsets[i];
|
||
const std::string time_zone(reinterpret_cast<const char *>(&data[prev_offset]), cur_offset - prev_offset - 1);
|
||
const auto & remote_date_lut = DateLUT::instance(time_zone);
|
||
|
||
auto ti = convertTimestamp(x, local_date_lut, remote_date_lut);
|
||
|
||
vec_to[i] = ti;
|
||
readChar(zero, read_buffer);
|
||
if (zero != 0)
|
||
throw Exception("Cannot parse from string.", ErrorCodes::CANNOT_PARSE_NUMBER);
|
||
|
||
prev_offset = cur_offset;
|
||
}
|
||
}
|
||
|
||
static void vector_constant(const ColumnString::Chars_t & vec_from, const std::string & data,
|
||
PODArray<ToFieldType> & vec_to)
|
||
{
|
||
const auto & local_date_lut = DateLUT::instance();
|
||
const auto & remote_date_lut = DateLUT::instance(data);
|
||
ReadBuffer read_buffer(const_cast<char *>(reinterpret_cast<const char *>(&vec_from[0])), vec_from.size(), 0);
|
||
|
||
char zero = 0;
|
||
for (size_t i = 0; i < vec_to.size(); ++i)
|
||
{
|
||
DataTypeDateTime::FieldType x = 0;
|
||
parseImpl<DataTypeDateTime>(x, read_buffer);
|
||
|
||
auto ti = convertTimestamp(x, local_date_lut, remote_date_lut);
|
||
|
||
vec_to[i] = ti;
|
||
readChar(zero, read_buffer);
|
||
if (zero != 0)
|
||
throw Exception("Cannot parse from string.", ErrorCodes::CANNOT_PARSE_NUMBER);
|
||
}
|
||
}
|
||
|
||
static void vector_constant(const ColumnString::Chars_t & vec_from, PODArray<ToFieldType> & vec_to)
|
||
{
|
||
ReadBuffer read_buffer(const_cast<char *>(reinterpret_cast<const char *>(&vec_from[0])), vec_from.size(), 0);
|
||
|
||
char zero = 0;
|
||
for (size_t i = 0; i < vec_to.size(); ++i)
|
||
{
|
||
DataTypeDateTime::FieldType x = 0;
|
||
parseImpl<DataTypeDateTime>(x, read_buffer);
|
||
vec_to[i] = x;
|
||
readChar(zero, read_buffer);
|
||
if (zero != 0)
|
||
throw Exception("Cannot parse from string.", ErrorCodes::CANNOT_PARSE_NUMBER);
|
||
}
|
||
}
|
||
|
||
static void constant_vector(const std::string & from, const ColumnString::Chars_t & data,
|
||
const ColumnString::Offsets_t & offsets, PODArray<ToFieldType> & vec_to)
|
||
{
|
||
const auto & local_date_lut = DateLUT::instance();
|
||
|
||
ReadBufferFromString read_buffer(from);
|
||
DataTypeDateTime::FieldType x = 0;
|
||
parseImpl<DataTypeDateTime>(x, read_buffer);
|
||
|
||
ColumnString::Offset_t prev_offset = 0;
|
||
|
||
for (size_t i = 0; i < offsets.size(); ++i)
|
||
{
|
||
ColumnString::Offset_t cur_offset = offsets[i];
|
||
const std::string time_zone(reinterpret_cast<const char *>(&data[prev_offset]), cur_offset - prev_offset - 1);
|
||
const auto & remote_date_lut = DateLUT::instance(time_zone);
|
||
|
||
auto ti = convertTimestamp(x, local_date_lut, remote_date_lut);
|
||
|
||
vec_to[i] = ti;
|
||
prev_offset = cur_offset;
|
||
}
|
||
}
|
||
|
||
static void constant_constant(const std::string & from, const std::string & data, ToFieldType & to)
|
||
{
|
||
const auto & local_date_lut = DateLUT::instance();
|
||
const auto & remote_date_lut = DateLUT::instance(data);
|
||
|
||
ReadBufferFromString read_buffer(from);
|
||
DataTypeDateTime::FieldType x = 0;
|
||
parseImpl<DataTypeDateTime>(x, read_buffer);
|
||
|
||
to = convertTimestamp(x, local_date_lut, remote_date_lut);
|
||
}
|
||
|
||
static void constant_constant(const std::string & from, ToFieldType & to)
|
||
{
|
||
ReadBufferFromString read_buffer(from);
|
||
DataTypeDateTime::FieldType x = 0;
|
||
parseImpl<DataTypeDateTime>(x, read_buffer);
|
||
to = x;
|
||
}
|
||
};
|
||
|
||
}}
|
||
|
||
struct NameToUnixTimestamp { static constexpr auto name = "toUnixTimestamp"; };
|
||
|
||
template<>
|
||
struct ConvertImpl<DataTypeString, DataTypeInt32, NameToUnixTimestamp>
|
||
{
|
||
using Op = details::StringToTimestampConverter;
|
||
using ToFieldType = Op::ToFieldType;
|
||
|
||
static void execute(Block & block, const ColumnNumbers & arguments, size_t result)
|
||
{
|
||
const ColumnPtr source_col = block.getByPosition(arguments[0]).column;
|
||
const auto * sources = typeid_cast<const ColumnString *>(&*source_col);
|
||
const auto * const_source = typeid_cast<const ColumnConstString *>(&*source_col);
|
||
|
||
if (arguments.size() == 1)
|
||
{
|
||
if (sources)
|
||
{
|
||
auto * col_to = new ColumnVector<ToFieldType>;
|
||
block.getByPosition(result).column = col_to;
|
||
|
||
auto & vec_from = sources->getChars();
|
||
auto & vec_to = col_to->getData();
|
||
size_t size = sources->size();
|
||
vec_to.resize(size);
|
||
|
||
Op::vector_constant(vec_from, vec_to);
|
||
}
|
||
else if (const_source)
|
||
{
|
||
ToFieldType res;
|
||
Op::constant_constant(const_source->getData(), res);
|
||
block.getByPosition(result).column = new ColumnConst<ToFieldType>(const_source->size(), res);
|
||
}
|
||
else
|
||
{
|
||
throw Exception("Illegal column " + block.getByPosition(arguments[0]).column->getName()
|
||
+ " of first argument of function " + NameToUnixTimestamp::name,
|
||
ErrorCodes::ILLEGAL_COLUMN);
|
||
}
|
||
}
|
||
else if (arguments.size() == 2)
|
||
{
|
||
const ColumnPtr time_zone_col = block.getByPosition(arguments[1]).column;
|
||
const auto * time_zones = typeid_cast<const ColumnString *>(&*time_zone_col);
|
||
const auto * const_time_zone = typeid_cast<const ColumnConstString *>(&*time_zone_col);
|
||
|
||
if (sources)
|
||
{
|
||
auto * col_to = new ColumnVector<ToFieldType>;
|
||
block.getByPosition(result).column = col_to;
|
||
|
||
auto & vec_from = sources->getChars();
|
||
auto & vec_to = col_to->getData();
|
||
size_t size = sources->size();
|
||
vec_to.resize(size);
|
||
|
||
if (time_zones)
|
||
Op::vector_vector(vec_from, time_zones->getChars(), time_zones->getOffsets(), vec_to);
|
||
else if (const_time_zone)
|
||
Op::vector_constant(vec_from, const_time_zone->getData(), vec_to);
|
||
else
|
||
throw Exception("Illegal column " + block.getByPosition(arguments[1]).column->getName()
|
||
+ " of second argument of function " + NameToUnixTimestamp::name,
|
||
ErrorCodes::ILLEGAL_COLUMN);
|
||
}
|
||
else if (const_source)
|
||
{
|
||
if (time_zones)
|
||
{
|
||
auto * col_to = new ColumnVector<ToFieldType>;
|
||
block.getByPosition(result).column = col_to;
|
||
|
||
auto & vec_to = col_to->getData();
|
||
vec_to.resize(time_zones->getOffsets().size());
|
||
|
||
Op::constant_vector(const_source->getData(), time_zones->getChars(), time_zones->getOffsets(), vec_to);
|
||
}
|
||
else if (const_time_zone)
|
||
{
|
||
ToFieldType res;
|
||
Op::constant_constant(const_source->getData(), const_time_zone->getData(), res);
|
||
block.getByPosition(result).column = new ColumnConst<ToFieldType>(const_source->size(), res);
|
||
}
|
||
else
|
||
throw Exception("Illegal column " + block.getByPosition(arguments[1]).column->getName()
|
||
+ " of second argument of function " + NameToUnixTimestamp::name,
|
||
ErrorCodes::ILLEGAL_COLUMN);
|
||
}
|
||
else
|
||
throw Exception("Illegal column " + block.getByPosition(arguments[0]).column->getName()
|
||
+ " of first argument of function " + NameToUnixTimestamp::name,
|
||
ErrorCodes::ILLEGAL_COLUMN);
|
||
}
|
||
else
|
||
throw Exception("Internal error.", ErrorCodes::LOGICAL_ERROR);
|
||
}
|
||
};
|
||
|
||
|
||
/** Если типы совпадают - просто скопируем ссылку на столбец.
|
||
*/
|
||
template <typename Name>
|
||
struct ConvertImpl<DataTypeString, DataTypeString, Name>
|
||
{
|
||
static void execute(Block & block, const ColumnNumbers & arguments, size_t result)
|
||
{
|
||
block.getByPosition(result).column = block.getByPosition(arguments[0]).column;
|
||
}
|
||
};
|
||
|
||
|
||
/** Преобразование из FixedString.
|
||
*/
|
||
template <typename ToDataType, typename Name>
|
||
struct ConvertImpl<DataTypeFixedString, ToDataType, Name>
|
||
{
|
||
typedef typename ToDataType::FieldType ToFieldType;
|
||
|
||
static void execute(Block & block, const ColumnNumbers & arguments, size_t result)
|
||
{
|
||
if (const ColumnFixedString * col_from = typeid_cast<const ColumnFixedString *>(&*block.getByPosition(arguments[0]).column))
|
||
{
|
||
ColumnVector<ToFieldType> * col_to = new ColumnVector<ToFieldType>;
|
||
block.getByPosition(result).column = col_to;
|
||
|
||
const ColumnFixedString::Chars_t & data_from = col_from->getChars();
|
||
size_t n = col_from->getN();
|
||
typename ColumnVector<ToFieldType>::Container_t & vec_to = col_to->getData();
|
||
size_t size = col_from->size();
|
||
vec_to.resize(size);
|
||
|
||
for (size_t i = 0; i < size; ++i)
|
||
{
|
||
char * begin = const_cast<char *>(reinterpret_cast<const char *>(&data_from[i * n]));
|
||
char * end = begin + n;
|
||
ReadBuffer read_buffer(begin, n, 0);
|
||
parseImpl<ToDataType>(vec_to[i], read_buffer);
|
||
|
||
if (!read_buffer.eof())
|
||
{
|
||
while (read_buffer.position() < end && *read_buffer.position() == 0)
|
||
++read_buffer.position();
|
||
|
||
if (read_buffer.position() < end)
|
||
throw Exception("Cannot parse from fixed string.", ErrorCodes::CANNOT_PARSE_NUMBER);
|
||
}
|
||
}
|
||
}
|
||
else if (typeid_cast<const ColumnConstString *>(&*block.getByPosition(arguments[0]).column))
|
||
{
|
||
ConvertImpl<DataTypeString, ToDataType, Name>::execute(block, arguments, result);
|
||
}
|
||
else
|
||
throw Exception("Illegal column " + block.getByPosition(arguments[0]).column->getName()
|
||
+ " of first argument of function " + Name::name,
|
||
ErrorCodes::ILLEGAL_COLUMN);
|
||
}
|
||
};
|
||
|
||
/** Преобразование из FixedString в String.
|
||
* При этом, вырезаются последовательности нулевых байт с конца строк.
|
||
*/
|
||
template <typename Name>
|
||
struct ConvertImpl<DataTypeFixedString, DataTypeString, Name>
|
||
{
|
||
static void execute(Block & block, const ColumnNumbers & arguments, size_t result)
|
||
{
|
||
if (const ColumnFixedString * col_from = typeid_cast<const ColumnFixedString *>(&*block.getByPosition(arguments[0]).column))
|
||
{
|
||
ColumnString * col_to = new ColumnString;
|
||
block.getByPosition(result).column = col_to;
|
||
|
||
const ColumnFixedString::Chars_t & data_from = col_from->getChars();
|
||
ColumnString::Chars_t & data_to = col_to->getChars();
|
||
ColumnString::Offsets_t & offsets_to = col_to->getOffsets();
|
||
size_t size = col_from->size();
|
||
size_t n = col_from->getN();
|
||
data_to.resize(size * (n + 1)); /// + 1 - нулевой байт
|
||
offsets_to.resize(size);
|
||
|
||
size_t offset_from = 0;
|
||
size_t offset_to = 0;
|
||
for (size_t i = 0; i < size; ++i)
|
||
{
|
||
size_t bytes_to_copy = n;
|
||
while (bytes_to_copy > 0 && data_from[offset_from + bytes_to_copy - 1] == 0)
|
||
--bytes_to_copy;
|
||
|
||
memcpy(&data_to[offset_to], &data_from[offset_from], bytes_to_copy);
|
||
offset_from += n;
|
||
offset_to += bytes_to_copy;
|
||
data_to[offset_to] = 0;
|
||
++offset_to;
|
||
offsets_to[i] = offset_to;
|
||
}
|
||
|
||
data_to.resize(offset_to);
|
||
}
|
||
else if (const ColumnConstString * col_from = typeid_cast<const ColumnConstString *>(&*block.getByPosition(arguments[0]).column))
|
||
{
|
||
const String & s = col_from->getData();
|
||
|
||
size_t bytes_to_copy = s.size();
|
||
while (bytes_to_copy > 0 && s[bytes_to_copy - 1] == 0)
|
||
--bytes_to_copy;
|
||
|
||
block.getByPosition(result).column = new ColumnConstString(col_from->size(), s.substr(0, bytes_to_copy));
|
||
}
|
||
else
|
||
throw Exception("Illegal column " + block.getByPosition(arguments[0]).column->getName()
|
||
+ " of first argument of function " + Name::name,
|
||
ErrorCodes::ILLEGAL_COLUMN);
|
||
}
|
||
};
|
||
|
||
/// Предварительное объявление.
|
||
struct NameToDate { static constexpr auto name = "toDate"; };
|
||
|
||
template <typename ToDataType, typename Name, typename Monotonic>
|
||
class FunctionConvert : public IFunction
|
||
{
|
||
public:
|
||
static constexpr auto name = Name::name;
|
||
static IFunction * create(const Context & context) { return new FunctionConvert; }
|
||
|
||
/// Получить имя функции.
|
||
String getName() const override
|
||
{
|
||
return name;
|
||
}
|
||
|
||
/// Получить тип результата по типам аргументов. Если функция неприменима для данных аргументов - кинуть исключение.
|
||
DataTypePtr getReturnType(const DataTypes & arguments) const override
|
||
{
|
||
return getReturnTypeImpl(arguments);
|
||
}
|
||
|
||
/// Выполнить функцию над блоком.
|
||
void execute(Block & block, const ColumnNumbers & arguments, size_t result) override
|
||
{
|
||
IDataType * from_type = &*block.getByPosition(arguments[0]).type;
|
||
|
||
if (typeid_cast<const DataTypeUInt8 * >(from_type)) ConvertImpl<DataTypeUInt8, ToDataType, Name>::execute(block, arguments, result);
|
||
else if (typeid_cast<const DataTypeUInt16 * >(from_type)) ConvertImpl<DataTypeUInt16, ToDataType, Name>::execute(block, arguments, result);
|
||
else if (typeid_cast<const DataTypeUInt32 * >(from_type)) ConvertImpl<DataTypeUInt32, ToDataType, Name>::execute(block, arguments, result);
|
||
else if (typeid_cast<const DataTypeUInt64 * >(from_type)) ConvertImpl<DataTypeUInt64, ToDataType, Name>::execute(block, arguments, result);
|
||
else if (typeid_cast<const DataTypeInt8 * >(from_type)) ConvertImpl<DataTypeInt8, ToDataType, Name>::execute(block, arguments, result);
|
||
else if (typeid_cast<const DataTypeInt16 * >(from_type)) ConvertImpl<DataTypeInt16, ToDataType, Name>::execute(block, arguments, result);
|
||
else if (typeid_cast<const DataTypeInt32 * >(from_type)) ConvertImpl<DataTypeInt32, ToDataType, Name>::execute(block, arguments, result);
|
||
else if (typeid_cast<const DataTypeInt64 * >(from_type)) ConvertImpl<DataTypeInt64, ToDataType, Name>::execute(block, arguments, result);
|
||
else if (typeid_cast<const DataTypeFloat32 * >(from_type)) ConvertImpl<DataTypeFloat32, ToDataType, Name>::execute(block, arguments, result);
|
||
else if (typeid_cast<const DataTypeFloat64 * >(from_type)) ConvertImpl<DataTypeFloat64, ToDataType, Name>::execute(block, arguments, result);
|
||
else if (typeid_cast<const DataTypeDate * >(from_type)) ConvertImpl<DataTypeDate, ToDataType, Name>::execute(block, arguments, result);
|
||
else if (typeid_cast<const DataTypeDateTime * >(from_type)) ConvertImpl<DataTypeDateTime, ToDataType, Name>::execute(block, arguments, result);
|
||
else if (typeid_cast<const DataTypeString * >(from_type)) ConvertImpl<DataTypeString, ToDataType, Name>::execute(block, arguments, result);
|
||
else if (typeid_cast<const DataTypeFixedString *>(from_type)) ConvertImpl<DataTypeFixedString, ToDataType, Name>::execute(block, arguments, result);
|
||
else
|
||
throw Exception("Illegal type " + block.getByPosition(arguments[0]).type->getName() + " of argument of function " + getName(),
|
||
ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT);
|
||
}
|
||
|
||
bool hasInformationAboutMonotonicity() const override
|
||
{
|
||
return Monotonic::has();
|
||
}
|
||
|
||
Monotonicity getMonotonicityForRange(const IDataType & type, const Field & left, const Field & right) const override
|
||
{
|
||
return Monotonic::get(type, left, right);
|
||
}
|
||
|
||
private:
|
||
template<typename ToDataType2 = ToDataType, typename Name2 = Name>
|
||
DataTypePtr getReturnTypeImpl(const DataTypes & arguments,
|
||
typename std::enable_if<!(std::is_same<ToDataType2, DataTypeString>::value ||
|
||
std::is_same<Name2, NameToUnixTimestamp>::value ||
|
||
std::is_same<Name2, NameToDate>::value)>::type * = nullptr) const
|
||
{
|
||
if (arguments.size() != 1)
|
||
throw Exception("Number of arguments for function " + getName() + " doesn't match: passed "
|
||
+ toString(arguments.size()) + ", should be 1.",
|
||
ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH);
|
||
|
||
return new ToDataType;
|
||
}
|
||
|
||
template<typename ToDataType2 = ToDataType, typename Name2 = Name>
|
||
DataTypePtr getReturnTypeImpl(const DataTypes & arguments,
|
||
typename std::enable_if<std::is_same<ToDataType2, DataTypeString>::value>::type * = nullptr) const
|
||
{
|
||
if ((arguments.size() < 1) || (arguments.size() > 2))
|
||
throw Exception("Number of arguments for function " + getName() + " doesn't match: passed "
|
||
+ toString(arguments.size()) + ", should be 1 or 2.",
|
||
ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH);
|
||
|
||
if (typeid_cast<const DataTypeDateTime *>(&*arguments[0]) == nullptr)
|
||
{
|
||
if (arguments.size() != 1)
|
||
throw Exception("Number of arguments for function " + getName() + " doesn't match: passed "
|
||
+ toString(arguments.size()) + ", should be 1.",
|
||
ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH);
|
||
}
|
||
else if ((arguments.size() == 2) && (typeid_cast<const DataTypeString *>(&*arguments[1]) == nullptr))
|
||
{
|
||
throw Exception{
|
||
"Illegal type " + arguments[1]->getName() + " of argument of function " + getName(),
|
||
ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT
|
||
};
|
||
}
|
||
|
||
return new ToDataType2;
|
||
}
|
||
|
||
template<typename ToDataType2 = ToDataType, typename Name2 = Name>
|
||
DataTypePtr getReturnTypeImpl(const DataTypes & arguments,
|
||
typename std::enable_if<std::is_same<Name2, NameToUnixTimestamp>::value, void>::type * = nullptr) const
|
||
{
|
||
if ((arguments.size() < 1) || (arguments.size() > 2))
|
||
throw Exception("Number of arguments for function " + getName() + " doesn't match: passed "
|
||
+ toString(arguments.size()) + ", should be 1 or 2.",
|
||
ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH);
|
||
|
||
if (typeid_cast<const DataTypeString *>(&*arguments[0]) == nullptr)
|
||
{
|
||
if (arguments.size() != 1)
|
||
throw Exception("Number of arguments for function " + getName() + " doesn't match: passed "
|
||
+ toString(arguments.size()) + ", should be 1.",
|
||
ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH);
|
||
}
|
||
else if ((arguments.size() == 2) && (typeid_cast<const DataTypeString *>(&*arguments[1]) == nullptr))
|
||
{
|
||
throw Exception{
|
||
"Illegal type " + arguments[1]->getName() + " of argument of function " + getName(),
|
||
ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT
|
||
};
|
||
}
|
||
|
||
return new ToDataType2;
|
||
}
|
||
|
||
template<typename ToDataType2 = ToDataType, typename Name2 = Name>
|
||
DataTypePtr getReturnTypeImpl(const DataTypes & arguments,
|
||
typename std::enable_if<std::is_same<Name2, NameToDate>::value>::type * = nullptr) const
|
||
{
|
||
if ((arguments.size() < 1) || (arguments.size() > 2))
|
||
throw Exception("Number of arguments for function " + getName() + " doesn't match: passed "
|
||
+ toString(arguments.size()) + ", should be 1 or 2.",
|
||
ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH);
|
||
|
||
if ((arguments.size() == 2) && (typeid_cast<const DataTypeString *>(&*arguments[1]) == nullptr))
|
||
{
|
||
throw Exception{
|
||
"Illegal type " + arguments[1]->getName() + " of 2nd argument of function " + getName(),
|
||
ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT
|
||
};
|
||
}
|
||
|
||
return new ToDataType2;
|
||
}
|
||
};
|
||
|
||
|
||
/** Преобразование в строку фиксированной длины реализовано только из строк.
|
||
*/
|
||
class FunctionToFixedString : public IFunction
|
||
{
|
||
public:
|
||
static constexpr auto name = "toFixedString";
|
||
static IFunction * create(const Context & context) { return new FunctionToFixedString; };
|
||
|
||
/// Получить имя функции.
|
||
String getName() const override
|
||
{
|
||
return name;
|
||
}
|
||
|
||
/** Получить тип результата по типам аргументов и значениям константных аргументов.
|
||
* Если функция неприменима для данных аргументов - кинуть исключение.
|
||
* Для неконстантных столбцов arguments[i].column = nullptr.
|
||
*/
|
||
void getReturnTypeAndPrerequisites(const ColumnsWithTypeAndName & arguments,
|
||
DataTypePtr & out_return_type,
|
||
std::vector<ExpressionAction> & out_prerequisites) override
|
||
{
|
||
if (arguments.size() != 2)
|
||
throw Exception("Number of arguments for function " + getName() + " doesn't match: passed "
|
||
+ toString(arguments.size()) + ", should be 2.",
|
||
ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH);
|
||
if (!arguments[1].column)
|
||
throw Exception("Second argument for function " + getName() + " must be constant", ErrorCodes::ILLEGAL_COLUMN);
|
||
if (!typeid_cast<const DataTypeString *>(arguments[0].type.get()) &&
|
||
!typeid_cast<const DataTypeFixedString *>(arguments[0].type.get()))
|
||
throw Exception(getName() + " is only implemented for types String and FixedString", ErrorCodes::NOT_IMPLEMENTED);
|
||
|
||
const size_t n = getSize(arguments[1]);
|
||
|
||
out_return_type = new DataTypeFixedString(n);
|
||
}
|
||
|
||
/// Выполнить функцию над блоком.
|
||
void execute(Block & block, const ColumnNumbers & arguments, size_t result) override
|
||
{
|
||
ColumnPtr column = block.getByPosition(arguments[0]).column;
|
||
size_t n = getSize(block.getByPosition(arguments[1]));
|
||
|
||
if (const ColumnConstString * column_const = typeid_cast<const ColumnConstString *>(&*column))
|
||
{
|
||
if (column_const->getData().size() > n)
|
||
throw Exception("String too long for type FixedString(" + toString(n) + ")",
|
||
ErrorCodes::TOO_LARGE_STRING_SIZE);
|
||
|
||
auto resized_string = column_const->getData();
|
||
resized_string.resize(n);
|
||
|
||
block.getByPosition(result).column = new ColumnConst<String>(column_const->size(), std::move(resized_string), new DataTypeFixedString(n));
|
||
}
|
||
else if (const ColumnString * column_string = typeid_cast<const ColumnString *>(&*column))
|
||
{
|
||
ColumnFixedString * column_fixed = new ColumnFixedString(n);
|
||
ColumnPtr result_ptr = column_fixed;
|
||
ColumnFixedString::Chars_t & out_chars = column_fixed->getChars();
|
||
const ColumnString::Chars_t & in_chars = column_string->getChars();
|
||
const ColumnString::Offsets_t & in_offsets = column_string->getOffsets();
|
||
out_chars.resize_fill(in_offsets.size() * n);
|
||
for (size_t i = 0; i < in_offsets.size(); ++i)
|
||
{
|
||
size_t off = i ? in_offsets[i - 1] : 0;
|
||
size_t len = in_offsets[i] - off - 1;
|
||
if (len > n)
|
||
throw Exception("String too long for type FixedString(" + toString(n) + ")",
|
||
ErrorCodes::TOO_LARGE_STRING_SIZE);
|
||
memcpy(&out_chars[i * n], &in_chars[off], len);
|
||
}
|
||
block.getByPosition(result).column = result_ptr;
|
||
}
|
||
else if (const auto column_fixed_string = typeid_cast<const ColumnFixedString *>(column.get()))
|
||
{
|
||
const auto src_n = column_fixed_string->getN();
|
||
if (src_n > n)
|
||
throw Exception{
|
||
"String too long for type FixedString(" + toString(n) + ")",
|
||
ErrorCodes::TOO_LARGE_STRING_SIZE
|
||
};
|
||
|
||
const auto column_fixed = new ColumnFixedString{n};
|
||
block.getByPosition(result).column = column_fixed;
|
||
|
||
auto & out_chars = column_fixed->getChars();
|
||
const auto & in_chars = column_fixed_string->getChars();
|
||
const auto size = column_fixed_string->size();
|
||
out_chars.resize_fill(size * n);
|
||
|
||
for (const auto i : ext::range(0, size))
|
||
memcpy(&out_chars[i * n], &in_chars[i * src_n], src_n);
|
||
}
|
||
else
|
||
throw Exception("Unexpected column: " + column->getName(), ErrorCodes::ILLEGAL_COLUMN);
|
||
}
|
||
|
||
private:
|
||
template <typename T>
|
||
bool getSizeTyped(const ColumnWithTypeAndName & column, size_t & out_size)
|
||
{
|
||
if (!typeid_cast<const typename DataTypeFromFieldType<T>::Type *>(&*column.type))
|
||
return false;
|
||
const ColumnConst<T> * column_const = typeid_cast<const ColumnConst<T> *>(&*column.column);
|
||
if (!column_const)
|
||
throw Exception("Unexpected type of column for FixedString length: " + column.column->getName(), ErrorCodes::ILLEGAL_COLUMN);
|
||
T s = column_const->getData();
|
||
if (s <= 0)
|
||
throw Exception("FixedString length must be positive (unlike " + toString(s) + ")", ErrorCodes::ILLEGAL_COLUMN);
|
||
out_size = static_cast<size_t>(s);
|
||
return true;
|
||
}
|
||
|
||
size_t getSize(const ColumnWithTypeAndName & column)
|
||
{
|
||
size_t res;
|
||
if (getSizeTyped<UInt8>(column, res) ||
|
||
getSizeTyped<UInt16>(column, res) ||
|
||
getSizeTyped<UInt32>(column, res) ||
|
||
getSizeTyped<UInt64>(column, res) ||
|
||
getSizeTyped< Int8 >(column, res) ||
|
||
getSizeTyped< Int16>(column, res) ||
|
||
getSizeTyped< Int32>(column, res) ||
|
||
getSizeTyped< Int64>(column, res))
|
||
return res;
|
||
throw Exception("Length of FixedString must be integer; got " + column.type->getName(), ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT);
|
||
}
|
||
};
|
||
|
||
|
||
/// Монотонность.
|
||
|
||
struct PositiveMonotonicity
|
||
{
|
||
static bool has() { return true; }
|
||
static IFunction::Monotonicity get(const IDataType & type, const Field & left, const Field & right)
|
||
{
|
||
return { true };
|
||
}
|
||
};
|
||
|
||
template <typename T>
|
||
struct ToIntMonotonicity
|
||
{
|
||
static bool has() { return true; }
|
||
|
||
template <typename T2 = T>
|
||
static UInt64 divideByRangeOfType(typename std::enable_if_t<sizeof(T2) != sizeof(UInt64), UInt64> x) { return x >> (sizeof(T) * 8); };
|
||
|
||
template <typename T2 = T>
|
||
static UInt64 divideByRangeOfType(typename std::enable_if_t<sizeof(T2) == sizeof(UInt64), UInt64> x) { return 0; };
|
||
|
||
static IFunction::Monotonicity get(const IDataType & type, const Field & left, const Field & right)
|
||
{
|
||
size_t size_of_type = type.getSizeOfField();
|
||
|
||
/// Если тип расширяется, то функция монотонна.
|
||
if (sizeof(T) > size_of_type)
|
||
return { true };
|
||
|
||
/// Если тип совпадает - тоже.
|
||
if (typeid_cast<const typename DataTypeFromFieldType<T>::Type *>(&type))
|
||
return { true };
|
||
|
||
/// В других случаях, для неограниченного диапазона не знаем, будет ли функция монотонной.
|
||
if (left.isNull() || right.isNull())
|
||
return {};
|
||
|
||
/// Если преобразуем из float, то аргументы должны помещаться в тип результата.
|
||
if (typeid_cast<const DataTypeFloat32 *>(&type)
|
||
|| typeid_cast<const DataTypeFloat64 *>(&type))
|
||
{
|
||
Float64 left_float = left.get<Float64>();
|
||
Float64 right_float = right.get<Float64>();
|
||
|
||
if (left_float >= std::numeric_limits<T>::min() && left_float <= std::numeric_limits<T>::max()
|
||
&& right_float >= std::numeric_limits<T>::min() && right_float <= std::numeric_limits<T>::max())
|
||
return { true };
|
||
|
||
return {};
|
||
}
|
||
|
||
/// Если меняем знаковость типа или преобразуем из даты, даты-времени, то аргумент должен быть из одной половинки.
|
||
/// На всякий случай, в остальных случаях тоже будем этого требовать.
|
||
if ((left.get<Int64>() >= 0) != (right.get<Int64>() >= 0))
|
||
return {};
|
||
|
||
/// Если уменьшаем тип, то все биты кроме тех, которые в него помещаются, должны совпадать.
|
||
if (divideByRangeOfType(left.get<UInt64>()) != divideByRangeOfType(right.get<UInt64>()))
|
||
return {};
|
||
|
||
return { true };
|
||
}
|
||
};
|
||
|
||
/** Монотонность для функции toString определяем, в основном, для тестовых целей.
|
||
* Всерьёз вряд ли кто-нибудь рассчитывает на оптимизацию запросов с условиями toString(CounterID) = 34.
|
||
*/
|
||
struct ToStringMonotonicity
|
||
{
|
||
static bool has() { return true; }
|
||
|
||
static IFunction::Monotonicity get(const IDataType & type, const Field & left, const Field & right)
|
||
{
|
||
IFunction::Monotonicity positive = { .is_monotonic = true, .is_positive = true };
|
||
IFunction::Monotonicity not_monotonic;
|
||
|
||
/// Функция toString монотонна, если аргумент - Date или DateTime, или неотрицательные числа с одинаковым количеством знаков.
|
||
|
||
if (typeid_cast<const DataTypeDate *>(&type)
|
||
|| typeid_cast<const DataTypeDateTime *>(&type))
|
||
return positive;
|
||
|
||
if (left.isNull() || right.isNull())
|
||
return {};
|
||
|
||
if (left.getType() == Field::Types::UInt64
|
||
&& right.getType() == Field::Types::UInt64)
|
||
{
|
||
return (left.get<Int64>() == 0 && right.get<Int64>() == 0)
|
||
|| (floor(log10(left.get<UInt64>())) == floor(log10(right.get<UInt64>())))
|
||
? positive : not_monotonic;
|
||
}
|
||
|
||
if (left.getType() == Field::Types::Int64
|
||
&& right.getType() == Field::Types::Int64)
|
||
{
|
||
return (left.get<Int64>() == 0 && right.get<Int64>() == 0)
|
||
|| (left.get<Int64>() > 0 && right.get<Int64>() > 0 && floor(log10(left.get<Int64>())) == floor(log10(right.get<Int64>())))
|
||
? positive : not_monotonic;
|
||
}
|
||
|
||
return not_monotonic;
|
||
}
|
||
};
|
||
|
||
|
||
struct NameToUInt8 { static constexpr auto name = "toUInt8"; };
|
||
struct NameToUInt16 { static constexpr auto name = "toUInt16"; };
|
||
struct NameToUInt32 { static constexpr auto name = "toUInt32"; };
|
||
struct NameToUInt64 { static constexpr auto name = "toUInt64"; };
|
||
struct NameToInt8 { static constexpr auto name = "toInt8"; };
|
||
struct NameToInt16 { static constexpr auto name = "toInt16"; };
|
||
struct NameToInt32 { static constexpr auto name = "toInt32"; };
|
||
struct NameToInt64 { static constexpr auto name = "toInt64"; };
|
||
struct NameToFloat32 { static constexpr auto name = "toFloat32"; };
|
||
struct NameToFloat64 { static constexpr auto name = "toFloat64"; };
|
||
struct NameToDateTime { static constexpr auto name = "toDateTime"; };
|
||
struct NameToString { static constexpr auto name = "toString"; };
|
||
|
||
typedef FunctionConvert<DataTypeUInt8, NameToUInt8, ToIntMonotonicity<UInt8>> FunctionToUInt8;
|
||
typedef FunctionConvert<DataTypeUInt16, NameToUInt16, ToIntMonotonicity<UInt16>> FunctionToUInt16;
|
||
typedef FunctionConvert<DataTypeUInt32, NameToUInt32, ToIntMonotonicity<UInt32>> FunctionToUInt32;
|
||
typedef FunctionConvert<DataTypeUInt64, NameToUInt64, ToIntMonotonicity<UInt64>> FunctionToUInt64;
|
||
typedef FunctionConvert<DataTypeInt8, NameToInt8, ToIntMonotonicity<Int8>> FunctionToInt8;
|
||
typedef FunctionConvert<DataTypeInt16, NameToInt16, ToIntMonotonicity<Int16>> FunctionToInt16;
|
||
typedef FunctionConvert<DataTypeInt32, NameToInt32, ToIntMonotonicity<Int32>> FunctionToInt32;
|
||
typedef FunctionConvert<DataTypeInt64, NameToInt64, ToIntMonotonicity<Int64>> FunctionToInt64;
|
||
typedef FunctionConvert<DataTypeFloat32, NameToFloat32, PositiveMonotonicity> FunctionToFloat32;
|
||
typedef FunctionConvert<DataTypeFloat64, NameToFloat64, PositiveMonotonicity> FunctionToFloat64;
|
||
typedef FunctionConvert<DataTypeDate, NameToDate, ToIntMonotonicity<UInt16>> FunctionToDate;
|
||
typedef FunctionConvert<DataTypeDateTime, NameToDateTime, ToIntMonotonicity<UInt32>> FunctionToDateTime;
|
||
typedef FunctionConvert<DataTypeString, NameToString, ToStringMonotonicity> FunctionToString;
|
||
typedef FunctionConvert<DataTypeInt32, NameToUnixTimestamp, ToIntMonotonicity<UInt32>> FunctionToUnixTimestamp;
|
||
|
||
}
|