ClickHouse/dbms/include/DB/Functions/FunctionsComparison.h

#pragma once

#include <Poco/NumberFormatter.h>

#include <DB/DataTypes/DataTypesNumberFixed.h>
#include <DB/DataTypes/DataTypesNumberVariable.h>
#include <DB/DataTypes/DataTypeDateTime.h>
#include <DB/DataTypes/DataTypeDate.h>
#include <DB/DataTypes/DataTypeString.h>
#include <DB/DataTypes/DataTypeFixedString.h>
#include <DB/Functions/IFunction.h>


namespace DB
{

/** Функции сравнения: ==, !=, <, >, <=, >=.
  * Функции сравнения возвращают всегда 0 или 1 (UInt8).
  *
  * Сравнивать можно следующие типы:
  * - числа;
  * - строки и фиксированные строки;
  * - даты;
  * - даты-с-временем;
  *   внутри каждой группы, но не из разных групп.
  */

template<typename A, typename B>
struct EqualsNumImpl
{
	typedef UInt8 ResultType;

	static void vector_vector(const std::vector<A> & a, const std::vector<B> & b, std::vector<ResultType> & c)
	{
		size_t size = a.size();
		for (size_t i = 0; i < size; ++i)
			c[i] = a[i] == b[i];
	}

	static void vector_constant(const std::vector<A> & a, B b, std::vector<ResultType> & c)
	{
		size_t size = a.size();
		for (size_t i = 0; i < size; ++i)
			c[i] = a[i] == b;
	}

	static void constant_constant(A a, B b, ResultType & c)
	{
		c = a == b;
	}
};

template<typename A, typename B>
struct EqualsStringImpl
{
	typedef UInt8 ResultType;

	static void string_vector_string_vector(
		const std::vector<UInt8> & a_data, const std::vector<size_t> & a_offsets,
		const std::vector<UInt8> & b_data, const std::vector<size_t> & b_offsets,
		std::vector<ResultType> & c)
	{
		size_t size = a_data.size();
		for (size_t i = 0; i < size; ++i)
			c[i] = (i == 0)
				? (a_offsets[0] == b_offsets[0] && !memcmp(&a_data[0], &b_data[0], a_offsets[0]))
				: (a_offsets[i] - a_offsets[i - 1] == b_offsets[i] - b_offsets[i - 1]
					&& !memcmp(&a_data[a_offsets[i - 1]], &b_data[b_offsets[i - 1]], a_offsets[i] - a_offsets[i - 1]));
	}

	static void string_vector_fixed_string_vector(
		const std::vector<UInt8> & a_data, const std::vector<size_t> & a_offsets,
		const std::vector<UInt8> & b_data, size_t b_n,
		std::vector<ResultType> & c)
	{
		size_t size = a_data.size();
		for (size_t i = 0; i < size; ++i)
			c[i] = (i == 0)
				? (a_offsets[0] == b_n && !memcmp(&a_data[0], &b_data[0], b_n))
				: (a_offsets[i] - a_offsets[i - 1] == b_n
					&& !memcmp(&a_data[a_offsets[i - 1]], &b_data[b_n * i], b_n));
	}

	static void string_vector_constant(
		const std::vector<UInt8> & a_data, const std::vector<size_t> & a_offsets,
		const std::string & b,
		std::vector<ResultType> & c)
	{
		size_t size = a_data.size();
		size_t b_n = b.size();
		const UInt8 * b_data = reinterpret_cast<const UInt8 *>(b.data())
		for (size_t i = 0; i < size; ++i)
			c[i] = (i == 0)
				? (a_offsets[0] == b_n && !memcmp(&a_data[0], b_data, b_n))
				: (a_offsets[i] - a_offsets[i - 1] == b_n
					&& !memcmp(&a_data[a_offsets[i - 1]], b_data, b_n));
	}

	static void fixed_string_vector_fixed_string_vector(
		const std::vector<UInt8> & a_data, size_t a_n,
		const std::vector<UInt8> & b_data, size_t b_n,
		std::vector<ResultType> & c)
	{
		size_t size = a_data.size();
		for (size_t i = 0; i < size; i += n)
			c[i] = a_n == b_n && !memcmp(&a_data[i], &b_data[i], n);
	}

	static void fixed_string_vector_constant(
		const std::vector<UInt8> & a_data, size_t a_n,
		const std::string & b,
		std::vector<ResultType> & c)
	{
		size_t size = a_data.size();
		for (size_t i = 0; i < size; i += n)
			c[i] = !memcmp(&a_data[i], &b_data[i], n);
	}

	static void constant_constant(
		const std::string & a,
		const std::string & b,
		std::string & c)
	{
		c = a == b;
	}
};


template <template <typename, typename> class Impl, typename Name>
class FunctionComparison : public IFunction
{
private:
	template <typename T0, typename T1>
	bool checkRightType(const DataTypes & arguments, DataTypes & types_res) const
	{
		if (dynamic_cast<const T1 *>(&*arguments[1]))
		{
			types_res.push_back(new typename DataTypeFromFieldType<
				typename Impl<typename T0::FieldType, typename T1::FieldType>::ResultType>::Type);
			return true;
		}
		return false;
	}

	template <typename T0>
	bool checkLeftType(const DataTypes & arguments, DataTypes & types_res) const
	{
		if (dynamic_cast<const T0 *>(&*arguments[0]))
		{
			if (	checkRightType<T0, DataTypeUInt8>(arguments, types_res)
				||	checkRightType<T0, DataTypeUInt16>(arguments, types_res)
				||	checkRightType<T0, DataTypeUInt32>(arguments, types_res)
				||	checkRightType<T0, DataTypeUInt64>(arguments, types_res)
				||	checkRightType<T0, DataTypeInt8>(arguments, types_res)
				||	checkRightType<T0, DataTypeInt16>(arguments, types_res)
				||	checkRightType<T0, DataTypeInt32>(arguments, types_res)
				||	checkRightType<T0, DataTypeInt64>(arguments, types_res)
				||	checkRightType<T0, DataTypeFloat32>(arguments, types_res)
				||	checkRightType<T0, DataTypeFloat64>(arguments, types_res)
				||	checkRightType<T0, DataTypeVarUInt>(arguments, types_res)
				||	checkRightType<T0, DataTypeVarInt>(arguments, types_res))
				return true;
			else
				throw Exception("Illegal type " + arguments[1]->getName() + " of second argument of function " + getName(),
					ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT);
		}
		return false;
	}


	template <typename T0, typename T1>
	bool executeRightType(Block & block, const ColumnNumbers & arguments, const ColumnNumbers & result, const ColumnVector<T0> * col_left)
	{
		if (ColumnVector<T1> * col_right = dynamic_cast<ColumnVector<T1> *>(&*block.getByPosition(arguments[1]).column))
		{
			typedef typename Impl<T0, T1>::ResultType ResultType;

			ColumnVector<ResultType> * col_res = new ColumnVector<ResultType>;
			block.getByPosition(result[0]).column = col_res;

			typename ColumnVector<ResultType>::Container_t & vec_res = col_res->getData();
			vec_res.resize(col_left->getData().size());
			Impl<T0, T1>::vector_vector(col_left->getData(), col_right->getData(), vec_res);

			return true;
		}
		else if (ColumnConst<T1> * col_right = dynamic_cast<ColumnConst<T1> *>(&*block.getByPosition(arguments[1]).column))
		{
			typedef typename Impl<T0, T1>::ResultType ResultType;

			ColumnVector<ResultType> * col_res = new ColumnVector<ResultType>;
			block.getByPosition(result[0]).column = col_res;

			typename ColumnVector<ResultType>::Container_t & vec_res = col_res->getData();
			vec_res.resize(col_left->getData().size());
			Impl<T0, T1>::vector_constant(col_left->getData(), col_right->getData(), vec_res);

			return true;
		}

		return false;
	}

	template <typename T0, typename T1>
	bool executeConstRightType(Block & block, const ColumnNumbers & arguments, const ColumnNumbers & result, const ColumnConst<T0> * col_left)
	{
		if (ColumnVector<T1> * col_right = dynamic_cast<ColumnVector<T1> *>(&*block.getByPosition(arguments[1]).column))
		{
			typedef typename Impl<T0, T1>::ResultType ResultType;

			ColumnVector<ResultType> * col_res = new ColumnVector<ResultType>;
			block.getByPosition(result[0]).column = col_res;

			typename ColumnVector<ResultType>::Container_t & vec_res = col_res->getData();
			vec_res.resize(col_left->size());
			Impl<T0, T1>::constant_vector(col_left->getData(), col_right->getData(), vec_res);

			return true;
		}
		else if (ColumnConst<T1> * col_right = dynamic_cast<ColumnConst<T1> *>(&*block.getByPosition(arguments[1]).column))
		{
			typedef typename Impl<T0, T1>::ResultType ResultType;

			ResultType res = 0;
			Impl<T0, T1>::constant_constant(col_left->getData(), col_right->getData(), res);

			ColumnConst<ResultType> * col_res = new ColumnConst<ResultType>(col_left->size(), res);
			block.getByPosition(result[0]).column = col_res;

			return true;
		}

		return false;
	}

	template <typename T0>
	bool executeLeftType(Block & block, const ColumnNumbers & arguments, const ColumnNumbers & result)
	{
		if (ColumnVector<T0> * col_left = dynamic_cast<ColumnVector<T0> *>(&*block.getByPosition(arguments[0]).column))
		{
			if (	executeRightType<T0, UInt8>(block, arguments, result, col_left)
				||	executeRightType<T0, UInt16>(block, arguments, result, col_left)
				||	executeRightType<T0, UInt32>(block, arguments, result, col_left)
				||	executeRightType<T0, UInt64>(block, arguments, result, col_left)
				||	executeRightType<T0, Int8>(block, arguments, result, col_left)
				||	executeRightType<T0, Int16>(block, arguments, result, col_left)
				||	executeRightType<T0, Int32>(block, arguments, result, col_left)
				||	executeRightType<T0, Int64>(block, arguments, result, col_left)
				||	executeRightType<T0, Float32>(block, arguments, result, col_left)
				||	executeRightType<T0, Float64>(block, arguments, result, col_left))
				return true;
			else
				throw Exception("Illegal column of second argument of function " + getName(),
					ErrorCodes::ILLEGAL_COLUMN);
		}
		else if (ColumnConst<T0> * col_left = dynamic_cast<ColumnConst<T0> *>(&*block.getByPosition(arguments[0]).column))
		{
			if (	executeConstRightType<T0, UInt8>(block, arguments, result, col_left)
				||	executeConstRightType<T0, UInt16>(block, arguments, result, col_left)
				||	executeConstRightType<T0, UInt32>(block, arguments, result, col_left)
				||	executeConstRightType<T0, UInt64>(block, arguments, result, col_left)
				||	executeConstRightType<T0, Int8>(block, arguments, result, col_left)
				||	executeConstRightType<T0, Int16>(block, arguments, result, col_left)
				||	executeConstRightType<T0, Int32>(block, arguments, result, col_left)
				||	executeConstRightType<T0, Int64>(block, arguments, result, col_left)
				||	executeConstRightType<T0, Float32>(block, arguments, result, col_left)
				||	executeConstRightType<T0, Float64>(block, arguments, result, col_left))
				return true;
			else
				throw Exception("Illegal column of second argument of function " + getName(),
					ErrorCodes::ILLEGAL_COLUMN);
		}

		return false;
	}

public:
	/// Получить все имена функции.
	String getName() const
	{
		return Name::get();
	}

	/// Получить типы результата по типам аргументов. Если функция неприменима для данных аргументов - кинуть исключение.
	DataTypes getReturnTypes(const DataTypes & arguments) const
	{
		if (arguments.size() != 2)
			throw Exception("Number of arguments for function " + getName() + " doesn't match: passed "
				+ Poco::NumberFormatter::format(arguments.size()) + ", should be 2.",
				ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH);

		DataTypes types_res;

		if (!(	checkLeftType<DataTypeUInt8>(arguments, types_res)
			||	checkLeftType<DataTypeUInt16>(arguments, types_res)
			||	checkLeftType<DataTypeUInt32>(arguments, types_res)
			||	checkLeftType<DataTypeUInt64>(arguments, types_res)
			||	checkLeftType<DataTypeInt8>(arguments, types_res)
			||	checkLeftType<DataTypeInt16>(arguments, types_res)
			||	checkLeftType<DataTypeInt32>(arguments, types_res)
			||	checkLeftType<DataTypeInt64>(arguments, types_res)
			||	checkLeftType<DataTypeFloat32>(arguments, types_res)
			||	checkLeftType<DataTypeFloat64>(arguments, types_res)
			||	checkLeftType<DataTypeVarUInt>(arguments, types_res)
			||	checkLeftType<DataTypeVarInt>(arguments, types_res)))
			throw Exception("Illegal type " + arguments[0]->getName() + " of first argument of function " + getName(),
				ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT);

		return types_res;
	}

	/// Выполнить функцию над блоком.
	void execute(Block & block, const ColumnNumbers & arguments, const ColumnNumbers & result)
	{
		if (result.size() != 1)
			throw Exception("Wrong number of result columns in function " + getName() + ", should be 1.",
				ErrorCodes::ILLEGAL_NUMBER_OF_RESULT_COLUMNS);

		if (!(	executeLeftType<UInt8>(block, arguments, result)
			||	executeLeftType<UInt16>(block, arguments, result)
			||	executeLeftType<UInt32>(block, arguments, result)
			||	executeLeftType<UInt64>(block, arguments, result)
			||	executeLeftType<Int8>(block, arguments, result)
			||	executeLeftType<Int16>(block, arguments, result)
			||	executeLeftType<Int32>(block, arguments, result)
			||	executeLeftType<Int64>(block, arguments, result)
			||	executeLeftType<Float32>(block, arguments, result)
			||	executeLeftType<Float64>(block, arguments, result)))
		   throw Exception("Illegal column of first argument of function " + getName(),
				ErrorCodes::ILLEGAL_COLUMN);
	}
};


struct NamePlus 			{ static const char * get() { return "plus"; } };
struct NameMinus 			{ static const char * get() { return "minus"; } };
struct NameMultiply 		{ static const char * get() { return "multiply"; } };
struct NameDivideFloating	{ static const char * get() { return "divide"; } };
struct NameDivideIntegral 	{ static const char * get() { return "div"; } };
struct NameModulo 			{ static const char * get() { return "modulo"; } };

typedef FunctionBinaryArithmetic<PlusImpl, 				NamePlus> 			FunctionPlus;
typedef FunctionBinaryArithmetic<MinusImpl, 			NameMinus> 			FunctionMinus;
typedef FunctionBinaryArithmetic<MultiplyImpl, 			NameMultiply> 		FunctionMultiply;
typedef FunctionBinaryArithmetic<DivideFloatingImpl, 	NameDivideFloating> FunctionDivideFloating;
typedef FunctionBinaryArithmetic<DivideIntegralImpl, 	NameDivideIntegral> FunctionDivideIntegral;
typedef FunctionBinaryArithmetic<ModuloImpl, 			NameModulo> 		FunctionModulo;


}