ClickHouse/src/Functions/in.cpp

154 lines
6.4 KiB
C++
Raw Normal View History

#include <Functions/IFunctionImpl.h>
#include <Functions/FunctionFactory.h>
#include <Functions/FunctionHelpers.h>
#include <DataTypes/DataTypeTuple.h>
#include <DataTypes/DataTypesNumber.h>
#include <Columns/ColumnConst.h>
2020-05-14 18:21:35 +00:00
#include <Columns/ColumnsNumber.h>
#include <Columns/ColumnTuple.h>
#include <Columns/ColumnSet.h>
#include <Interpreters/Set.h>
namespace DB
{
namespace ErrorCodes
{
extern const int ILLEGAL_COLUMN;
}
2020-09-07 18:00:37 +00:00
namespace
{
/** in(x, set) - function for evaluating the IN
* notIn(x, set) - and NOT IN.
*/
2020-05-14 14:21:38 +00:00
template <bool negative, bool global, bool null_is_skipped, bool ignore_set>
struct FunctionInName;
2020-05-14 14:21:38 +00:00
template <> struct FunctionInName<false, false, true, false> { static constexpr auto name = "in"; };
template <> struct FunctionInName<false, true, true, false> { static constexpr auto name = "globalIn"; };
template <> struct FunctionInName<true, false, true, false> { static constexpr auto name = "notIn"; };
template <> struct FunctionInName<true, true, true, false> { static constexpr auto name = "globalNotIn"; };
template <> struct FunctionInName<false, false, false, false> { static constexpr auto name = "nullIn"; };
template <> struct FunctionInName<false, true, false, false> { static constexpr auto name = "globalNullIn"; };
template <> struct FunctionInName<true, false, false, false> { static constexpr auto name = "notNullIn"; };
template <> struct FunctionInName<true, true, false, false> { static constexpr auto name = "globalNotNullIn"; };
template <> struct FunctionInName<false, false, true, true> { static constexpr auto name = "inIgnoreSet"; };
template <> struct FunctionInName<false, true, true, true> { static constexpr auto name = "globalInIgnoreSet"; };
template <> struct FunctionInName<true, false, true, true> { static constexpr auto name = "notInIgnoreSet"; };
template <> struct FunctionInName<true, true, true, true> { static constexpr auto name = "globalNotInIgnoreSet"; };
template <> struct FunctionInName<false, false, false, true> { static constexpr auto name = "nullInIgnoreSet"; };
template <> struct FunctionInName<false, true, false, true> { static constexpr auto name = "globalNullInIgnoreSet"; };
template <> struct FunctionInName<true, false, false, true> { static constexpr auto name = "notNullInIgnoreSet"; };
template <> struct FunctionInName<true, true, false, true> { static constexpr auto name = "globalNotNullInIgnoreSet"; };
template <bool negative, bool global, bool null_is_skipped, bool ignore_set>
class FunctionIn : public IFunction
{
public:
2020-05-14 14:21:38 +00:00
/// ignore_set flag means that we don't use set from the second argument, just return zero column.
/// It is needed to perform type analysis without creation of set.
static constexpr auto name = FunctionInName<negative, global, null_is_skipped, ignore_set>::name;
static FunctionPtr create(const Context &)
{
return std::make_shared<FunctionIn>();
}
String getName() const override
{
return name;
}
size_t getNumberOfArguments() const override
{
return 2;
}
DataTypePtr getReturnTypeImpl(const DataTypes & /*arguments*/) const override
{
return std::make_shared<DataTypeUInt8>();
}
2020-05-15 09:06:21 +00:00
bool useDefaultImplementationForConstants() const override
{
/// Never return constant for -IgnoreSet functions to avoid constant folding.
return !ignore_set;
}
2019-10-27 18:12:40 +00:00
2020-04-06 13:30:16 +00:00
bool useDefaultImplementationForNulls() const override { return null_is_skipped; }
void executeImpl(ColumnsWithTypeAndName & block, const ColumnNumbers & arguments, size_t result, [[maybe_unused]] size_t input_rows_count) const override
{
2020-05-14 14:21:38 +00:00
if constexpr (ignore_set)
{
2020-10-10 18:24:57 +00:00
block[result].column = ColumnUInt8::create(input_rows_count, 0u);
2020-05-14 14:21:38 +00:00
return;
}
2019-08-12 13:07:35 +00:00
/// Second argument must be ColumnSet.
2020-10-10 18:24:57 +00:00
ColumnPtr column_set_ptr = block[arguments[1]].column;
2019-10-27 18:12:40 +00:00
const ColumnSet * column_set = checkAndGetColumnConstData<const ColumnSet>(column_set_ptr.get());
if (!column_set)
column_set = checkAndGetColumn<const ColumnSet>(column_set_ptr.get());
if (!column_set)
throw Exception("Second argument for function '" + getName() + "' must be Set; found " + column_set_ptr->getName(),
ErrorCodes::ILLEGAL_COLUMN);
DB::Block block_of_key_columns;
2019-04-30 17:26:56 +00:00
/// First argument may be a tuple or a single column.
2020-10-10 18:24:57 +00:00
const ColumnWithTypeAndName & left_arg = block[arguments[0]];
const ColumnTuple * tuple = typeid_cast<const ColumnTuple *>(left_arg.column.get());
const ColumnConst * const_tuple = checkAndGetColumnConst<ColumnTuple>(left_arg.column.get());
const DataTypeTuple * type_tuple = typeid_cast<const DataTypeTuple *>(left_arg.type.get());
ColumnPtr materialized_tuple;
if (const_tuple)
{
materialized_tuple = const_tuple->convertToFullColumn();
tuple = typeid_cast<const ColumnTuple *>(materialized_tuple.get());
}
auto set = column_set->getData();
auto set_types = set->getDataTypes();
if (tuple && (set_types.size() != 1 || !set_types[0]->equals(*type_tuple)))
{
const auto & tuple_columns = tuple->getColumns();
const DataTypes & tuple_types = type_tuple->getElements();
size_t tuple_size = tuple_columns.size();
for (size_t i = 0; i < tuple_size; ++i)
block_of_key_columns.insert({ tuple_columns[i], tuple_types[i], "" });
}
else
block_of_key_columns.insert(left_arg);
2020-10-10 18:24:57 +00:00
block[result].column = set->execute(block_of_key_columns, negative);
}
};
2020-05-14 14:21:38 +00:00
template<bool ignore_set>
2020-09-07 18:00:37 +00:00
void registerFunctionsInImpl(FunctionFactory & factory)
2020-05-14 14:21:38 +00:00
{
factory.registerFunction<FunctionIn<false, false, true, ignore_set>>();
factory.registerFunction<FunctionIn<false, true, true, ignore_set>>();
factory.registerFunction<FunctionIn<true, false, true, ignore_set>>();
factory.registerFunction<FunctionIn<true, true, true, ignore_set>>();
factory.registerFunction<FunctionIn<false, false, false, ignore_set>>();
factory.registerFunction<FunctionIn<false, true, false, ignore_set>>();
factory.registerFunction<FunctionIn<true, false, false, ignore_set>>();
factory.registerFunction<FunctionIn<true, true, false, ignore_set>>();
}
2020-09-07 18:00:37 +00:00
}
void registerFunctionsIn(FunctionFactory & factory)
{
2020-05-14 14:21:38 +00:00
registerFunctionsInImpl<false>(factory);
registerFunctionsInImpl<true>(factory);
}
}