ClickHouse/src/Functions/map.cpp

288 lines
9.3 KiB
C++
Raw Normal View History

2021-05-17 07:30:42 +00:00
#include <Functions/IFunction.h>
2020-11-02 06:46:32 +00:00
#include <Functions/FunctionFactory.h>
#include <Functions/FunctionHelpers.h>
2020-11-02 06:46:32 +00:00
#include <DataTypes/DataTypeMap.h>
#include <DataTypes/DataTypeTuple.h>
2020-12-03 03:52:41 +00:00
#include <DataTypes/DataTypesNumber.h>
2020-11-02 06:46:32 +00:00
#include <Columns/ColumnMap.h>
#include <Columns/ColumnArray.h>
#include <Columns/ColumnString.h>
#include <Columns/ColumnsNumber.h>
2020-11-02 06:46:32 +00:00
#include <DataTypes/getLeastSupertype.h>
#include <Interpreters/castColumn.h>
#include <memory>
#include <Common/assert_cast.h>
#include <Common/typeid_cast.h>
#include "array/arrayIndex.h"
2020-11-02 06:46:32 +00:00
namespace DB
{
namespace ErrorCodes
{
extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH;
extern const int ILLEGAL_TYPE_OF_ARGUMENT;
2020-11-02 06:46:32 +00:00
}
namespace
{
2020-11-02 09:23:02 +00:00
// map(x, y, ...) is a function that allows you to make key-value pair
2020-11-02 06:46:32 +00:00
class FunctionMap : public IFunction
{
public:
static constexpr auto name = "map";
2021-06-01 12:20:52 +00:00
static FunctionPtr create(ContextPtr)
2020-11-02 06:46:32 +00:00
{
return std::make_shared<FunctionMap>();
}
String getName() const override
{
return name;
}
bool isVariadic() const override
{
return true;
}
size_t getNumberOfArguments() const override
{
return 0;
}
bool isInjective(const ColumnsWithTypeAndName &) const override
{
return true;
}
2021-06-22 16:21:23 +00:00
bool isSuitableForShortCircuitArgumentsExecution(const DataTypesWithConstInfo & /*arguments*/) const override { return true; }
2020-11-02 06:46:32 +00:00
bool useDefaultImplementationForNulls() const override { return false; }
bool useDefaultImplementationForConstants() const override { return true; }
DataTypePtr getReturnTypeImpl(const DataTypes & arguments) const override
{
2020-12-15 14:34:37 +00:00
if (arguments.size() % 2 != 0)
throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH,
"Function {} requires even number of arguments, but {} given", getName(), arguments.size());
2020-11-02 06:46:32 +00:00
DataTypes keys, values;
for (size_t i = 0; i < arguments.size(); i += 2)
{
keys.emplace_back(arguments[i]);
values.emplace_back(arguments[i + 1]);
}
DataTypes tmp;
tmp.emplace_back(getLeastSupertype(keys));
tmp.emplace_back(getLeastSupertype(values));
return std::make_shared<DataTypeMap>(tmp);
}
ColumnPtr executeImpl(const ColumnsWithTypeAndName & arguments, const DataTypePtr & result_type, size_t input_rows_count) const override
2020-11-02 06:46:32 +00:00
{
size_t num_elements = arguments.size();
if (num_elements == 0)
return result_type->createColumnConstWithDefaultValue(input_rows_count);
2020-12-03 03:52:41 +00:00
const auto & result_type_map = static_cast<const DataTypeMap &>(*result_type);
const DataTypePtr & key_type = result_type_map.getKeyType();
const DataTypePtr & value_type = result_type_map.getValueType();
2020-11-02 06:46:32 +00:00
Columns columns_holder(num_elements);
ColumnRawPtrs column_ptrs(num_elements);
for (size_t i = 0; i < num_elements; ++i)
{
const auto & arg = arguments[i];
2020-12-03 03:52:41 +00:00
const auto to_type = i % 2 == 0 ? key_type : value_type;
2020-11-02 06:46:32 +00:00
2020-12-03 03:52:41 +00:00
ColumnPtr preprocessed_column = castColumn(arg, to_type);
2020-11-02 06:46:32 +00:00
preprocessed_column = preprocessed_column->convertToFullColumnIfConst();
columns_holder[i] = std::move(preprocessed_column);
column_ptrs[i] = columns_holder[i].get();
}
/// Create and fill the result map.
2020-12-03 03:52:41 +00:00
MutableColumnPtr keys_data = key_type->createColumn();
MutableColumnPtr values_data = value_type->createColumn();
MutableColumnPtr offsets = DataTypeNumber<IColumn::Offset>().createColumn();
2020-11-02 06:46:32 +00:00
2020-12-03 03:52:41 +00:00
size_t total_elements = input_rows_count * num_elements / 2;
keys_data->reserve(total_elements);
values_data->reserve(total_elements);
offsets->reserve(input_rows_count);
2020-11-02 06:46:32 +00:00
IColumn::Offset current_offset = 0;
for (size_t i = 0; i < input_rows_count; ++i)
{
for (size_t j = 0; j < num_elements; j += 2)
{
2020-12-03 03:52:41 +00:00
keys_data->insertFrom(*column_ptrs[j], i);
values_data->insertFrom(*column_ptrs[j + 1], i);
2020-11-02 06:46:32 +00:00
}
current_offset += num_elements / 2;
2020-12-03 03:52:41 +00:00
offsets->insert(current_offset);
2020-11-02 06:46:32 +00:00
}
2020-12-03 03:52:41 +00:00
auto nested_column = ColumnArray::create(
ColumnTuple::create(Columns{std::move(keys_data), std::move(values_data)}),
std::move(offsets));
2020-11-02 06:46:32 +00:00
2020-12-03 03:52:41 +00:00
return ColumnMap::create(nested_column);
2020-11-02 06:46:32 +00:00
}
};
2021-01-18 02:58:07 +00:00
/// Name tag for mapContains; used as a template argument of FunctionArrayIndex below.
struct NameMapContains
{
    static constexpr auto name = "mapContains";
};
class FunctionMapContains : public IFunction
{
public:
2021-01-18 02:58:07 +00:00
static constexpr auto name = NameMapContains::name;
2021-06-01 12:20:52 +00:00
static FunctionPtr create(ContextPtr) { return std::make_shared<FunctionMapContains>(); }
String getName() const override
{
2021-01-18 02:58:07 +00:00
return NameMapContains::name;
}
2021-09-22 16:08:08 +00:00
size_t getNumberOfArguments() const override { return impl.getNumberOfArguments(); }
2021-09-22 16:08:08 +00:00
bool isSuitableForShortCircuitArgumentsExecution(const DataTypesWithConstInfo & arguments) const override
{
return impl.isSuitableForShortCircuitArgumentsExecution(arguments);
}
DataTypePtr getReturnTypeImpl(const ColumnsWithTypeAndName & arguments) const override
{
2021-09-22 16:08:08 +00:00
return impl.getReturnTypeImpl(arguments);
}
ColumnPtr executeImpl(const ColumnsWithTypeAndName & arguments, const DataTypePtr & result_type, size_t input_rows_count) const override
{
2021-09-22 16:08:08 +00:00
return impl.executeImpl(arguments, result_type, input_rows_count);
}
2021-09-22 16:08:08 +00:00
private:
FunctionArrayIndex<HasAction, NameMapContains> impl;
};
2021-01-09 04:15:28 +00:00
class FunctionMapKeys : public IFunction
{
public:
static constexpr auto name = "mapKeys";
2021-06-01 12:20:52 +00:00
static FunctionPtr create(ContextPtr) { return std::make_shared<FunctionMapKeys>(); }
String getName() const override
{
2021-01-09 04:15:28 +00:00
return name;
}
size_t getNumberOfArguments() const override { return 1; }
2021-06-22 16:21:23 +00:00
bool isSuitableForShortCircuitArgumentsExecution(const DataTypesWithConstInfo & /*arguments*/) const override { return true; }
DataTypePtr getReturnTypeImpl(const ColumnsWithTypeAndName & arguments) const override
{
if (arguments.size() != 1)
throw Exception("Number of arguments for function " + getName() + " doesn't match: passed "
+ toString(arguments.size()) + ", should be 1",
ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH);
const DataTypeMap * map_type = checkAndGetDataType<DataTypeMap>(arguments[0].type.get());
if (!map_type)
2021-01-21 17:47:57 +00:00
throw Exception{"First argument for function " + getName() + " must be a map",
ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT};
auto key_type = map_type->getKeyType();
return std::make_shared<DataTypeArray>(key_type);
}
bool useDefaultImplementationForConstants() const override { return true; }
ColumnPtr executeImpl(const ColumnsWithTypeAndName & arguments, const DataTypePtr & /*result_type*/, size_t /*input_rows_count*/) const override
{
const ColumnMap * col_map = typeid_cast<const ColumnMap *>(arguments[0].column.get());
if (!col_map)
return nullptr;
const auto & nested_column = col_map->getNestedColumn();
const auto & keys_data = col_map->getNestedData().getColumn(0);
return ColumnArray::create(keys_data.getPtr(), nested_column.getOffsetsPtr());
}
};
2021-01-09 04:15:28 +00:00
class FunctionMapValues : public IFunction
{
public:
static constexpr auto name = "mapValues";
2021-06-01 12:20:52 +00:00
static FunctionPtr create(ContextPtr) { return std::make_shared<FunctionMapValues>(); }
String getName() const override
{
2021-01-09 04:15:28 +00:00
return name;
}
size_t getNumberOfArguments() const override { return 1; }
2021-06-22 16:21:23 +00:00
bool isSuitableForShortCircuitArgumentsExecution(const DataTypesWithConstInfo & /*arguments*/) const override { return true; }
DataTypePtr getReturnTypeImpl(const ColumnsWithTypeAndName & arguments) const override
{
if (arguments.size() != 1)
throw Exception("Number of arguments for function " + getName() + " doesn't match: passed "
+ toString(arguments.size()) + ", should be 1",
ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH);
const DataTypeMap * map_type = checkAndGetDataType<DataTypeMap>(arguments[0].type.get());
if (!map_type)
2021-01-21 17:47:57 +00:00
throw Exception{"First argument for function " + getName() + " must be a map",
ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT};
auto value_type = map_type->getValueType();
return std::make_shared<DataTypeArray>(value_type);
}
bool useDefaultImplementationForConstants() const override { return true; }
ColumnPtr executeImpl(const ColumnsWithTypeAndName & arguments, const DataTypePtr & /*result_type*/, size_t /*input_rows_count*/) const override
{
const ColumnMap * col_map = typeid_cast<const ColumnMap *>(arguments[0].column.get());
if (!col_map)
return nullptr;
const auto & nested_column = col_map->getNestedColumn();
const auto & values_data = col_map->getNestedData().getColumn(1);
return ColumnArray::create(values_data.getPtr(), nested_column.getOffsetsPtr());
}
};
2020-11-02 06:46:32 +00:00
}
/// Registers the Map functions defined in this file (map, mapContains, mapKeys, mapValues)
/// in the given factory.
void registerFunctionsMap(FunctionFactory & factory)
{
    /// Constructor.
    factory.registerFunction<FunctionMap>();

    /// Lookup and accessors.
    factory.registerFunction<FunctionMapContains>();
    factory.registerFunction<FunctionMapKeys>();
    factory.registerFunction<FunctionMapValues>();
}
}