2021-04-23 23:56:26 +00:00
|
|
|
#pragma once
|
|
|
|
|
|
|
|
#include <Core/Block.h>
|
|
|
|
#include <Core/NamesAndTypes.h>
|
2021-05-26 02:41:38 +00:00
|
|
|
#include <Common/FieldVisitors.h>
|
2021-07-23 16:30:18 +00:00
|
|
|
#include <Storages/ColumnsDescription.h>
|
2021-12-01 02:58:24 +00:00
|
|
|
#include <DataTypes/DataTypeTuple.h>
|
|
|
|
#include <DataTypes/Serializations/JSONDataParser.h>
|
2022-02-09 20:47:53 +00:00
|
|
|
#include <DataTypes/DataTypesNumber.h>
|
|
|
|
#include <Columns/ColumnObject.h>
|
2021-04-23 23:56:26 +00:00
|
|
|
|
|
|
|
namespace DB
|
|
|
|
{
|
|
|
|
|
2021-05-06 05:33:06 +00:00
|
|
|
/// Overload for data types: returns a dimension count for `type`.
/// NOTE(review): presumably the Array nesting depth, 0 for non-array types — confirm against the definition.
size_t getNumberOfDimensions(const IDataType & type);
|
|
|
|
/// Overload for columns: returns a dimension count for `column`.
/// NOTE(review): presumably the Array nesting depth, 0 for non-array columns — confirm against the definition.
size_t getNumberOfDimensions(const IColumn & column);
|
2021-06-10 13:57:31 +00:00
|
|
|
/// Returns a data type derived from `type`.
/// NOTE(review): by its name, presumably the scalar element type left after stripping every Array level — confirm.
DataTypePtr getBaseTypeOfArray(const DataTypePtr & type);
|
2022-01-27 00:24:34 +00:00
|
|
|
/// Returns a data type built from `type` (taken by value) and `num_dimensions`.
/// NOTE(review): presumably `type` wrapped into `num_dimensions` levels of Array — confirm.
DataTypePtr createArrayOfType(DataTypePtr type, size_t num_dimensions);
|
2022-01-21 14:55:26 +00:00
|
|
|
/// Returns an `Array` field value for the requested `num_dimensions`.
/// NOTE(review): presumably a nested Array that contains no scalar elements — confirm.
Array createEmptyArrayField(size_t num_dimensions);
|
2021-05-06 05:33:06 +00:00
|
|
|
|
2021-12-23 12:28:40 +00:00
|
|
|
/// Column counterpart of getBaseTypeOfArray: returns a column derived from `column`.
/// NOTE(review): presumably the innermost (scalar) column of a possibly multi-dimensional Array column — confirm.
ColumnPtr getBaseColumnOfArray(const ColumnPtr & column);
|
|
|
|
/// Column counterpart of createArrayOfType: returns a column built from `column` and `num_dimensions`.
/// NOTE(review): presumably an Array column with `num_dimensions` levels over `column` — confirm how offsets are filled.
ColumnPtr createArrayOfColumn(const ColumnPtr & column, size_t num_dimensions);
|
|
|
|
|
2021-04-23 23:56:26 +00:00
|
|
|
/// Returns a data type for the given `column`.
/// NOTE(review): which column kinds are supported, and what happens for unsupported ones, is not visible here — check the definition.
DataTypePtr getDataTypeByColumn(const IColumn & column);
|
2021-05-29 01:19:20 +00:00
|
|
|
/// May modify both `columns_list` and `block` (non-const references); `extended_storage_columns` is read-only.
/// NOTE(review): by its name, presumably replaces Object types/columns with Tuple ones and validates them
/// against `extended_storage_columns` — confirm.
void convertObjectsToTuples(NamesAndTypesList & columns_list, Block & block, const NamesAndTypesList & extended_storage_columns);
|
2022-02-01 11:14:27 +00:00
|
|
|
/// Validates `paths`; returns nothing, so a failure is presumably reported by throwing — confirm.
/// NOTE(review): "ambiguous" presumably means one path being a prefix of another — confirm against the definition.
void checkObjectHasNoAmbiguosPaths(const PathsInData & paths);
|
2021-09-13 12:40:39 +00:00
|
|
|
/// Returns a single data type computed from `types`.
/// `check_ambiguos_paths` defaults to false.
/// NOTE(review): presumably it enables the checkObjectHasNoAmbiguosPaths validation on the result — confirm.
/// Used by getObjectColumns in this header to merge the types seen for one Object column.
DataTypePtr getLeastCommonTypeForObject(const DataTypes & types, bool check_ambiguos_paths = false);
|
2021-07-23 16:30:18 +00:00
|
|
|
/// May modify `columns_list` in place; `object_columns` is read-only.
/// NOTE(review): presumably rewrites Object types in `columns_list` to the concrete types from `object_columns`
/// and, when `with_subcolumns` is true, also adds their subcolumns — confirm.
void extendObjectColumns(NamesAndTypesList & columns_list, const ColumnsDescription & object_columns, bool with_subcolumns);
|
|
|
|
|
2022-02-09 20:47:53 +00:00
|
|
|
/// Returns a set of column names taken from `columns_list`.
/// NOTE(review): presumably the names of the columns whose type is Object — confirm.
NameSet getNamesOfObjectColumns(const NamesAndTypesList & columns_list);
|
|
|
|
/// Predicate over `columns`.
/// NOTE(review): presumably true when at least one column has an Object type — confirm.
bool hasObjectColumns(const ColumnsDescription & columns);
|
|
|
|
|
|
|
|
/// May modify `object_columns` in place; `new_columns` is read-only.
/// NOTE(review): presumably merges the types from `new_columns` into the matching entries of `object_columns` — confirm.
void updateObjectColumns(ColumnsDescription & object_columns, const NamesAndTypesList & new_columns);
|
|
|
|
|
2021-12-01 02:58:24 +00:00
|
|
|
/// Shared-ownership pointer to a (non-const) DataTypeTuple.
using DataTypeTuplePtr = std::shared_ptr<DataTypeTuple>;
|
|
|
|
|
2022-02-01 11:14:27 +00:00
|
|
|
/// Type overload: returns a pair of paths and data types computed from `type`.
/// NOTE(review): presumably one (path, type) per leaf of a nested Tuple, in matching order — confirm.
std::pair<PathsInData, DataTypes> flattenTuple(const DataTypePtr & type);
|
2022-01-27 00:24:34 +00:00
|
|
|
/// Column overload: returns a column computed from `column`.
/// NOTE(review): presumably a plain Tuple column holding the leaf columns of a nested Tuple column — confirm.
ColumnPtr flattenTuple(const ColumnPtr & column);
|
2021-12-01 02:58:24 +00:00
|
|
|
|
|
|
|
/// Type-only overload: builds one data type from `paths` and `tuple_types`.
/// NOTE(review): presumably the inverse of flattenTuple, with `paths[i]` describing where `tuple_types[i]`
/// goes in the nested Tuple; the two are presumably required to have equal size — confirm.
DataTypePtr unflattenTuple(
|
2022-02-01 11:14:27 +00:00
|
|
|
const PathsInData & paths,
|
2021-12-01 02:58:24 +00:00
|
|
|
const DataTypes & tuple_types);
|
|
|
|
|
2022-01-27 00:24:34 +00:00
|
|
|
/// Overload that also takes columns: returns a (column, type) pair built from `paths`, `tuple_types`
/// and `tuple_columns`.
/// NOTE(review): presumably the inverse of flattenTuple for both the type and the data, with the three
/// inputs index-aligned — confirm.
std::pair<ColumnPtr, DataTypePtr> unflattenTuple(
|
2022-02-01 11:14:27 +00:00
|
|
|
const PathsInData & paths,
|
2021-12-01 02:58:24 +00:00
|
|
|
const DataTypes & tuple_types,
|
|
|
|
const Columns & tuple_columns);
|
|
|
|
|
2021-07-23 16:30:18 +00:00
|
|
|
/// Takes two read-only column descriptions and a query AST pointer (by value); returns nothing, so any
/// effect is presumably applied to the AST that `query` points to.
/// NOTE(review): by its name, presumably substitutes constants for subcolumns that are present in
/// `expected_columns` but absent from `available_columns` — confirm what constant is used and how
/// the query is rewritten.
void replaceMissedSubcolumnsByConstants(
|
|
|
|
const ColumnsDescription & expected_columns,
|
|
|
|
const ColumnsDescription & available_columns,
|
|
|
|
ASTPtr query);
|
2021-07-09 03:15:41 +00:00
|
|
|
|
2021-06-12 15:10:25 +00:00
|
|
|
/// May modify the given `columns` in place.
/// NOTE(review): presumably finalizes every Object column among them and leaves other columns untouched — confirm.
void finalizeObjectColumns(MutableColumns & columns);
|
2021-04-23 23:56:26 +00:00
|
|
|
|
2022-02-09 20:47:53 +00:00
|
|
|
template <typename Iterator, typename EntryColumnsGetter>
|
|
|
|
ColumnsDescription getObjectColumns(
|
|
|
|
Iterator begin, Iterator end,
|
|
|
|
const ColumnsDescription & storage_columns,
|
|
|
|
EntryColumnsGetter && entry_columns_getter)
|
|
|
|
{
|
|
|
|
ColumnsDescription res;
|
|
|
|
|
|
|
|
if (begin == end)
|
|
|
|
{
|
|
|
|
for (const auto & column : storage_columns)
|
|
|
|
{
|
|
|
|
if (isObject(column.type))
|
|
|
|
{
|
|
|
|
auto tuple_type = std::make_shared<DataTypeTuple>(
|
|
|
|
DataTypes{std::make_shared<DataTypeUInt8>()},
|
|
|
|
Names{ColumnObject::COLUMN_NAME_DUMMY});
|
|
|
|
|
|
|
|
res.add({column.name, std::move(tuple_type)});
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return res;
|
|
|
|
}
|
|
|
|
|
|
|
|
std::unordered_map<String, DataTypes> types_in_entries;
|
|
|
|
|
|
|
|
for (auto it = begin; it != end; ++it)
|
|
|
|
{
|
|
|
|
const auto & entry_columns = entry_columns_getter(*it);
|
|
|
|
for (const auto & column : entry_columns)
|
|
|
|
{
|
|
|
|
auto storage_column = storage_columns.tryGetPhysical(column.name);
|
|
|
|
if (storage_column && isObject(storage_column->type))
|
|
|
|
types_in_entries[column.name].push_back(column.type);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
for (const auto & [name, types] : types_in_entries)
|
|
|
|
res.add({String(name), getLeastCommonTypeForObject(types)});
|
|
|
|
|
|
|
|
return res;
|
|
|
|
}
|
|
|
|
|
2021-04-23 23:56:26 +00:00
|
|
|
}
|