2017-04-01 09:19:00 +00:00
|
|
|
#include <Columns/ColumnTuple.h>
|
2017-06-06 17:18:32 +00:00
|
|
|
#include <ext/map.h>
|
|
|
|
#include <ext/range.h>
|
2017-07-06 13:54:55 +00:00
|
|
|
#include <DataStreams/ColumnGathererStream.h>
|
2017-03-12 12:56:59 +00:00
|
|
|
|
|
|
|
|
|
|
|
namespace DB
|
|
|
|
{
|
|
|
|
|
|
|
|
/// Error codes used by the exceptions thrown in this file.
/// They are only declared here (extern); their definitions are not in this file.
namespace ErrorCodes
{
    extern const int CANNOT_INSERT_VALUE_OF_DIFFERENT_SIZE_INTO_TUPLE;
    extern const int NOT_IMPLEMENTED;
}
|
|
|
|
|
|
|
|
|
2017-12-07 05:53:23 +00:00
|
|
|
std::string ColumnTuple::getName() const
|
|
|
|
{
|
|
|
|
std::stringstream res;
|
|
|
|
res << "Tuple(";
|
|
|
|
bool is_first = true;
|
|
|
|
for (const auto & column : columns)
|
|
|
|
{
|
|
|
|
if (!is_first)
|
|
|
|
res << ", ";
|
|
|
|
is_first = false;
|
|
|
|
res << column->getName();
|
|
|
|
}
|
|
|
|
res << ")";
|
|
|
|
return res.str();
|
|
|
|
}
|
|
|
|
|
2017-03-12 12:56:59 +00:00
|
|
|
/// Stores the given block in `data` and fills `columns` with the column of every
/// block position, in the same order.
ColumnTuple::ColumnTuple(Block data_) : data(data_)
{
    const size_t num_elements = data.columns();
    columns.resize(num_elements);

    for (size_t pos = 0; pos != num_elements; ++pos)
        columns[pos] = data.getByPosition(pos).column;
}
|
|
|
|
|
2017-03-12 13:16:48 +00:00
|
|
|
/// Returns a new ColumnTuple constructed from `data.cloneEmpty()`.
ColumnPtr ColumnTuple::cloneEmpty() const
{
    auto empty_tuple = std::make_shared<ColumnTuple>(data.cloneEmpty());
    return empty_tuple;
}
|
|
|
|
|
2017-03-12 12:56:59 +00:00
|
|
|
/// Returns row `n` as a Tuple whose elements are the values at row `n`
/// of each nested column, in column order.
Field ColumnTuple::operator[](size_t n) const
{
    /// Extracts the value at row `n` from a single nested column.
    auto value_at_row = [n] (const auto & element) { return (*element)[n]; };

    return Tuple{ext::map<TupleBackend>(columns, value_at_row)};
}
|
|
|
|
|
|
|
|
void ColumnTuple::get(size_t n, Field & res) const
|
|
|
|
{
|
2017-04-01 07:20:54 +00:00
|
|
|
const size_t size = columns.size();
|
|
|
|
res = Tuple(TupleBackend(size));
|
|
|
|
TupleBackend & res_arr = DB::get<Tuple &>(res).t;
|
|
|
|
for (const auto i : ext::range(0, size))
|
|
|
|
columns[i]->get(n, res_arr[i]);
|
2017-03-12 12:56:59 +00:00
|
|
|
}
|
|
|
|
|
2017-12-01 21:13:25 +00:00
|
|
|
/// Not supported for tuples: always throws an Exception with code NOT_IMPLEMENTED.
StringRef ColumnTuple::getDataAt(size_t) const
{
    const std::string message = "Method getDataAt is not supported for " + getName();
    throw Exception(message, ErrorCodes::NOT_IMPLEMENTED);
}
|
|
|
|
|
2017-12-01 21:13:25 +00:00
|
|
|
void ColumnTuple::insertData(const char *, size_t)
|
2017-03-12 12:56:59 +00:00
|
|
|
{
|
2017-04-01 07:20:54 +00:00
|
|
|
throw Exception("Method insertData is not supported for " + getName(), ErrorCodes::NOT_IMPLEMENTED);
|
2017-03-12 12:56:59 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
void ColumnTuple::insert(const Field & x)
|
|
|
|
{
|
2017-04-01 07:20:54 +00:00
|
|
|
const TupleBackend & tuple = DB::get<const Tuple &>(x).t;
|
2017-03-12 12:56:59 +00:00
|
|
|
|
2017-04-01 07:20:54 +00:00
|
|
|
const size_t size = columns.size();
|
|
|
|
if (tuple.size() != size)
|
|
|
|
throw Exception("Cannot insert value of different size into tuple", ErrorCodes::CANNOT_INSERT_VALUE_OF_DIFFERENT_SIZE_INTO_TUPLE);
|
2017-03-12 12:56:59 +00:00
|
|
|
|
2017-04-01 07:20:54 +00:00
|
|
|
for (size_t i = 0; i < size; ++i)
|
|
|
|
columns[i]->insert(tuple[i]);
|
2017-03-12 12:56:59 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
void ColumnTuple::insertFrom(const IColumn & src_, size_t n)
|
|
|
|
{
|
2017-04-01 07:20:54 +00:00
|
|
|
const ColumnTuple & src = static_cast<const ColumnTuple &>(src_);
|
2017-03-12 12:56:59 +00:00
|
|
|
|
2017-04-01 07:20:54 +00:00
|
|
|
size_t size = columns.size();
|
|
|
|
if (src.columns.size() != size)
|
|
|
|
throw Exception("Cannot insert value of different size into tuple", ErrorCodes::CANNOT_INSERT_VALUE_OF_DIFFERENT_SIZE_INTO_TUPLE);
|
2017-03-12 12:56:59 +00:00
|
|
|
|
2017-04-01 07:20:54 +00:00
|
|
|
for (size_t i = 0; i < size; ++i)
|
|
|
|
columns[i]->insertFrom(*src.columns[i], n);
|
2017-03-12 12:56:59 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
void ColumnTuple::insertDefault()
|
|
|
|
{
|
2017-04-01 07:20:54 +00:00
|
|
|
for (auto & column : columns)
|
|
|
|
column->insertDefault();
|
2017-03-12 12:56:59 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
void ColumnTuple::popBack(size_t n)
|
|
|
|
{
|
2017-04-01 07:20:54 +00:00
|
|
|
for (auto & column : columns)
|
|
|
|
column->popBack(n);
|
2017-03-12 12:56:59 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
/// Serializes row `n` of every nested column into `arena`, in column order.
/// `begin` is passed by reference to each nested call, so it may be updated by them.
/// Returns a StringRef built from the final value of `begin` and the sum of the sizes
/// reported by the nested calls.
StringRef ColumnTuple::serializeValueIntoArena(size_t n, Arena & arena, char const *& begin) const
{
    size_t total_size = 0;

    for (size_t pos = 0, num_elements = columns.size(); pos < num_elements; ++pos)
    {
        const auto part = columns[pos]->serializeValueIntoArena(n, arena, begin);
        total_size += part.size;
    }

    return StringRef(begin, total_size);
}
|
|
|
|
|
|
|
|
const char * ColumnTuple::deserializeAndInsertFromArena(const char * pos)
|
|
|
|
{
|
2017-04-01 07:20:54 +00:00
|
|
|
for (auto & column : columns)
|
|
|
|
pos = column->deserializeAndInsertFromArena(pos);
|
2017-03-12 12:56:59 +00:00
|
|
|
|
2017-04-01 07:20:54 +00:00
|
|
|
return pos;
|
2017-03-12 12:56:59 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
void ColumnTuple::updateHashWithValue(size_t n, SipHash & hash) const
|
|
|
|
{
|
2017-04-01 07:20:54 +00:00
|
|
|
for (auto & column : columns)
|
|
|
|
column->updateHashWithValue(n, hash);
|
2017-03-12 12:56:59 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
void ColumnTuple::insertRangeFrom(const IColumn & src, size_t start, size_t length)
|
|
|
|
{
|
2017-04-01 07:20:54 +00:00
|
|
|
for (size_t i = 0; i < columns.size(); ++i)
|
|
|
|
data.getByPosition(i).column->insertRangeFrom(
|
|
|
|
*static_cast<const ColumnTuple &>(src).data.getByPosition(i).column.get(),
|
|
|
|
start, length);
|
2017-03-12 12:56:59 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
/// Applies `filt` (with the given size hint) to every nested column and returns
/// a new ColumnTuple holding the filtered columns.
ColumnPtr ColumnTuple::filter(const Filter & filt, ssize_t result_size_hint) const
{
    Block filtered = data.cloneEmpty();

    const size_t num_elements = columns.size();
    for (size_t pos = 0; pos != num_elements; ++pos)
    {
        const auto & source = data.getByPosition(pos).column;
        filtered.getByPosition(pos).column = source->filter(filt, result_size_hint);
    }

    return std::make_shared<ColumnTuple>(filtered);
}
|
|
|
|
|
|
|
|
/// Applies the permutation `perm` (with the given `limit`) to every nested column
/// and returns a new ColumnTuple holding the permuted columns.
ColumnPtr ColumnTuple::permute(const Permutation & perm, size_t limit) const
{
    Block permuted = data.cloneEmpty();

    const size_t num_elements = columns.size();
    for (size_t pos = 0; pos != num_elements; ++pos)
    {
        const auto & source = data.getByPosition(pos).column;
        permuted.getByPosition(pos).column = source->permute(perm, limit);
    }

    return std::make_shared<ColumnTuple>(permuted);
}
|
|
|
|
|
|
|
|
/// Calls replicate(offsets) on every nested column and returns a new ColumnTuple
/// holding the replicated columns.
ColumnPtr ColumnTuple::replicate(const Offsets_t & offsets) const
{
    Block replicated = data.cloneEmpty();

    const size_t num_elements = columns.size();
    for (size_t pos = 0; pos != num_elements; ++pos)
    {
        const auto & source = data.getByPosition(pos).column;
        replicated.getByPosition(pos).column = source->replicate(offsets);
    }

    return std::make_shared<ColumnTuple>(replicated);
}
|
|
|
|
|
|
|
|
/// Scatters every nested column with the same `num_columns` and `selector`, then
/// regroups the pieces: result column k is a ColumnTuple made of piece k of every
/// nested column.
Columns ColumnTuple::scatter(ColumnIndex num_columns, const Selector & selector) const
{
    const size_t num_elements = columns.size();

    /// pieces[e][k] is piece k of tuple element e.
    std::vector<Columns> pieces(num_elements);
    for (size_t elem = 0; elem < num_elements; ++elem)
    {
        const auto & source = data.getByPosition(elem).column;
        pieces[elem] = source->scatter(num_columns, selector);
    }

    Columns result(num_columns);
    for (size_t part = 0; part < num_columns; ++part)
    {
        Block part_block = data.cloneEmpty();

        for (size_t elem = 0; elem < num_elements; ++elem)
            part_block.getByPosition(elem).column = pieces[elem][part];

        result[part] = std::make_shared<ColumnTuple>(part_block);
    }

    return result;
}
|
|
|
|
|
|
|
|
int ColumnTuple::compareAt(size_t n, size_t m, const IColumn & rhs, int nan_direction_hint) const
|
|
|
|
{
|
2017-04-01 07:20:54 +00:00
|
|
|
size_t size = columns.size();
|
|
|
|
for (size_t i = 0; i < size; ++i)
|
|
|
|
if (int res = columns[i]->compareAt(n, m, *static_cast<const ColumnTuple &>(rhs).columns[i], nan_direction_hint))
|
|
|
|
return res;
|
2017-03-12 12:56:59 +00:00
|
|
|
|
2017-04-01 07:20:54 +00:00
|
|
|
return 0;
|
2017-03-12 12:56:59 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
template <bool positive>
|
|
|
|
struct ColumnTuple::Less
|
|
|
|
{
|
2017-04-01 07:20:54 +00:00
|
|
|
ConstColumnPlainPtrs plain_columns;
|
|
|
|
int nan_direction_hint;
|
|
|
|
|
|
|
|
Less(const Columns & columns, int nan_direction_hint_)
|
|
|
|
: nan_direction_hint(nan_direction_hint_)
|
|
|
|
{
|
|
|
|
for (const auto & column : columns)
|
|
|
|
plain_columns.push_back(column.get());
|
|
|
|
}
|
|
|
|
|
|
|
|
bool operator() (size_t a, size_t b) const
|
|
|
|
{
|
|
|
|
for (ConstColumnPlainPtrs::const_iterator it = plain_columns.begin(); it != plain_columns.end(); ++it)
|
|
|
|
{
|
|
|
|
int res = (*it)->compareAt(a, b, **it, nan_direction_hint);
|
|
|
|
if (res < 0)
|
|
|
|
return positive;
|
|
|
|
else if (res > 0)
|
|
|
|
return !positive;
|
|
|
|
}
|
|
|
|
return false;
|
|
|
|
}
|
2017-03-12 12:56:59 +00:00
|
|
|
};
|
|
|
|
|
|
|
|
void ColumnTuple::getPermutation(bool reverse, size_t limit, int nan_direction_hint, Permutation & res) const
|
|
|
|
{
|
2017-04-01 07:20:54 +00:00
|
|
|
size_t rows = size();
|
|
|
|
res.resize(rows);
|
|
|
|
for (size_t i = 0; i < rows; ++i)
|
|
|
|
res[i] = i;
|
|
|
|
|
|
|
|
if (limit >= rows)
|
|
|
|
limit = 0;
|
|
|
|
|
|
|
|
if (limit)
|
|
|
|
{
|
|
|
|
if (reverse)
|
|
|
|
std::partial_sort(res.begin(), res.begin() + limit, res.end(), Less<false>(columns, nan_direction_hint));
|
|
|
|
else
|
|
|
|
std::partial_sort(res.begin(), res.begin() + limit, res.end(), Less<true>(columns, nan_direction_hint));
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
if (reverse)
|
|
|
|
std::sort(res.begin(), res.end(), Less<false>(columns, nan_direction_hint));
|
|
|
|
else
|
|
|
|
std::sort(res.begin(), res.end(), Less<true>(columns, nan_direction_hint));
|
|
|
|
}
|
2017-03-12 12:56:59 +00:00
|
|
|
}
|
|
|
|
|
2017-07-06 13:54:55 +00:00
|
|
|
/// Hands this column over to the gatherer by calling `gatherer.gather` on it.
void ColumnTuple::gather(ColumnGathererStream & gatherer)
{
    ColumnTuple & self = *this;
    gatherer.gather(self);
}
|
|
|
|
|
2017-03-12 12:56:59 +00:00
|
|
|
void ColumnTuple::reserve(size_t n)
|
|
|
|
{
|
2017-04-01 07:20:54 +00:00
|
|
|
for (auto & column : columns)
|
|
|
|
column->reserve(n);
|
2017-03-12 12:56:59 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
size_t ColumnTuple::byteSize() const
|
|
|
|
{
|
2017-04-01 07:20:54 +00:00
|
|
|
size_t res = 0;
|
|
|
|
for (const auto & column : columns)
|
|
|
|
res += column->byteSize();
|
|
|
|
return res;
|
2017-03-12 12:56:59 +00:00
|
|
|
}
|
|
|
|
|
2017-07-13 16:49:09 +00:00
|
|
|
size_t ColumnTuple::allocatedBytes() const
|
2017-03-12 12:56:59 +00:00
|
|
|
{
|
2017-04-01 07:20:54 +00:00
|
|
|
size_t res = 0;
|
|
|
|
for (const auto & column : columns)
|
2017-07-13 16:49:09 +00:00
|
|
|
res += column->allocatedBytes();
|
2017-04-01 07:20:54 +00:00
|
|
|
return res;
|
2017-03-12 12:56:59 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
/// Returns a new ColumnTuple built from a copy of `data` in which every nested column
/// whose convertToFullColumnIfConst() returned a non-null pointer is replaced by that result.
/// Columns for which the call returned null are kept as they are.
ColumnPtr ColumnTuple::convertToFullColumnIfConst() const
{
    Block materialized = data;

    const size_t num_elements = materialized.columns();
    for (size_t pos = 0; pos < num_elements; ++pos)
    {
        auto & element = materialized.getByPosition(pos).column;

        auto converted = element->convertToFullColumnIfConst();
        if (converted)
            element = converted;
    }

    return std::make_shared<ColumnTuple>(materialized);
}
|
|
|
|
|
|
|
|
/// Resets `min` and `max` to Tuples with one slot per nested column, then lets every
/// nested column write its own extremes into the corresponding slots.
void ColumnTuple::getExtremes(Field & min, Field & max) const
{
    const size_t num_elements = columns.size();

    min = Tuple(TupleBackend(num_elements));
    max = Tuple(TupleBackend(num_elements));

    TupleBackend & min_values = min.get<Tuple &>().t;
    TupleBackend & max_values = max.get<Tuple &>().t;

    for (size_t pos = 0; pos < num_elements; ++pos)
        columns[pos]->getExtremes(min_values[pos], max_values[pos]);
}
|
|
|
|
|
|
|
|
|
|
|
|
}
|