mirror of
https://github.com/ClickHouse/ClickHouse.git
synced 2024-10-19 06:50:50 +00:00
8b3afeb60d
commit f968e7e7f0d84c89fd26dea1d541bd9f6041d7c8 Author: Alexey Milovidov <milovidov@yandex-team.ru> Date: Tue Feb 16 06:11:29 2016 +0300 Addition [#METR-2944]. commit 7524981fa7c4f22929dd5009444a0ae28500f620 Author: Alexey Milovidov <milovidov@yandex-team.ru> Date: Tue Feb 16 06:08:43 2016 +0300 Fixed error (incomplete) [#METR-2944]. commit 2f1e7bf9f46cd9ce958ade9041c00ce067940fd2 Author: Alexey Milovidov <milovidov@yandex-team.ru> Date: Tue Feb 16 05:37:43 2016 +0300 Improving performance of row formats [#METR-2944]. commit 9848910f235863c9571ef1ebe0d87d4929ee283c Author: Alexey Milovidov <milovidov@yandex-team.ru> Date: Tue Feb 16 00:37:12 2016 +0300 Improving performance of text formats [#METR-2944]. commit 3aedc7fd784af962e64ffdd10ec23ac53827d8e2 Author: Alexey Milovidov <milovidov@yandex-team.ru> Date: Tue Feb 16 00:18:00 2016 +0300 Improving performance of row formats [#METR-2944]. commit cb5932c2b0385604477e69c8262dc31a4bb4b23b Author: Alexey Milovidov <milovidov@yandex-team.ru> Date: Mon Feb 15 00:53:27 2016 +0300 Fixed error. commit 42863fd4eddeef594e846c598b92877b6ff86fa6 Author: Alexey Milovidov <milovidov@yandex-team.ru> Date: Sun Feb 14 23:13:46 2016 +0300 Improving performance of row formats [#METR-2944]. commit 71c6fb19a85a79297433ceb486fdb97e551d964f Author: Alexey Milovidov <milovidov@yandex-team.ru> Date: Sun Feb 14 16:58:56 2016 +0300 Improving performance of row formats [#METR-2944].
240 lines
7.0 KiB
C++
240 lines
7.0 KiB
C++
#include <DB/IO/WriteBufferFromString.h>
|
|
#include <DB/DataTypes/DataTypeEnum.h>
|
|
|
|
|
|
namespace DB
|
|
{
|
|
|
|
namespace ErrorCodes
|
|
{
|
|
extern const int SYNTAX_ERROR;
|
|
extern const int EMPTY_DATA_PASSED;
|
|
}
|
|
|
|
|
|
template <typename FieldType> struct EnumName;
|
|
template <> struct EnumName<Int8> { static constexpr auto value = "Enum8"; };
|
|
template <> struct EnumName<Int16> { static constexpr auto value = "Enum16"; };
|
|
|
|
|
|
template <typename Type>
|
|
std::string DataTypeEnum<Type>::generateName(const Values & values)
|
|
{
|
|
std::string name;
|
|
|
|
{
|
|
WriteBufferFromString out{name};
|
|
|
|
writeString(EnumName<FieldType>::value, out);
|
|
writeChar('(', out);
|
|
|
|
auto first = true;
|
|
for (const auto & name_and_value : values)
|
|
{
|
|
if (!first)
|
|
writeString(", ", out);
|
|
|
|
first = false;
|
|
|
|
writeQuotedString(name_and_value.first, out);
|
|
writeString(" = ", out);
|
|
writeText(name_and_value.second, out);
|
|
}
|
|
|
|
writeChar(')', out);
|
|
}
|
|
|
|
return name;
|
|
}
|
|
|
|
template <typename Type>
|
|
void DataTypeEnum<Type>::fillMaps()
|
|
{
|
|
for (const auto & name_and_value : values )
|
|
{
|
|
const auto name_to_value_pair = name_to_value_map.insert(
|
|
{ StringRef{name_and_value.first}, name_and_value.second });
|
|
if (!name_to_value_pair.second)
|
|
throw Exception{
|
|
"Duplicate names in enum: '" + name_and_value.first + "' = " + toString(name_and_value.second)
|
|
+ " and '" + name_to_value_pair.first->first.toString() + "' = " + toString(
|
|
name_to_value_pair.first->second),
|
|
ErrorCodes::SYNTAX_ERROR
|
|
};
|
|
|
|
const auto value_to_name_pair = value_to_name_map.insert(
|
|
{ name_and_value.second, StringRef{name_and_value.first} });
|
|
if (!value_to_name_pair.second)
|
|
throw Exception{
|
|
"Duplicate values in enum: '" + name_and_value.first + "' = " + toString(name_and_value.second)
|
|
+ " and '" + value_to_name_pair.first->second.toString() + "' = " + toString(
|
|
value_to_name_pair.first->first),
|
|
ErrorCodes::SYNTAX_ERROR
|
|
};
|
|
}
|
|
}
|
|
|
|
template <typename Type>
|
|
DataTypeEnum<Type>::DataTypeEnum(const Values & values_) : values{values_}
|
|
{
|
|
if (values.empty())
|
|
throw Exception{
|
|
"DataTypeEnum enumeration cannot be empty",
|
|
ErrorCodes::EMPTY_DATA_PASSED
|
|
};
|
|
|
|
fillMaps();
|
|
|
|
std::sort(std::begin(values), std::end(values), [] (auto & left, auto & right) {
|
|
return left.second < right.second;
|
|
});
|
|
|
|
name = generateName(values);
|
|
}
|
|
|
|
template <typename Type>
|
|
DataTypeEnum<Type>::DataTypeEnum(const DataTypeEnum & other) : values{other.values}, name{other.name}
|
|
{
|
|
fillMaps();
|
|
}
|
|
|
|
template <typename Type>
|
|
DataTypePtr DataTypeEnum<Type>::clone() const
|
|
{
|
|
return new DataTypeEnum(*this);
|
|
}
|
|
|
|
|
|
template <typename Type>
|
|
void DataTypeEnum<Type>::serializeBinary(const Field & field, WriteBuffer & ostr) const
|
|
{
|
|
const FieldType x = get<typename NearestFieldType<FieldType>::Type>(field);
|
|
writeBinary(x, ostr);
|
|
}
|
|
|
|
template <typename Type>
|
|
void DataTypeEnum<Type>::deserializeBinary(Field & field, ReadBuffer & istr) const
|
|
{
|
|
FieldType x;
|
|
readBinary(x, istr);
|
|
field = nearestFieldType(x);
|
|
}
|
|
|
|
template <typename Type>
|
|
void DataTypeEnum<Type>::serializeBinary(const IColumn & column, size_t row_num, WriteBuffer & ostr) const
|
|
{
|
|
writeBinary(static_cast<const ColumnType &>(column).getData()[row_num], ostr);
|
|
}
|
|
|
|
template <typename Type>
|
|
void DataTypeEnum<Type>::deserializeBinary(IColumn & column, ReadBuffer & istr) const
|
|
{
|
|
typename ColumnType::value_type x;
|
|
readBinary(x, istr);
|
|
static_cast<ColumnType &>(column).getData().push_back(x);
|
|
}
|
|
|
|
template <typename Type>
|
|
void DataTypeEnum<Type>::serializeText(const IColumn & column, size_t row_num, WriteBuffer & ostr) const
|
|
{
|
|
writeString(getNameForValue(static_cast<const ColumnType &>(column).getData()[row_num]), ostr);
|
|
}
|
|
|
|
template <typename Type>
|
|
void DataTypeEnum<Type>::serializeTextEscaped(const IColumn & column, size_t row_num, WriteBuffer & ostr) const
|
|
{
|
|
writeEscapedString(getNameForValue(static_cast<const ColumnType &>(column).getData()[row_num]), ostr);
|
|
}
|
|
|
|
template <typename Type>
|
|
void DataTypeEnum<Type>::deserializeTextEscaped(IColumn & column, ReadBuffer & istr) const
|
|
{
|
|
/// NOTE Неплохо было бы сделать без создания временного объекта - хотя бы вынести std::string наружу.
|
|
std::string name;
|
|
readEscapedString(name, istr);
|
|
static_cast<ColumnType &>(column).getData().push_back(getValue(StringRef(name)));
|
|
}
|
|
|
|
template <typename Type>
|
|
void DataTypeEnum<Type>::serializeTextQuoted(const IColumn & column, size_t row_num, WriteBuffer & ostr) const
|
|
{
|
|
writeQuotedString(getNameForValue(static_cast<const ColumnType &>(column).getData()[row_num]), ostr);
|
|
}
|
|
|
|
template <typename Type>
|
|
void DataTypeEnum<Type>::deserializeTextQuoted(IColumn & column, ReadBuffer & istr) const
|
|
{
|
|
std::string name;
|
|
readQuotedString(name, istr);
|
|
static_cast<ColumnType &>(column).getData().push_back(getValue(StringRef(name)));
|
|
}
|
|
|
|
template <typename Type>
|
|
void DataTypeEnum<Type>::serializeTextJSON(const IColumn & column, size_t row_num, WriteBuffer & ostr) const
|
|
{
|
|
writeJSONString(getNameForValue(static_cast<const ColumnType &>(column).getData()[row_num]), ostr);
|
|
}
|
|
|
|
template <typename Type>
|
|
void DataTypeEnum<Type>::serializeTextXML(const IColumn & column, size_t row_num, WriteBuffer & ostr) const
|
|
{
|
|
writeXMLString(getNameForValue(static_cast<const ColumnType &>(column).getData()[row_num]), ostr);
|
|
}
|
|
|
|
template <typename Type>
|
|
void DataTypeEnum<Type>::serializeTextCSV(const IColumn & column, size_t row_num, WriteBuffer & ostr) const
|
|
{
|
|
writeCSVString(getNameForValue(static_cast<const ColumnType &>(column).getData()[row_num]), ostr);
|
|
}
|
|
|
|
template <typename Type>
|
|
void DataTypeEnum<Type>::deserializeTextCSV(IColumn & column, ReadBuffer & istr, const char delimiter) const
|
|
{
|
|
std::string name;
|
|
readCSVString(name, istr, delimiter);
|
|
static_cast<ColumnType &>(column).getData().push_back(getValue(StringRef(name)));
|
|
}
|
|
|
|
template <typename Type>
|
|
void DataTypeEnum<Type>::serializeBinary(
|
|
const IColumn & column, WriteBuffer & ostr, const size_t offset, size_t limit) const
|
|
{
|
|
const auto & x = typeid_cast<const ColumnType &>(column).getData();
|
|
const auto size = x.size();
|
|
|
|
if (limit == 0 || offset + limit > size)
|
|
limit = size - offset;
|
|
|
|
ostr.write(reinterpret_cast<const char *>(&x[offset]), sizeof(FieldType) * limit);
|
|
}
|
|
|
|
template <typename Type>
|
|
void DataTypeEnum<Type>::deserializeBinary(
|
|
IColumn & column, ReadBuffer & istr, const size_t limit, const double avg_value_size_hint) const
|
|
{
|
|
auto & x = typeid_cast<ColumnType &>(column).getData();
|
|
const auto initial_size = x.size();
|
|
x.resize(initial_size + limit);
|
|
const auto size = istr.readBig(reinterpret_cast<char*>(&x[initial_size]), sizeof(FieldType) * limit);
|
|
x.resize(initial_size + size / sizeof(FieldType));
|
|
}
|
|
|
|
template <typename Type>
|
|
ColumnPtr DataTypeEnum<Type>::createConstColumn(const size_t size, const Field & field) const
|
|
{
|
|
return new ConstColumnType(size, get<typename NearestFieldType<FieldType>::Type>(field));
|
|
}
|
|
|
|
template <typename Type>
|
|
Field DataTypeEnum<Type>::getDefault() const
|
|
{
|
|
return typename NearestFieldType<FieldType>::Type(values.front().second);
|
|
}
|
|
|
|
|
|
/// Явные инстанцирования.
|
|
template class DataTypeEnum<Int8>;
|
|
template class DataTypeEnum<Int16>;
|
|
|
|
}
|