// Source file: ClickHouse/dbms/src/Storages/ColumnsDescription.cpp
// (repository listing metadata: 286 lines, 7.9 KiB, C++)

#include <Storages/ColumnsDescription.h>
#include <Parsers/ASTLiteral.h>
#include <Parsers/ExpressionElementParsers.h>
#include <Parsers/ExpressionListParsers.h>
#include <Parsers/parseQuery.h>
#include <Parsers/queryToString.h>
#include <IO/WriteBuffer.h>
#include <IO/WriteHelpers.h>
#include <IO/ReadBuffer.h>
#include <IO/ReadHelpers.h>
#include <IO/WriteBufferFromString.h>
#include <IO/ReadBufferFromString.h>
#include <DataTypes/DataTypeFactory.h>
#include <Common/Exception.h>
#include <Interpreters/Context.h>
#include <Storages/IStorage.h>
#include <Common/typeid_cast.h>
#include <ext/collection_cast.h>
#include <ext/map.h>
#include <boost/range/join.hpp>
#include <Compression/CompressionFactory.h>
#include <optional>
namespace DB
{
/// Error codes declared for use in this file. They are `extern`, so the definitions
/// live in another translation unit.
namespace ErrorCodes
{
/// Thrown by ColumnsDescription::getPhysical() when the requested column is not found.
extern const int NO_SUCH_COLUMN_IN_TABLE;
/// Declared here; not referenced in the visible part of this file.
extern const int CANNOT_PARSE_TEXT;
}
/// Returns a single list holding the ordinary columns followed by the materialized ones.
/// Alias columns are not included.
NamesAndTypesList ColumnsDescription::getAllPhysical() const
{
    const auto physical_columns = boost::join(ordinary, materialized);
    return ext::collection_cast<NamesAndTypesList>(physical_columns);
}
/// Returns a single list holding every column: ordinary first, then materialized, then aliases.
NamesAndTypesList ColumnsDescription::getAll() const
{
    const auto materialized_and_aliases = boost::join(materialized, aliases);
    const auto every_column = boost::join(ordinary, materialized_and_aliases);
    return ext::collection_cast<NamesAndTypesList>(every_column);
}
/// Returns the names of the ordinary columns followed by the names of the materialized ones.
Names ColumnsDescription::getNamesOfPhysical() const
{
    const auto name_of = [] (const auto & column) { return column.name; };
    return ext::map<Names>(boost::join(ordinary, materialized), name_of);
}
/// Looks up a column by name among the ordinary columns first and the materialized columns second,
/// and returns a copy of the first match.
/// Throws Exception with code NO_SUCH_COLUMN_IN_TABLE when neither list contains the name.
NameAndTypePair ColumnsDescription::getPhysical(const String & column_name) const
{
    for (const NamesAndTypesList * columns : {&ordinary, &materialized})
    {
        for (const auto & column : *columns)
        {
            if (column.name == column_name)
                return column;
        }
    }

    throw Exception("There is no column " + column_name + " in table.", ErrorCodes::NO_SUCH_COLUMN_IN_TABLE);
}
bool ColumnsDescription::hasPhysical(const String & column_name) const
{
for (auto & it : boost::join(ordinary, materialized))
if (it.name == column_name)
return true;
return false;
}
/// Serializes the description to text.
///
/// Layout: the line "columns format version: 1", then "<N> columns:" where N is the total number of
/// ordinary, materialized and alias columns, then one line per column (ordinary first, then
/// materialized, then aliases):
///
///     `name` type[\t<kind>\t<default expression>][\t<comment literal>][\tCODEC(<codec description>)]
///
/// When a column has a comment but no default, a single extra tab is written in place of the
/// default fields. No such placeholder is written for the codec.
String ColumnsDescription::toString() const
{
    WriteBufferFromOwnString out;

    writeCString("columns format version: 1\n", out);
    writeText(ordinary.size() + materialized.size() + aliases.size(), out);
    writeCString(" columns:\n", out);

    /// Writes one complete line for a single column.
    const auto write_column = [this, &out] (const NamesAndTypesList::value_type & column)
    {
        writeBackQuotedString(column.name, out);
        writeChar(' ', out);
        writeText(column.type->getName(), out);

        const auto default_pos = defaults.find(column.name);
        const auto comment_pos = comments.find(column.name);
        const bool has_comment = comment_pos != comments.end();

        if (default_pos == defaults.end())
        {
            /// Placeholder for the absent default so that the comment stays in its own field.
            if (has_comment)
                writeChar('\t', out);
        }
        else
        {
            const auto & column_default = default_pos->second;
            writeChar('\t', out);
            writeText(DB::toString(column_default.kind), out);
            writeChar('\t', out);
            writeText(queryToString(column_default.expression), out);
        }

        if (has_comment)
        {
            /// The comment is written as a quoted SQL string literal.
            writeChar('\t', out);
            writeText(queryToString(ASTLiteral(Field(comment_pos->second))), out);
        }

        const auto codec_pos = codecs.find(column.name);
        if (codec_pos != codecs.end())
        {
            writeChar('\t', out);
            writeText("CODEC(", out);
            writeText(codec_pos->second->getCodecDesc(), out);
            writeText(")", out);
        }

        writeChar('\n', out);
    };

    for (const NamesAndTypesList * columns : {&ordinary, &materialized, &aliases})
    {
        for (const auto & column : *columns)
            write_column(column);
    }

    return out.str();
}
/// Returns true when the unread input starts with "\tCODEC(", i.e. the next tab-separated
/// field of the current line is the codec declaration. Nothing is consumed.
///
/// ColumnsDescription::toString() writes the codec field right after whichever field precedes it,
/// without placeholders for a missing default or comment. The readers of those optional fields
/// therefore have to recognise the codec by its prefix and leave it for parseCodec().
static bool nextFieldIsCodec(ReadBufferFromString & buf)
{
    static constexpr char codec_prefix[] = "\tCODEC(";
    constexpr size_t prefix_size = sizeof(codec_prefix) - 1;

    const char * const pos = buf.position();
    const size_t remaining = static_cast<size_t>(buf.buffer().end() - pos);
    if (remaining < prefix_size)
        return false;

    for (size_t i = 0; i < prefix_size; ++i)
    {
        if (pos[i] != codec_prefix[i])
            return false;
    }
    return true;
}

/// Reads the optional "<kind>\t<expression>" default fields of a column line.
///
/// Returns an empty optional, consuming nothing, when the line ends here or when the next field
/// is the codec. Returns an empty optional after consuming one tab when the default field is an
/// empty placeholder (written when a comment follows a column that has no default).
/// Otherwise consumes both fields and returns the parsed default.
std::optional<ColumnDefault> parseDefaultInfo(ReadBufferFromString & buf)
{
    if (*buf.position() == '\n' || nextFieldIsCodec(buf))
        return {};

    assertChar('\t', buf);

    /// Empty placeholder: the tab that is still unread introduces the comment field.
    if (*buf.position() == '\t')
        return {};

    String default_kind_str;
    readText(default_kind_str, buf);
    const auto default_kind = columnDefaultKindFromString(default_kind_str);

    assertChar('\t', buf);

    String default_expr_str;
    readText(default_expr_str, buf);
    ParserExpression expr_parser;
    ASTPtr default_expr = parseQuery(expr_parser, default_expr_str, "default_expression", 0);

    return ColumnDefault{default_kind, std::move(default_expr)};
}

/// Reads the optional comment field (a quoted string literal) of a column line.
/// Returns an empty string, consuming nothing, when the line ends here or when the next field
/// is the codec.
String parseComment(ReadBufferFromString& buf)
{
    if (*buf.position() == '\n' || nextFieldIsCodec(buf))
        return {};

    assertChar('\t', buf);

    String comment_expr_str;
    readText(comment_expr_str, buf);
    ParserStringLiteral string_literal_parser;
    ASTPtr comment_expr = parseQuery(string_literal_parser, comment_expr_str, "comment expression", 0);

    return typeid_cast<ASTLiteral &>(*comment_expr).value.get<String>();
}

/// Reads the optional codec field of a column line.
/// Returns a null pointer when the line ends here or when parsing yields no AST.
CompressionCodecPtr parseCodec(ReadBufferFromString& buf)
{
    if (*buf.position() == '\n')
        return {};

    assertChar('\t', buf);

    String codec_expr_str;
    readText(codec_expr_str, buf);
    ParserCodec codec_parser;
    ASTPtr codec_expr = parseQuery(codec_parser, codec_expr_str, "codec expression", 0);

    if (codec_expr)
        return CompressionCodecFactory::instance().get(codec_expr);
    else
        return nullptr;
}

/// Parses one column line (including its terminating '\n') and records the column in `result`.
///
/// The column goes into `ordinary`, `materialized` or `aliases` according to the kind of its
/// default. A column without a default is always registered as ordinary, including when it is
/// followed by a comment and/or codec (previously such a column was dropped and only its
/// comment/codec were stored). A non-empty comment and a non-null codec are stored under the
/// column name.
void parseColumn(ReadBufferFromString & buf, ColumnsDescription & result, const DataTypeFactory & data_type_factory)
{
    String column_name;
    readBackQuotedStringWithSQLStyle(column_name, buf);
    assertChar(' ', buf);

    String type_name;
    readText(type_name, buf);
    auto type = data_type_factory.get(type_name);

    /// Each optional-field reader returns "absent" without consuming anything when the line
    /// has already ended, so a bare "`name` type" line needs no special case.
    auto column_default = parseDefaultInfo(buf);
    if (column_default)
    {
        switch (column_default->kind)
        {
            case ColumnDefaultKind::Default:
                result.ordinary.emplace_back(column_name, std::move(type));
                break;
            case ColumnDefaultKind::Materialized:
                result.materialized.emplace_back(column_name, std::move(type));
                break;
            case ColumnDefaultKind::Alias:
                result.aliases.emplace_back(column_name, std::move(type));
                break;
        }

        result.defaults.emplace(column_name, std::move(*column_default));
    }
    else
    {
        result.ordinary.emplace_back(column_name, std::move(type));
    }

    auto comment = parseComment(buf);
    if (!comment.empty())
        result.comments.emplace(column_name, std::move(comment));

    auto codec = parseCodec(buf);
    if (codec)
        result.codecs.emplace(column_name, std::move(codec));

    assertChar('\n', buf);
}
/// Returns the codec registered for `column_name`, or `default_codec` when the column has none.
CompressionCodecPtr ColumnsDescription::getCodecOrDefault(const String & column_name, CompressionCodecPtr default_codec) const
{
    if (const auto found = codecs.find(column_name); found != codecs.end())
        return found->second;

    return default_codec;
}
/// Returns the codec registered for `column_name`, falling back to the default codec
/// provided by CompressionCodecFactory when the column has none.
CompressionCodecPtr ColumnsDescription::getCodecOrDefault(const String & column_name) const
{
    auto fallback_codec = CompressionCodecFactory::instance().getDefaultCodec();
    return getCodecOrDefault(column_name, std::move(fallback_codec));
}
/// Builds a ColumnsDescription from its text form.
///
/// Expected input: the line "columns format version: 1", then "<N> columns:", then exactly N
/// column lines (each handled by parseColumn), and nothing after them.
/// The assert* helpers and parseColumn are relied on to report malformed input.
ColumnsDescription ColumnsDescription::parse(const String & str)
{
    ReadBufferFromString buf{str};

    assertString("columns format version: 1\n", buf);
    size_t count{};
    readText(count, buf);
    assertString(" columns:\n", buf);

    const DataTypeFactory & data_type_factory = DataTypeFactory::instance();

    ColumnsDescription result;
    for (size_t i = 0; i < count; ++i)
        parseColumn(buf, result, data_type_factory);

    /// Anything left after the declared number of columns is an error.
    assertEOF(buf);
    return result;
}
/// Returns a pointer to the columns description of table `db`.`table`, or nullptr when the
/// `insert_sample_with_metadata` setting is off or the table does not exist in `context`.
///
/// NOTE(review): the returned pointer refers to an object reached through `storage`, and the local
/// StoragePtr is released when this function returns. Presumably the caller relies on the
/// table staying alive for as long as the pointer is used - confirm against callers.
const ColumnsDescription * ColumnsDescription::loadFromContext(const Context & context, const String & db, const String & table)
{
    if (!context.getSettingsRef().insert_sample_with_metadata)
        return nullptr;

    if (!context.isTableExist(db, table))
        return nullptr;

    StoragePtr storage = context.getTable(db, table);
    return &storage->getColumns();
}
}