ClickHouse/dbms/include/DB/Core/NamesAndTypes.h

145 lines
3.6 KiB
C
Raw Normal View History

2011-10-31 17:55:06 +00:00
#pragma once
2010-03-18 19:32:14 +00:00
#include <map>
#include <list>
2010-03-18 19:32:14 +00:00
#include <string>
2014-07-09 13:39:19 +00:00
#include <set>
2010-03-18 19:32:14 +00:00
#include <Poco/SharedPtr.h>
#include <DB/DataTypes/IDataType.h>
2014-07-09 13:39:19 +00:00
#include <DB/DataTypes/DataTypeFactory.h>
2014-07-10 10:16:50 +00:00
#include <DB/IO/ReadBufferFromString.h>
#include "Names.h"
2010-03-18 19:32:14 +00:00
namespace DB
{
/// Make Poco::SharedPtr usable inside namespace DB without the Poco:: qualifier.
using Poco::SharedPtr;
/// A column description: a name together with its data type.
struct NameAndTypePair
{
    String name;
    DataTypePtr type;

    /// Default-constructs both members.
    /// NOTE: the comparison operators below dereference `type`, so it is expected
    /// to be assigned before an object created this way is compared.
    NameAndTypePair() {}

    NameAndTypePair(const String & name_, const DataTypePtr & type_) : name(name_), type(type_) {}

    /** Strict weak ordering: by name first, then by the name of the type.
      *
      * This is the same lexicographic order as comparing the tuples
      * (name, type->getName()), but the type names are requested only when the
      * column names are equal. Containers of pairs get sorted (see the set-like
      * helpers of NamesAndTypesList), so avoiding two getName() calls per
      * comparison matters, and it mirrors the short-circuiting in operator==.
      */
    bool operator<(const NameAndTypePair & rhs) const
    {
        if (name < rhs.name)
            return true;
        if (rhs.name < name)
            return false;

        /// Names are equivalent: the type name decides.
        return type->getName() < rhs.type->getName();
    }

    /// Two pairs are equal when both the names and the names of the types match.
    bool operator==(const NameAndTypePair & rhs) const
    {
        return name == rhs.name && type->getName() == rhs.type->getName();
    }
};
/// Random-access sequence of columns (name and type pairs).
using NamesAndTypes = std::vector<NameAndTypePair>;
2011-11-01 17:12:11 +00:00
2014-07-09 13:39:19 +00:00
class NamesAndTypesList : public std::list<NameAndTypePair>
{
public:
using std::list<NameAndTypePair>::list;
void readText(ReadBuffer & buf, const DataTypeFactory & data_type_factory)
{
DB::assertString("columns format version: 1\n", buf);
size_t count;
DB::readText(count, buf);
DB::assertString(" columns:\n", buf);
resize(count);
for (NameAndTypePair & it : *this)
{
DB::readBackQuotedString(it.name, buf);
DB::assertString(" ", buf);
String type_name;
DB::readString(type_name, buf);
it.type = data_type_factory.get(type_name);
DB::assertString("\n", buf);
}
}
2014-07-10 10:16:50 +00:00
void writeText(WriteBuffer & buf) const
2014-07-09 13:39:19 +00:00
{
DB::writeString("columns format version: 1\n", buf);
DB::writeText(size(), buf);
DB::writeString(" columns:\n", buf);
for (const auto & it : *this)
{
DB::writeBackQuotedString(it.name, buf);
DB::writeChar(' ', buf);
DB::writeString(it.type->getName(), buf);
DB::writeChar('\n', buf);
}
}
2014-07-10 08:40:59 +00:00
String toString() const
{
String s;
{
WriteBufferFromString out(s);
writeText(out);
}
return s;
}
2014-07-10 10:16:50 +00:00
static NamesAndTypesList parse(const String & s, const DataTypeFactory & data_type_factory)
2014-07-10 08:40:59 +00:00
{
ReadBufferFromString in(s);
NamesAndTypesList res;
2014-07-10 10:16:50 +00:00
res.readText(in, data_type_factory);
2014-07-10 08:40:59 +00:00
assertEOF(in);
return res;
}
2014-07-09 13:39:19 +00:00
/// Все элементы rhs должны быть различны.
bool isSubsetOf(const NamesAndTypesList & rhs) const
{
NamesAndTypes vector(rhs.begin(), rhs.end());
vector.insert(vector.end(), begin(), end());
std::sort(vector.begin(), vector.end());
return std::unique(vector.begin(), vector.end()) == vector.begin() + rhs.size();
}
2014-07-10 08:40:59 +00:00
/// Расстояние Хемминга между множествами
/// (иными словами, добавленные и удаленные столбцы считаются один раз; столбцы, изменившие тип, - дважды).
size_t sizeOfDifference(const NamesAndTypesList & rhs) const
{
NamesAndTypes vector(rhs.begin(), rhs.end());
vector.insert(vector.end(), begin(), end());
std::sort(vector.begin(), vector.end());
return (std::unique(vector.begin(), vector.end()) - vector.begin()) * 2 - size() - rhs.size();
}
2014-07-14 14:07:47 +00:00
Names getNames() const
{
Names res;
res.reserve(size());
2014-07-14 14:07:47 +00:00
for (const NameAndTypePair & column : *this)
{
res.push_back(column.name);
}
return res;
}
/// Оставить только столбцы, имена которых есть в names. В names могут быть лишние столбцы.
NamesAndTypesList intersect(const Names & names) const
2014-07-14 14:07:47 +00:00
{
std::set<String> name_set(names.begin(), names.end());
NamesAndTypesList res;
for (const NameAndTypePair & column : *this)
{
if (name_set.count(column.name))
res.push_back(column);
}
return res;
}
2014-07-09 13:39:19 +00:00
};
/// Shared-ownership pointer to a NamesAndTypesList.
using NamesAndTypesListPtr = SharedPtr<NamesAndTypesList>;
2010-03-18 19:32:14 +00:00
}