mirror of
https://github.com/ClickHouse/ClickHouse.git
synced 2024-12-18 12:22:12 +00:00
2716df8ab2
Added: * IDataTypeDomain interface; * method DataTypeFactory::registerDataTypeDomain for registering domains; * DataTypeDomainWithSimpleSerialization domain base class with simple serialization/deserialization; * Concrete IPv4 and IPv6 domain implementations: DataTypeDomanIPv6 and DataTypeDomanIPv4; Updated: * IDataType text serialization/deserialization methods; * IDataType implementation to use domain for text serialization/deserialization; * Refactored implementation of the IPv4/IPv6 functions to use formatIPv4/v6 and parseIPv4/v6 from Common/formatIPv6.h; Tests: * Added test cases for IPv4 and IPv6 domains. * Updated IPv4/v6 functions tests to validate more cases; * Added performance tests for IPv4 and IPv6 related functions;
241 lines
6.8 KiB
C++
241 lines
6.8 KiB
C++
#include <IO/WriteHelpers.h>
|
|
#include <IO/WriteBufferValidUTF8.h>
|
|
#include <Formats/XMLRowOutputStream.h>
|
|
#include <Formats/FormatFactory.h>
|
|
#include <Formats/BlockOutputStreamFromRowOutputStream.h>
|
|
|
|
|
|
namespace DB
|
|
{
|
|
|
|
/// Prepares the XML row writer for a result set shaped like `sample_`.
///
/// For every column of `sample_` the constructor:
///  - records its name and type in `fields` (later printed in the <meta> section);
///  - chooses the element name used for its values in `field_tag_names`;
///  - checks whether the column type may produce text that is not valid UTF-8.
///
/// If at least one column may produce invalid UTF-8, all output is routed through
/// a WriteBufferValidUTF8 wrapper around `ostr_`; otherwise `ostr_` is written directly.
XMLRowOutputStream::XMLRowOutputStream(WriteBuffer & ostr_, const Block & sample_, const FormatSettings & format_settings)
    : dst_ostr(ostr_), format_settings(format_settings)
{
    NamesAndTypesList columns(sample_.getNamesAndTypesList());
    fields.assign(columns.begin(), columns.end());
    field_tag_names.resize(sample_.columns());

    bool need_validate_utf8 = false;
    for (size_t i = 0; i < sample_.columns(); ++i)
    {
        if (!sample_.getByPosition(i).type->textCanContainOnlyValidUTF8())
            need_validate_utf8 = true;

        /// As element names, we will use the column name if it has a valid form, or "field", otherwise.
        /// The condition below is more strict than the XML standard requires.
        const char * begin = fields[i].name.data();
        const char * end = begin + fields[i].name.size();

        /// An empty name can never be an element name: it would produce "<>".
        bool is_column_name_suitable = begin != end;

        for (const char * pos = begin; pos != end; ++pos)
        {
            char c = *pos;

            /// Letters and '_' are accepted at any position.
            /// Digits, '-' and '.' are valid inside an XML name but must not start it,
            /// so they are accepted only after the first character.
            if (!(isAlphaASCII(c)
                || c == '_'
                || (pos != begin && (isNumericASCII(c) || c == '-' || c == '.'))))
            {
                is_column_name_suitable = false;
                break;
            }
        }

        field_tag_names[i] = is_column_name_suitable
            ? fields[i].name
            : "field";
    }

    if (need_validate_utf8)
    {
        validating_ostr = std::make_unique<WriteBufferValidUTF8>(dst_ostr);
        ostr = validating_ostr.get();
    }
    else
        ostr = &dst_ostr;
}
|
|
|
|
|
|
void XMLRowOutputStream::writePrefix()
|
|
{
|
|
writeCString("<?xml version='1.0' encoding='UTF-8' ?>\n", *ostr);
|
|
writeCString("<result>\n", *ostr);
|
|
writeCString("\t<meta>\n", *ostr);
|
|
writeCString("\t\t<columns>\n", *ostr);
|
|
|
|
for (size_t i = 0; i < fields.size(); ++i)
|
|
{
|
|
writeCString("\t\t\t<column>\n", *ostr);
|
|
|
|
writeCString("\t\t\t\t<name>", *ostr);
|
|
writeXMLString(fields[i].name, *ostr);
|
|
writeCString("</name>\n", *ostr);
|
|
writeCString("\t\t\t\t<type>", *ostr);
|
|
writeXMLString(fields[i].type->getName(), *ostr);
|
|
writeCString("</type>\n", *ostr);
|
|
|
|
writeCString("\t\t\t</column>\n", *ostr);
|
|
}
|
|
|
|
writeCString("\t\t</columns>\n", *ostr);
|
|
writeCString("\t</meta>\n", *ostr);
|
|
writeCString("\t<data>\n", *ostr);
|
|
}
|
|
|
|
|
|
void XMLRowOutputStream::writeField(const IColumn & column, const IDataType & type, size_t row_num)
|
|
{
|
|
writeCString("\t\t\t<", *ostr);
|
|
writeString(field_tag_names[field_number], *ostr);
|
|
writeCString(">", *ostr);
|
|
type.serializeAsTextXML(column, row_num, *ostr, format_settings);
|
|
writeCString("</", *ostr);
|
|
writeString(field_tag_names[field_number], *ostr);
|
|
writeCString(">\n", *ostr);
|
|
++field_number;
|
|
}
|
|
|
|
|
|
void XMLRowOutputStream::writeRowStartDelimiter()
|
|
{
|
|
writeCString("\t\t<row>\n", *ostr);
|
|
}
|
|
|
|
|
|
void XMLRowOutputStream::writeRowEndDelimiter()
|
|
{
|
|
writeCString("\t\t</row>\n", *ostr);
|
|
field_number = 0;
|
|
++row_count;
|
|
}
|
|
|
|
|
|
void XMLRowOutputStream::writeSuffix()
|
|
{
|
|
writeCString("\t</data>\n", *ostr);
|
|
|
|
writeTotals();
|
|
writeExtremes();
|
|
|
|
writeCString("\t<rows>", *ostr);
|
|
writeIntText(row_count, *ostr);
|
|
writeCString("</rows>\n", *ostr);
|
|
|
|
writeRowsBeforeLimitAtLeast();
|
|
|
|
if (format_settings.write_statistics)
|
|
writeStatistics();
|
|
|
|
writeCString("</result>\n", *ostr);
|
|
ostr->next();
|
|
}
|
|
|
|
void XMLRowOutputStream::writeRowsBeforeLimitAtLeast()
|
|
{
|
|
if (applied_limit)
|
|
{
|
|
writeCString("\t<rows_before_limit_at_least>", *ostr);
|
|
writeIntText(rows_before_limit, *ostr);
|
|
writeCString("</rows_before_limit_at_least>\n", *ostr);
|
|
}
|
|
}
|
|
|
|
void XMLRowOutputStream::writeTotals()
|
|
{
|
|
if (totals)
|
|
{
|
|
writeCString("\t<totals>\n", *ostr);
|
|
|
|
size_t totals_columns = totals.columns();
|
|
for (size_t i = 0; i < totals_columns; ++i)
|
|
{
|
|
const ColumnWithTypeAndName & column = totals.safeGetByPosition(i);
|
|
|
|
writeCString("\t\t<", *ostr);
|
|
writeString(field_tag_names[i], *ostr);
|
|
writeCString(">", *ostr);
|
|
column.type->serializeAsTextXML(*column.column.get(), 0, *ostr, format_settings);
|
|
writeCString("</", *ostr);
|
|
writeString(field_tag_names[i], *ostr);
|
|
writeCString(">\n", *ostr);
|
|
}
|
|
|
|
writeCString("\t</totals>\n", *ostr);
|
|
}
|
|
}
|
|
|
|
|
|
static void writeExtremesElement(
|
|
const char * title, const Block & extremes, size_t row_num, const Names & field_tag_names, WriteBuffer & ostr, const FormatSettings & format_settings)
|
|
{
|
|
writeCString("\t\t<", ostr);
|
|
writeCString(title, ostr);
|
|
writeCString(">\n", ostr);
|
|
|
|
size_t extremes_columns = extremes.columns();
|
|
for (size_t i = 0; i < extremes_columns; ++i)
|
|
{
|
|
const ColumnWithTypeAndName & column = extremes.safeGetByPosition(i);
|
|
|
|
writeCString("\t\t\t<", ostr);
|
|
writeString(field_tag_names[i], ostr);
|
|
writeCString(">", ostr);
|
|
column.type->serializeAsTextXML(*column.column.get(), row_num, ostr, format_settings);
|
|
writeCString("</", ostr);
|
|
writeString(field_tag_names[i], ostr);
|
|
writeCString(">\n", ostr);
|
|
}
|
|
|
|
writeCString("\t\t</", ostr);
|
|
writeCString(title, ostr);
|
|
writeCString(">\n", ostr);
|
|
}
|
|
|
|
void XMLRowOutputStream::writeExtremes()
|
|
{
|
|
if (extremes)
|
|
{
|
|
writeCString("\t<extremes>\n", *ostr);
|
|
writeExtremesElement("min", extremes, 0, field_tag_names, *ostr, format_settings);
|
|
writeExtremesElement("max", extremes, 1, field_tag_names, *ostr, format_settings);
|
|
writeCString("\t</extremes>\n", *ostr);
|
|
}
|
|
}
|
|
|
|
|
|
void XMLRowOutputStream::onProgress(const Progress & value)
|
|
{
|
|
progress.incrementPiecewiseAtomically(value);
|
|
}
|
|
|
|
|
|
void XMLRowOutputStream::writeStatistics()
|
|
{
|
|
writeCString("\t<statistics>\n", *ostr);
|
|
writeCString("\t\t<elapsed>", *ostr);
|
|
writeText(watch.elapsedSeconds(), *ostr);
|
|
writeCString("</elapsed>\n", *ostr);
|
|
writeCString("\t\t<rows_read>", *ostr);
|
|
writeText(progress.rows.load(), *ostr);
|
|
writeCString("</rows_read>\n", *ostr);
|
|
writeCString("\t\t<bytes_read>", *ostr);
|
|
writeText(progress.bytes.load(), *ostr);
|
|
writeCString("</bytes_read>\n", *ostr);
|
|
writeCString("\t</statistics>\n", *ostr);
|
|
}
|
|
|
|
|
|
/// Registers the "XML" output format in `factory`.
/// The registered creator wraps an XMLRowOutputStream into a
/// BlockOutputStreamFromRowOutputStream; the Context argument is not used.
void registerOutputFormatXML(FormatFactory & factory)
{
    auto create_xml_output = [](
        WriteBuffer & buf,
        const Block & sample,
        const Context &,
        const FormatSettings & settings)
    {
        return std::make_shared<BlockOutputStreamFromRowOutputStream>(
            std::make_shared<XMLRowOutputStream>(buf, sample, settings),
            sample);
    };

    factory.registerOutputFormat("XML", create_xml_output);
}
|
|
|
|
}
|