2019-08-17 22:53:46 +00:00
|
|
|
#include "ProtobufRowInputFormat.h"
|
2019-02-21 18:36:46 +00:00
|
|
|
|
2019-08-04 12:43:11 +00:00
|
|
|
#if USE_PROTOBUF
|
2021-01-11 01:50:30 +00:00
|
|
|
# include <Core/Block.h>
|
|
|
|
# include <Formats/FormatFactory.h>
|
|
|
|
# include <Formats/FormatSchemaInfo.h>
|
|
|
|
# include <Formats/ProtobufReader.h>
|
|
|
|
# include <Formats/ProtobufSchemas.h>
|
|
|
|
# include <Formats/ProtobufSerializer.h>
|
|
|
|
# include <Interpreters/Context.h>
|
2021-10-02 07:13:14 +00:00
|
|
|
# include <base/range.h>
|
2019-02-21 18:36:46 +00:00
|
|
|
|
|
|
|
|
|
|
|
namespace DB
|
|
|
|
{
|
2021-01-11 01:50:30 +00:00
|
|
|
/// Builds a row input format that reads protobuf messages from `in_`.
///
/// `header_`, `in_` and `params_` are forwarded to the IRowInputFormat base.
/// A ProtobufReader is created on top of `in_`, and a serializer is created from the
/// header's column names and data types, the message type that ProtobufSchemas resolves
/// for `schema_info_`, the `with_length_delimiter_` flag and that reader.
///
/// NOTE(review): `missing_column_indices` and `*reader` are used while initializing `serializer`,
/// so they presumably have to be declared before `serializer` in the class - confirm against the header.
ProtobufRowInputFormat::ProtobufRowInputFormat(
    ReadBuffer & in_,
    const Block & header_,
    const Params & params_,
    const FormatSchemaInfo & schema_info_,
    bool with_length_delimiter_)
    : IRowInputFormat(header_, in_, params_)
    , reader(std::make_unique<ProtobufReader>(in_))
    , serializer(ProtobufSerializer::create(
          header_.getNames(),
          header_.getDataTypes(),
          /// Presumably filled by create(); readRow() later uses it to mark columns as not read.
          missing_column_indices,
          *ProtobufSchemas::instance().getMessageTypeForFormatSchema(schema_info_),
          with_length_delimiter_,
          *reader))
{
}
|
|
|
|
|
|
|
|
/// Defaulted destructor, defined out of line in this translation unit.
/// NOTE(review): presumably kept here so the header can hold smart pointers to
/// forward-declared types (e.g. ProtobufReader) - confirm against the header.
ProtobufRowInputFormat::~ProtobufRowInputFormat() = default;
|
|
|
|
|
2021-01-11 01:50:30 +00:00
|
|
|
/// Reads a single row into `columns`.
///
/// Returns false (leaving `columns` and `row_read_extension` untouched) when the reader reports
/// end of input. Otherwise reads one row through the serializer, fills
/// `row_read_extension.read_columns` with one flag per column - true for every column except those
/// listed in `missing_column_indices` - and returns true.
bool ProtobufRowInputFormat::readRow(MutableColumns & columns, RowReadExtension & row_read_extension)
{
    if (reader->eof())
        return false;

    /// Index of the row about to be read: the current size of the first column (0 if there are no columns).
    const size_t rows_so_far = columns.empty() ? 0 : columns[0]->size();

    /// The columns are handed to the serializer only while they hold no rows yet.
    if (rows_so_far == 0)
        serializer->setColumns(columns.data(), columns.size());

    serializer->readRow(rows_so_far);

    /// Start from "every column was read", then unset the flags of the missing columns.
    auto & read_flags = row_read_extension.read_columns;
    read_flags.clear();
    read_flags.resize(columns.size(), true);
    for (size_t missing_idx : missing_column_indices)
        read_flags[missing_idx] = false;

    return true;
}
|
|
|
|
|
|
|
|
bool ProtobufRowInputFormat::allowSyncAfterError() const
|
|
|
|
{
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
void ProtobufRowInputFormat::syncAfterError()
|
|
|
|
{
|
2021-01-11 01:50:30 +00:00
|
|
|
reader->endMessage(true);
|
2019-02-21 18:36:46 +00:00
|
|
|
}
|
|
|
|
|
2021-10-11 16:11:50 +00:00
|
|
|
/// Registers the two protobuf input formats in `factory`:
/// "ProtobufSingle" (created with with_length_delimiter = false) and
/// "Protobuf" (created with with_length_delimiter = true), in that order.
/// Both build their FormatSchemaInfo with the "Protobuf" format name.
void registerInputFormatProtobuf(FormatFactory & factory)
{
    for (bool with_length_delimiter : {false, true})
    {
        const char * format_name = with_length_delimiter ? "Protobuf" : "ProtobufSingle";

        /// The flag is captured by value, so each registered creator remembers its own variant.
        auto creator = [with_length_delimiter](
            ReadBuffer & buf,
            const Block & sample,
            IRowInputFormat::Params params,
            const FormatSettings & settings)
        {
            return std::make_shared<ProtobufRowInputFormat>(
                buf,
                sample,
                std::move(params),
                FormatSchemaInfo(settings, "Protobuf", true),
                with_length_delimiter);
        };

        factory.registerInputFormat(format_name, std::move(creator));
    }
}
|
|
|
|
|
2021-12-15 11:30:57 +00:00
|
|
|
/// Builds the schema description used by readSchema() from the `schema` section of `format_settings`
/// (format_schema, is_server, format_schema_path).
/// The literal arguments "Protobuf" and `true` are the same ones the input-format registration
/// in this file passes when it constructs its FormatSchemaInfo.
ProtobufSchemaReader::ProtobufSchemaReader(const FormatSettings & format_settings)
    : schema_info(
          format_settings.schema.format_schema,
          "Protobuf",
          true,
          format_settings.schema.is_server,
          format_settings.schema.format_schema_path)
{
}
|
|
|
|
|
|
|
|
/// Resolves the message type for the stored `schema_info` through ProtobufSchemas and
/// returns the result of converting it with protobufSchemaToCHSchema().
NamesAndTypesList ProtobufSchemaReader::readSchema()
{
    return protobufSchemaToCHSchema(ProtobufSchemas::instance().getMessageTypeForFormatSchema(schema_info));
}
|
|
|
|
|
|
|
|
/// Registers an external schema reader for "Protobuf" and then for "ProtobufSingle".
/// Both names get the same creator: it builds a ProtobufSchemaReader from the format settings.
void registerProtobufSchemaReader(FormatFactory & factory)
{
    for (const char * format_name : {"Protobuf", "ProtobufSingle"})
    {
        factory.registerExternalSchemaReader(format_name, [](const FormatSettings & settings)
        {
            return std::make_shared<ProtobufSchemaReader>(settings);
        });
    }
}
|
|
|
|
|
2019-02-21 18:36:46 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
#else
|
|
|
|
|
|
|
|
/// Fallback for builds where USE_PROTOBUF is not enabled: the registration entry points
/// are still defined, but they register nothing.
namespace DB
{

class FormatFactory;

/// No-op: no protobuf input format is registered in this configuration.
void registerInputFormatProtobuf(FormatFactory &)
{
}

/// No-op: no protobuf schema reader is registered in this configuration.
void registerProtobufSchemaReader(FormatFactory &)
{
}

}
|
|
|
|
|
|
|
|
#endif
|