ClickHouse/dbms/src/Dictionaries/HTTPDictionarySource.cpp

142 lines
4.6 KiB
C++
Raw Normal View History

2016-11-15 19:51:06 +00:00
#include <DB/Dictionaries/HTTPDictionarySource.h>
#include <DB/Interpreters/Context.h>
#include <DB/Dictionaries/OwningBufferBlockInputStream.h>
2016-11-19 00:07:58 +00:00
#include <DB/Dictionaries/OwningBlockInputStream.h>
2016-11-15 19:51:06 +00:00
#include <DB/IO/ReadBufferFromHTTP.h>
2016-11-19 00:07:58 +00:00
#include <DB/IO/ReadWriteBufferFromHTTP.h>
2016-11-15 19:51:06 +00:00
2016-11-22 15:03:54 +00:00
#include <DB/DataStreams/IBlockOutputStream.h>
#include <DB/DataTypes/DataTypesNumberFixed.h>
#include <DB/IO/WriteBufferFromOStream.h>
2016-11-15 19:51:06 +00:00
namespace DB
{
2016-11-22 15:03:54 +00:00
HTTPDictionarySource::HTTPDictionarySource(const DictionaryStructure & dict_struct_,
const Poco::Util::AbstractConfiguration & config, const std::string & config_prefix,
Block & sample_block, const Context & context) :
2016-11-18 01:48:13 +00:00
dict_struct{dict_struct_},
2016-11-19 00:07:58 +00:00
host{config.getString(config_prefix + ".host", "::1")},
port{std::stoi(config.getString(config_prefix + ".port", "80"))},
path{config.getString(config_prefix + ".path", "")},
//method{config.getString(config_prefix + ".method", "")},
2016-11-15 23:55:45 +00:00
format{config.getString(config_prefix + ".format")},
2016-11-22 15:03:54 +00:00
selective{!config.getString(config_prefix + ".selective", "").empty()}, // todo! how to correct?
2016-11-15 22:05:49 +00:00
sample_block{sample_block},
context(context)
2016-11-15 19:51:06 +00:00
{
}
2016-11-15 22:05:49 +00:00
/// Copy constructor: duplicates the dictionary structure, the connection
/// settings (host, port, path), the format name, the selective flag and the
/// sample block of `other`, and binds to the same context as `other`.
HTTPDictionarySource::HTTPDictionarySource(const HTTPDictionarySource & other)
    : dict_struct(other.dict_struct)
    , host(other.host)
    , port(other.port)
    , path(other.path)
    , format(other.format)
    , selective(other.selective)
    , sample_block(other.sample_block)
    , context(other.context)
{
}
/// Requests the configured host/port/path with HTTP GET and returns a block
/// stream that parses the response body in the configured format.
BlockInputStreamPtr HTTPDictionarySource::loadAll()
{
    LOG_TRACE(log, "loadAll " + toString());

    auto http_buffer = std::make_unique<ReadBufferFromHTTP>(
        host, port, path, ReadBufferFromHTTP::Params(), Poco::Net::HTTPRequest::HTTP_GET);

    auto parsed_blocks = context.getInputFormat(format, *http_buffer, sample_block, max_block_size);

    // The parser only holds a reference to the buffer, so ownership of the buffer
    // is handed to the returned stream together with the parser.
    return std::make_shared<OwningBufferBlockInputStream>(parsed_blocks, std::move(http_buffer));
}
/** Sends `ids` to the server in the body of an HTTP POST request and returns a
  * block stream that parses the response in the configured format.
  *
  * The request body is a single-column UInt64 block serialized with the
  * configured output format.
  */
BlockInputStreamPtr HTTPDictionarySource::loadIds(const std::vector<UInt64> & ids)
{
    LOG_TRACE(log, "loadIds " + toString());

    HTTPLocation http_location;
    http_location.host = host;
    http_location.port = port;
    http_location.path = path;
    http_location.method = Poco::Net::HTTPRequest::HTTP_POST;

    // NOTE(review): everything is captured by reference; this assumes the callback
    // is invoked before this function returns - confirm against ReadWriteBufferFromHTTP.
    ReadWriteBufferFromHTTP::OutStreamCallback out_stream_callback = [&](std::ostream & out_stream)
    {
        // TODO: same logic as in ExecutableDictionarySource.cpp, extract a shared function.
        ColumnWithTypeAndName column;
        column.type = std::make_shared<DataTypeUInt64>();
        column.column = column.type->createColumn();
        column.column->reserve(ids.size());
        for (const auto id : ids)
            column.column->insert(id);

        Block block;
        block.insert(std::move(column));

        WriteBufferFromOStream out_buffer(out_stream);
        auto stream_out = context.getOutputFormat(format, out_buffer, sample_block);

        // Formats that emit a header or footer need the full prefix/write/suffix
        // sequence; flush() pushes any data the format still buffers.
        stream_out->writePrefix();
        stream_out->write(block);
        stream_out->writeSuffix();
        stream_out->flush();
    };

    auto in_ptr = std::make_unique<ReadWriteBufferFromHTTP>(http_location, out_stream_callback);
    auto stream = context.getInputFormat(format, *in_ptr, sample_block, max_block_size);

    // The returned stream takes ownership of the buffer the parser reads from.
    return std::make_shared<OwningBlockInputStream<ReadWriteBufferFromHTTP>>(stream, std::move(in_ptr));
}
/** Sends the requested composite keys to the server in the body of an HTTP POST
  * request and returns a block stream that parses the response in the configured format.
  *
  * @param key_columns     one column per key attribute, in the order of `dict_struct.key`
  * @param requested_rows  indices of the rows of `key_columns` to send; rows that
  *                        are not listed are not transmitted
  */
BlockInputStreamPtr HTTPDictionarySource::loadKeys(
    const ConstColumnPlainPtrs & key_columns, const std::vector<std::size_t> & requested_rows)
{
    LOG_TRACE(log, "loadKeys " + toString());

    HTTPLocation http_location;
    http_location.host = host;
    http_location.port = port;
    http_location.path = path;
    http_location.method = Poco::Net::HTTPRequest::HTTP_POST;

    // NOTE(review): everything is captured by reference; this assumes the callback
    // is invoked before this function returns - confirm against ReadWriteBufferFromHTTP.
    ReadWriteBufferFromHTTP::OutStreamCallback out_stream_callback = [&](std::ostream & out_stream)
    {
        // TODO: same logic as in ExecutableDictionarySource.cpp, extract a shared function.
        Block block;
        const auto keys_size = key_columns.size();
        for (const auto i : ext::range(0, keys_size))
        {
            const auto & key_description = (*dict_struct.key)[i];
            const auto & key = key_columns[i];

            ColumnWithTypeAndName column;
            column.type = key_description.type;

            // Copy only the requested rows instead of cloning the whole key column.
            column.column = key->cloneEmpty();
            column.column->reserve(requested_rows.size());
            for (const auto row : requested_rows)
                column.column->insertFrom(*key, row);

            block.insert(std::move(column));
        }

        WriteBufferFromOStream out_buffer(out_stream);
        auto stream_out = context.getOutputFormat(format, out_buffer, sample_block);

        // Formats that emit a header or footer need the full prefix/write/suffix
        // sequence; flush() pushes any data the format still buffers.
        stream_out->writePrefix();
        stream_out->write(block);
        stream_out->writeSuffix();
        stream_out->flush();
    };

    auto in_ptr = std::make_unique<ReadWriteBufferFromHTTP>(http_location, out_stream_callback);
    auto stream = context.getInputFormat(format, *in_ptr, sample_block, max_block_size);

    // The returned stream takes ownership of the buffer the parser reads from.
    return std::make_shared<OwningBlockInputStream<ReadWriteBufferFromHTTP>>(stream, std::move(in_ptr));
}
/// Always answers `true`: this source performs no change detection of its own.
/// NOTE(review): presumably this makes callers reload on every check - confirm against the caller.
bool HTTPDictionarySource::isModified() const
{
    return true;
}
bool HTTPDictionarySource::supportsSelectiveLoad() const
{
2016-11-22 15:03:54 +00:00
return selective;
2016-11-15 19:51:06 +00:00
}
/// Creates a new source that is a copy of this one, built with the copy constructor.
DictionarySourcePtr HTTPDictionarySource::clone() const
{
    return std::make_unique<HTTPDictionarySource>(*this);
}
std::string HTTPDictionarySource::toString() const
{
2016-11-15 23:55:45 +00:00
return "http://" + host + ":" + std::to_string(port) + "/" + path;
2016-11-15 19:51:06 +00:00
}
}