ClickHouse/src/Storages/StorageURL.h

134 lines
4.2 KiB
C++
Raw Normal View History

2018-06-11 12:13:00 +00:00
#pragma once
#include <Storages/IStorage.h>
#include <Poco/URI.h>
#include <ext/shared_ptr_helper.h>
2020-04-28 00:56:44 +00:00
#include <DataStreams/IBlockOutputStream.h>
#include <Formats/FormatSettings.h>
2020-04-28 00:56:44 +00:00
#include <IO/CompressionMethod.h>
2018-06-11 12:13:00 +00:00
2019-08-24 21:20:20 +00:00
2018-06-11 12:13:00 +00:00
namespace DB
{
struct ConnectionTimeouts;
2018-06-11 12:13:00 +00:00
/**
 * This class represents the table engine for external URLs.
 * It sends an HTTP GET request to the server when SELECT is called and
 * an HTTP POST request when INSERT is called. In the POST request the data is sent
 * using chunked transfer encoding, so the server has to support it.
 */
class IStorageURLBase : public IStorage
2018-06-11 12:13:00 +00:00
{
public:
2020-08-03 13:54:14 +00:00
Pipe read(
2019-08-24 21:20:20 +00:00
const Names & column_names,
const StorageMetadataPtr & /*metadata_snapshot*/,
SelectQueryInfo & query_info,
2018-06-11 12:13:00 +00:00
const Context & context,
2018-06-25 12:21:54 +00:00
QueryProcessingStage::Enum processed_stage,
size_t max_block_size,
2018-06-11 12:13:00 +00:00
unsigned num_streams) override;
BlockOutputStreamPtr write(const ASTPtr & query, const StorageMetadataPtr & /*metadata_snapshot*/, const Context & context) override;
2018-06-11 12:13:00 +00:00
protected:
2019-08-24 21:20:20 +00:00
IStorageURLBase(
const Poco::URI & uri_,
const Context & context_,
2019-12-04 16:06:55 +00:00
const StorageID & id_,
2018-06-11 12:13:00 +00:00
const String & format_name_,
const std::optional<FormatSettings> & format_settings_,
2019-08-24 21:20:20 +00:00
const ColumnsDescription & columns_,
const ConstraintsDescription & constraints_,
const String & compression_method_);
2018-06-11 12:13:00 +00:00
Poco::URI uri;
const Context & context_global;
String compression_method;
2018-06-11 12:13:00 +00:00
String format_name;
// For URL engine, we use format settings from server context + `SETTINGS`
// clause of the `CREATE` query. In this case, format_settings is set.
// For `url` table function, we use settings from current query context.
// In this case, format_settings is not set.
std::optional<FormatSettings> format_settings;
2018-06-11 12:13:00 +00:00
2020-04-28 00:56:44 +00:00
private:
virtual std::string getReadMethod() const;
2019-08-24 21:20:20 +00:00
virtual std::vector<std::pair<std::string, std::string>> getReadURIParams(
const Names & column_names,
const StorageMetadataPtr & metadata_snapshot,
const SelectQueryInfo & query_info,
const Context & context,
QueryProcessingStage::Enum & processed_stage,
size_t max_block_size) const;
2019-08-24 21:20:20 +00:00
virtual std::function<void(std::ostream &)> getReadPOSTDataCallback(
const Names & column_names,
const StorageMetadataPtr & /*metadata_snapshot*/,
const SelectQueryInfo & query_info,
const Context & context,
QueryProcessingStage::Enum & processed_stage,
size_t max_block_size) const;
2018-09-22 14:58:03 +00:00
virtual Block getHeaderBlock(const Names & column_names, const StorageMetadataPtr & metadata_snapshot) const = 0;
};
2020-04-28 00:56:44 +00:00
class StorageURLBlockOutputStream : public IBlockOutputStream
{
public:
StorageURLBlockOutputStream(
const Poco::URI & uri,
const String & format,
const std::optional<FormatSettings> & format_settings,
const Block & sample_block_,
const Context & context,
const ConnectionTimeouts & timeouts,
const CompressionMethod compression_method);
2020-04-28 00:56:44 +00:00
Block getHeader() const override
{
return sample_block;
}
2020-07-09 01:00:16 +00:00
void write(const Block & block) override;
void writePrefix() override;
void writeSuffix() override;
2020-04-28 00:56:44 +00:00
private:
Block sample_block;
std::unique_ptr<WriteBuffer> write_buf;
BlockOutputStreamPtr writer;
};
2019-08-24 21:20:20 +00:00
/// Concrete URL storage. It adds nothing to IStorageURLBase beyond the engine
/// name and the header block, which is taken from the metadata snapshot.
class StorageURL final : public ext::shared_ptr_helper<StorageURL>, public IStorageURLBase
{
    friend struct ext::shared_ptr_helper<StorageURL>;

public:
    /// Forwards every argument to IStorageURLBase. Note that the parameter
    /// order differs from the base constructor: here `context_` comes after
    /// `constraints_`, while the base takes it second.
    StorageURL(const Poco::URI & uri_,
               const StorageID & table_id_,
               const String & format_name_,
               const std::optional<FormatSettings> & format_settings_,
               const ColumnsDescription & columns_,
               const ConstraintsDescription & constraints_,
               Context & context_,
               const String & compression_method_)
        : IStorageURLBase(uri_, context_, table_id_, format_name_,
                          format_settings_, columns_, constraints_, compression_method_)
    {
    }

    /// Engine name of this storage.
    String getName() const override
    {
        return "URL";
    }

    /// Returns the sample block of the metadata snapshot; the requested
    /// column names are ignored.
    Block getHeaderBlock(const Names & /*column_names*/, const StorageMetadataPtr & metadata_snapshot) const override
    {
        return metadata_snapshot->getSampleBlock();
    }
};
}