2017-01-07 16:11:30 +00:00
|
|
|
#pragma once
|
|
|
|
|
2020-01-04 07:31:00 +00:00
|
|
|
#include <memory>
|
2020-10-31 23:56:41 +00:00
|
|
|
#include <string>
|
2020-01-04 07:31:00 +00:00
|
|
|
|
2020-01-04 22:59:08 +00:00
|
|
|
#include <Core/Defines.h>
|
2020-01-04 07:31:00 +00:00
|
|
|
|
2017-01-07 16:11:30 +00:00
|
|
|
namespace DB
|
|
|
|
{
|
2020-01-04 07:31:00 +00:00
|
|
|
class ReadBuffer;
|
|
|
|
class WriteBuffer;
|
|
|
|
|
|
|
|
/** These are "generally recognizable" compression methods for data import/export.
|
|
|
|
* Do not mess with more efficient compression methods used by ClickHouse internally
|
|
|
|
* (they use non-standard framing, indexes, checksums...)
|
|
|
|
*/
|
|
|
|
|
2019-02-13 20:54:12 +00:00
|
|
|
enum class CompressionMethod
|
2017-01-07 16:11:30 +00:00
|
|
|
{
|
2020-01-04 22:59:08 +00:00
|
|
|
None,
|
2017-01-07 16:11:30 +00:00
|
|
|
/// DEFLATE compression with gzip header and CRC32 checksum.
|
|
|
|
/// This option corresponds to files produced by gzip(1) or HTTP Content-Encoding: gzip.
|
|
|
|
Gzip,
|
|
|
|
/// DEFLATE compression with zlib header and Adler32 checksum.
|
|
|
|
/// This option corresponds to HTTP Content-Encoding: deflate.
|
|
|
|
Zlib,
|
2020-10-31 23:56:41 +00:00
|
|
|
/// LZMA2-based content compression
|
|
|
|
/// This option corresponds to HTTP Content-Encoding: xz
|
|
|
|
Xz,
|
2020-11-17 16:02:10 +00:00
|
|
|
/// Zstd compressor
|
|
|
|
/// This option corresponds to HTTP Content-Encoding: zstd
|
|
|
|
Zstd,
|
2021-06-16 05:43:07 +00:00
|
|
|
Brotli,
|
2021-08-18 07:20:23 +00:00
|
|
|
Lz4,
|
2021-11-05 11:55:30 +00:00
|
|
|
Bzip2,
|
|
|
|
Snappy,
|
2017-01-07 16:11:30 +00:00
|
|
|
};
|
|
|
|
|
2020-01-04 07:31:00 +00:00
|
|
|
/// How the compression method is named in HTTP.
|
|
|
|
std::string toContentEncodingName(CompressionMethod method);
|
|
|
|
|
|
|
|
/** Choose compression method from path and hint.
|
|
|
|
* if hint is "auto" or empty string, then path is analyzed,
|
|
|
|
* otherwise path parameter is ignored and hint is used as compression method name.
|
|
|
|
* path is arbitrary string that will be analyzed for file extension (gz, br...) that determines compression.
|
|
|
|
*/
|
|
|
|
CompressionMethod chooseCompressionMethod(const std::string & path, const std::string & hint);
|
|
|
|
|
2022-10-04 03:13:46 +00:00
|
|
|
/** Choose a compression method from HTTP header list of supported compression methods.
|
|
|
|
*/
|
2022-10-04 19:04:03 +00:00
|
|
|
CompressionMethod chooseHTTPCompressionMethod(const std::string & list);
|
2022-10-04 03:13:46 +00:00
|
|
|
|
2022-07-07 01:47:33 +00:00
|
|
|
/// Get a range of the valid compression levels for the compression method.
|
|
|
|
std::pair<uint64_t, uint64_t> getCompressionLevelRange(const CompressionMethod & method);
|
|
|
|
|
2022-05-08 06:02:40 +00:00
|
|
|
std::unique_ptr<ReadBuffer> wrapReadBufferWithCompressionMethod(
|
|
|
|
std::unique_ptr<ReadBuffer> nested,
|
|
|
|
CompressionMethod method,
|
2022-06-18 12:55:35 +00:00
|
|
|
int zstd_window_log_max = 0,
|
2022-05-08 06:02:40 +00:00
|
|
|
size_t buf_size = DBMS_DEFAULT_BUFFER_SIZE,
|
|
|
|
char * existing_memory = nullptr,
|
|
|
|
size_t alignment = 0);
|
|
|
|
|
2022-06-18 12:55:35 +00:00
|
|
|
|
2023-10-27 02:38:36 +00:00
|
|
|
/*
|
|
|
|
template<typename WriteBufferT>
|
|
|
|
std::unique_ptr<WriteBuffer> wrapWriteBufferWithCompressionMethod(
|
|
|
|
WriteBufferT && nested,
|
|
|
|
CompressionMethod method,
|
|
|
|
int level,
|
|
|
|
size_t buf_size = DBMS_DEFAULT_BUFFER_SIZE,
|
|
|
|
char * existing_memory = nullptr,
|
|
|
|
size_t alignment = 0);
|
|
|
|
*/
|
|
|
|
|
2020-01-04 22:59:08 +00:00
|
|
|
std::unique_ptr<WriteBuffer> wrapWriteBufferWithCompressionMethod(
|
|
|
|
std::unique_ptr<WriteBuffer> nested,
|
|
|
|
CompressionMethod method,
|
|
|
|
int level,
|
|
|
|
size_t buf_size = DBMS_DEFAULT_BUFFER_SIZE,
|
|
|
|
char * existing_memory = nullptr,
|
2023-10-30 05:37:47 +00:00
|
|
|
size_t alignment = 0,
|
|
|
|
bool compress_empty = true);
|
2020-01-04 07:31:00 +00:00
|
|
|
|
2023-10-27 02:38:36 +00:00
|
|
|
std::unique_ptr<WriteBuffer> wrapWriteBufferWithCompressionMethod(
|
|
|
|
WriteBuffer * nested,
|
|
|
|
CompressionMethod method,
|
|
|
|
int level,
|
|
|
|
size_t buf_size = DBMS_DEFAULT_BUFFER_SIZE,
|
|
|
|
char * existing_memory = nullptr,
|
2023-10-30 05:37:47 +00:00
|
|
|
size_t alignment = 0,
|
|
|
|
bool compress_empty = true);
|
2023-10-27 02:38:36 +00:00
|
|
|
|
2017-01-07 16:11:30 +00:00
|
|
|
}
|