ClickHouse/dbms/src/IO/CompressedStream.h

#pragma once

#include <cstdint>

/** Common Defines */

/// Size limit equal to 0x40000000 bytes (2^30, i.e. 1 GiB); the ULL suffix makes the constant unsigned long long.
/// NOTE(review): presumably the upper bound accepted for the size of a single compressed block -
/// confirm against the readers/writers that use this macro.
#define DBMS_MAX_COMPRESSED_SIZE 0x40000000ULL    /// 1GB

/// Size in bytes of the header of a compressed block.
/// NOTE(review): 9 matches 1 (method byte) + 4 (compressed size) + 4 (uncompressed size) from the block format
/// described in this file; the 16-byte checksum appears not to be counted here - confirm against the users.
#define COMPRESSED_BLOCK_HEADER_SIZE 9


namespace DB
{

/** Identifies the compression algorithm.
  * Every enumerator has an explicitly assigned numeric value.
  */
enum class CompressionMethod
{
    LZ4 = 1,

    /// The format is the same as for LZ4. The difference is only in compression.
    LZ4HC = 2,

    /// Experimental algorithm: https://github.com/Cyan4973/zstd
    ZSTD = 3,
};

/** Layout of a compressed block.
  *
  * First 16 bytes: checksum of all the other bytes of the block.
  *  Currently only CityHash128 is used. Other checksums may be introduced in the future,
  *  but they cannot differ in size.
  *
  * Next byte: identifier of the compression algorithm. Everything after it depends on the algorithm.
  *
  * 0x82 - LZ4 or LZ4HC (both use the same format).
  *        Followed by 4 bytes - the size of the compressed data, including the header;
  *        then 4 bytes - the size of the uncompressed data.
  *
  * 0x90 - ZSTD
  *
  * All sizes are little endian.
  *
  * NOTE: Why 0x82?
  * Originally QuickLZ was the only method in use; LZ4 was added later.
  * The high bit is set to tell the block apart from a QuickLZ one, and the second bit is set for compatibility,
  *  so that the functions qlz_size_compressed, qlz_size_decompressed keep working.
  * That compatibility is no longer relevant, though.
  */

enum class CompressionMethodByte : uint8_t
{
    /// Used for both LZ4 and LZ4HC, since their formats are identical.
    LZ4 = 0x82,

    ZSTD = 0x90,
};

}
dbms: development [#CONV-2944]. 2012-01-05 10:22:02 +00:00			`#pragma once`
Merge 2011-06-17 21:19:39 +00:00
More include fixes (#462) * More include fixes * fix 2017-02-07 21:26:32 +00:00			`#include <cstdint>`

translate comments: IO 2017-05-28 14:29:40 +00:00			`/** Common Defines */`
Merge 2011-06-17 21:19:39 +00:00
Changed tabs to spaces in code [#CLICKHOUSE-3]. 2017-04-01 07:20:54 +00:00			`#define DBMS_MAX_COMPRESSED_SIZE 0x40000000ULL /// 1GB`
dbms: added LZ4 [#CONV-2944]. 2012-01-05 18:35:22 +00:00
dbms: disabled QuickLZ [#METR-17973]. 2016-02-03 21:16:19 +00:00			`#define COMPRESSED_BLOCK_HEADER_SIZE 9`
dbms: added LZ4 [#CONV-2944]. 2012-01-05 18:35:22 +00:00

			`namespace DB`
			`{`

translate comments: IO 2017-05-28 14:29:40 +00:00			`/** Compression method */`
dbms: added ZSTD algorithm (experimental) [#METR-15386]. 2015-03-09 01:15:43 +00:00			`enum class CompressionMethod`
dbms: added LZ4 [#CONV-2944]. 2012-01-05 18:35:22 +00:00			`{`
Changed tabs to spaces in code [#CLICKHOUSE-3]. 2017-04-01 07:20:54 +00:00			`LZ4 = 1,`
translate comments: IO 2017-05-28 14:29:40 +00:00			`LZ4HC = 2, /// The format is the same as for LZ4. The difference is only in compression.`
			`ZSTD = 3, /// Experimental algorithm: https://github.com/Cyan4973/zstd`
dbms: added ZSTD algorithm (experimental) [#METR-15386]. 2015-03-09 01:15:43 +00:00			`};`

translate comments: IO 2017-05-28 14:29:40 +00:00			`/** The compressed block format is as follows:`
dbms: added ZSTD algorithm (experimental) [#METR-15386]. 2015-03-09 01:15:43 +00:00			`*`
translate comments: IO 2017-05-28 14:29:40 +00:00			`* The first 16 bytes are the checksum from all other bytes of the block. Now only CityHash128 is used.`
			`* In the future, you can provide other checksums, although it will not be possible to make them different in size.`
dbms: added ZSTD algorithm (experimental) [#METR-15386]. 2015-03-09 01:15:43 +00:00			`*`
translate comments: IO 2017-05-28 14:29:40 +00:00			`* The next byte specifies the compression algorithm. Then everything depends on the algorithm.`
dbms: added ZSTD algorithm (experimental) [#METR-15386]. 2015-03-09 01:15:43 +00:00			`*`
translate comments: IO 2017-05-28 14:29:40 +00:00			`* 0x82 - LZ4 or LZ4HC (they have the same format).`
			`* Next 4 bytes - the size of the compressed data, taking into account the header; 4 bytes is the size of the uncompressed data.`
dbms: added ZSTD algorithm (experimental) [#METR-15386]. 2015-03-09 01:15:43 +00:00			`*`
translate comments: IO 2017-05-28 14:29:40 +00:00			`* NOTE: Why is 0x82?`
			`* Originally only QuickLZ was used. Then LZ4 was added.`
			`* The high bit is set to distinguish from QuickLZ, and the second bit is set for compatibility,`
			`* for the functions qlz_size_compressed, qlz_size_decompressed to work.`
			`* Although now such compatibility is no longer relevant.`
dbms: added ZSTD algorithm (experimental) [#METR-15386]. 2015-03-09 01:15:43 +00:00			`*`
			`* 0x90 - ZSTD`
			`*`
translate comments: IO 2017-05-28 14:29:40 +00:00			`* All sizes are little endian.`
dbms: added ZSTD algorithm (experimental) [#METR-15386]. 2015-03-09 01:15:43 +00:00			`*/`

			`enum class CompressionMethodByte : uint8_t`
			`{`
Removed support for QuickLZ (obsolete) [#CLICKHOUSE-2]. 2017-06-15 18:21:59 +00:00			`LZ4 = 0x82,`
			`ZSTD = 0x90,`
dbms: added ZSTD algorithm (experimental) [#METR-15386]. 2015-03-09 01:15:43 +00:00			`};`
dbms: added LZ4 [#CONV-2944]. 2012-01-05 18:35:22 +00:00
			`}`