ClickHouse/src/Processors/Formats/Impl/ORCBlockInputFormat.h

58 lines
1.1 KiB
C++
Raw Normal View History

2019-08-21 14:19:47 +00:00
#pragma once
2021-10-27 23:10:39 +00:00
#include "config_formats.h"
2020-05-03 23:19:56 +00:00
#if USE_ORC
2019-08-21 14:19:47 +00:00
#include <Processors/Formats/IInputFormat.h>
#include <Formats/FormatSettings.h>
2019-08-21 14:19:47 +00:00
2021-10-31 19:53:24 +00:00
#include <arrow/adapters/orc/adapter.h>
// Forward declaration of Arrow's ORC file reader type; this header only needs the name.
namespace arrow::adapters::orc { class ORCFileReader; }
2019-08-21 14:19:47 +00:00
namespace DB
{
2021-06-02 08:51:07 +00:00
class ArrowColumnToCHColumn;
2020-05-05 12:56:54 +00:00
class ORCBlockInputFormat : public IInputFormat
2019-08-21 14:19:47 +00:00
{
public:
ORCBlockInputFormat(ReadBuffer & in_, Block header_, const FormatSettings & format_settings_);
2019-08-21 14:19:47 +00:00
String getName() const override { return "ORCBlockInputFormat"; }
void resetParser() override;
2019-08-21 14:19:47 +00:00
protected:
Chunk generate() override;
private:
// TODO: check that this class implements every part of its parent
std::unique_ptr<arrow::adapters::orc::ORCFileReader> file_reader;
2021-10-31 19:53:24 +00:00
std::shared_ptr<arrow::RecordBatchReader> batch_reader;
2021-06-02 08:51:07 +00:00
std::unique_ptr<ArrowColumnToCHColumn> arrow_column_to_ch_column;
2021-10-31 19:53:24 +00:00
std::vector<String> column_names;
int stripe_total = 0;
int stripe_current = 0;
// indices of columns to read from ORC file
std::vector<int> include_indices;
const FormatSettings format_settings;
void prepareReader();
2019-08-21 14:19:47 +00:00
};
}
#endif