2011-10-24 12:10:59 +00:00
|
|
|
#pragma once
|
|
|
|
|
2017-04-01 09:19:00 +00:00
|
|
|
#include <IO/ReadBufferFromFileBase.h>
|
2022-07-20 20:30:16 +00:00
|
|
|
#include <Interpreters/Context_fwd.h>
|
2023-03-30 17:02:28 +00:00
|
|
|
#include <Common/Throttler_fwd.h>
|
2020-02-17 14:27:09 +00:00
|
|
|
|
|
|
|
#include <unistd.h>
|
2016-10-24 02:02:37 +00:00
|
|
|
|
2016-10-24 04:06:27 +00:00
|
|
|
|
2011-10-24 12:10:59 +00:00
|
|
|
namespace DB
|
|
|
|
{
|
|
|
|
|
2016-10-24 02:02:37 +00:00
|
|
|
/** Use ready file descriptor. Does not open or close a file.
|
2011-10-24 12:10:59 +00:00
|
|
|
*/
|
2015-03-30 15:39:55 +00:00
|
|
|
class ReadBufferFromFileDescriptor : public ReadBufferFromFileBase
|
2011-10-24 12:10:59 +00:00
|
|
|
{
|
|
|
|
protected:
|
2021-07-12 01:12:34 +00:00
|
|
|
const size_t required_alignment = 0; /// For O_DIRECT both file offsets and memory addresses have to be aligned.
|
|
|
|
bool use_pread = false; /// To access one fd from multiple threads, use 'pread' syscall instead of 'read'.
|
|
|
|
|
|
|
|
size_t file_offset_of_buffer_end = 0; /// What offset in file corresponds to working_buffer.end().
|
2022-04-26 10:55:27 +00:00
|
|
|
|
2011-10-24 12:10:59 +00:00
|
|
|
int fd;
|
2015-04-16 12:06:05 +00:00
|
|
|
|
2023-03-30 17:02:28 +00:00
|
|
|
ThrottlerPtr throttler;
|
|
|
|
|
2016-10-25 06:49:24 +00:00
|
|
|
bool nextImpl() override;
|
2023-05-26 13:55:30 +00:00
|
|
|
void prefetch(Priority priority) override;
|
2011-10-24 12:10:59 +00:00
|
|
|
|
2016-10-24 02:02:37 +00:00
|
|
|
/// Name or some description of file.
|
2016-10-25 06:49:24 +00:00
|
|
|
std::string getFileName() const override;
|
2011-10-24 12:10:59 +00:00
|
|
|
|
2023-05-05 03:11:51 +00:00
|
|
|
/// Does the read()/pread(), with all the metric increments, error handling, throttling, etc.
|
|
|
|
/// Doesn't seek (`offset` must match fd's position if !use_pread).
|
|
|
|
/// Stops after min_bytes or eof. Returns 0 if eof.
|
|
|
|
/// Thread safe.
|
2024-03-03 13:22:40 +00:00
|
|
|
size_t readImpl(char * to, size_t min_bytes, size_t max_bytes, size_t offset) const;
|
2023-05-05 03:11:51 +00:00
|
|
|
|
2011-10-24 12:10:59 +00:00
|
|
|
public:
|
2022-03-13 11:59:20 +00:00
|
|
|
explicit ReadBufferFromFileDescriptor(
|
2022-01-03 16:05:46 +00:00
|
|
|
int fd_,
|
|
|
|
size_t buf_size = DBMS_DEFAULT_BUFFER_SIZE,
|
|
|
|
char * existing_memory = nullptr,
|
|
|
|
size_t alignment = 0,
|
2023-03-30 17:02:28 +00:00
|
|
|
std::optional<size_t> file_size_ = std::nullopt,
|
|
|
|
ThrottlerPtr throttler_ = {})
|
2022-01-03 16:05:46 +00:00
|
|
|
: ReadBufferFromFileBase(buf_size, existing_memory, alignment, file_size_)
|
|
|
|
, required_alignment(alignment)
|
|
|
|
, fd(fd_)
|
2023-03-30 17:02:28 +00:00
|
|
|
, throttler(throttler_)
|
2021-07-12 01:12:34 +00:00
|
|
|
{
|
|
|
|
}
|
2017-08-30 20:23:29 +00:00
|
|
|
|
2020-02-14 14:28:33 +00:00
|
|
|
int getFD() const
|
2011-12-28 20:01:41 +00:00
|
|
|
{
|
|
|
|
return fd;
|
|
|
|
}
|
|
|
|
|
2020-02-14 14:28:33 +00:00
|
|
|
off_t getPosition() override
|
2015-04-03 13:45:44 +00:00
|
|
|
{
|
2020-07-31 14:53:41 +00:00
|
|
|
return file_offset_of_buffer_end - (working_buffer.end() - pos);
|
2015-04-03 13:45:44 +00:00
|
|
|
}
|
|
|
|
|
2022-05-30 18:35:31 +00:00
|
|
|
size_t getFileOffsetOfBufferEnd() const override { return file_offset_of_buffer_end; }
|
|
|
|
|
2016-10-24 02:02:37 +00:00
|
|
|
/// If 'offset' is small enough to stay in buffer after seek, then true seek in file does not happen.
|
2020-01-27 18:44:30 +00:00
|
|
|
off_t seek(off_t off, int whence) override;
|
2015-12-13 08:51:28 +00:00
|
|
|
|
2021-07-04 03:03:49 +00:00
|
|
|
/// Seek to the beginning, discarding already read data if any. Useful to reread file that changes on every read.
|
|
|
|
void rewind();
|
|
|
|
|
2024-07-18 02:54:36 +00:00
|
|
|
std::optional<size_t> tryGetFileSize() override;
|
2021-04-28 16:25:14 +00:00
|
|
|
|
2023-05-05 03:11:51 +00:00
|
|
|
bool checkIfActuallySeekable() override;
|
|
|
|
|
2024-03-03 13:22:40 +00:00
|
|
|
size_t readBigAt(char * to, size_t n, size_t offset, const std::function<bool(size_t)> &) const override;
|
2023-05-05 03:11:51 +00:00
|
|
|
bool supportsReadAt() override { return use_pread; }
|
2011-10-24 12:10:59 +00:00
|
|
|
};
|
|
|
|
|
2021-07-12 01:12:34 +00:00
|
|
|
|
|
|
|
/** Similar to ReadBufferFromFileDescriptor but it is using 'pread' allowing multiple concurrent reads from the same fd.
|
|
|
|
*/
|
|
|
|
class ReadBufferFromFileDescriptorPRead : public ReadBufferFromFileDescriptor
|
|
|
|
{
|
|
|
|
public:
|
2022-03-13 11:59:20 +00:00
|
|
|
explicit ReadBufferFromFileDescriptorPRead(
|
2022-01-03 16:05:46 +00:00
|
|
|
int fd_,
|
|
|
|
size_t buf_size = DBMS_DEFAULT_BUFFER_SIZE,
|
|
|
|
char * existing_memory = nullptr,
|
|
|
|
size_t alignment = 0,
|
2023-03-30 17:02:28 +00:00
|
|
|
std::optional<size_t> file_size_ = std::nullopt,
|
|
|
|
ThrottlerPtr throttler_ = {})
|
|
|
|
: ReadBufferFromFileDescriptor(fd_, buf_size, existing_memory, alignment, file_size_, throttler_)
|
2021-07-12 01:12:34 +00:00
|
|
|
{
|
|
|
|
use_pread = true;
|
|
|
|
}
|
|
|
|
};
|
|
|
|
|
2011-10-24 12:10:59 +00:00
|
|
|
}
|