mirror of
https://github.com/ClickHouse/ClickHouse.git
synced 2024-12-12 09:22:05 +00:00
3f57fc085b
Also remove it from some visitors.
126 lines
4.8 KiB
C++
126 lines
4.8 KiB
C++
#include <memory>
|
|
#include <Columns/ColumnString.h>
|
|
#include <DataStreams/materializeBlock.h>
|
|
#include <DataTypes/DataTypeString.h>
|
|
#include <Formats/FormatFactory.h>
|
|
#include <Functions/FunctionFactory.h>
|
|
#include <Functions/FunctionHelpers.h>
|
|
#include <Functions/IFunction.h>
|
|
#include <IO/WriteBufferFromVector.h>
|
|
#include <IO/WriteHelpers.h>
|
|
#include <Processors/Formats/IOutputFormat.h>
|
|
#include <ext/map.h>
|
|
|
|
|
|
namespace DB
|
|
{
|
|
namespace ErrorCodes
|
|
{
|
|
extern const int ILLEGAL_TYPE_OF_ARGUMENT;
|
|
extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH;
|
|
extern const int UNKNOWN_FORMAT;
|
|
}
|
|
|
|
namespace
|
|
{
|
|
|
|
/** formatRow(<format>, x, y, ...) is a function that allows you to use RowOutputFormat over
|
|
* several columns to generate a string per row, such as CSV, TSV, JSONEachRow, etc.
|
|
* formatRowNoNewline(...) trims the newline character of each row.
|
|
*/
|
|
|
|
template <bool no_newline>
|
|
class FunctionFormatRow : public IFunction
|
|
{
|
|
public:
|
|
static constexpr auto name = no_newline ? "formatRowNoNewline" : "formatRow";
|
|
|
|
FunctionFormatRow(const String & format_name_, ContextConstPtr context_) : format_name(format_name_), context(context_)
|
|
{
|
|
if (!FormatFactory::instance().getAllFormats().count(format_name))
|
|
throw Exception("Unknown format " + format_name, ErrorCodes::UNKNOWN_FORMAT);
|
|
}
|
|
|
|
String getName() const override { return name; }
|
|
size_t getNumberOfArguments() const override { return 0; }
|
|
bool useDefaultImplementationForNulls() const override { return false; }
|
|
bool useDefaultImplementationForConstants() const override { return true; }
|
|
ColumnNumbers getArgumentsThatAreAlwaysConstant() const override { return {0}; }
|
|
|
|
ColumnPtr executeImpl(const ColumnsWithTypeAndName & arguments, const DataTypePtr &, size_t input_rows_count) const override
|
|
{
|
|
auto col_str = ColumnString::create();
|
|
ColumnString::Chars & vec = col_str->getChars();
|
|
WriteBufferFromVector buffer(vec);
|
|
ColumnString::Offsets & offsets = col_str->getOffsets();
|
|
offsets.resize(input_rows_count);
|
|
Block arg_columns;
|
|
for (auto i = 1u; i < arguments.size(); ++i)
|
|
arg_columns.insert(arguments[i]);
|
|
materializeBlockInplace(arg_columns);
|
|
auto out = FormatFactory::instance().getOutputFormat(format_name, buffer, arg_columns, context, [&](const Columns &, size_t row)
|
|
{
|
|
if constexpr (no_newline)
|
|
{
|
|
// replace '\n' with '\0'
|
|
if (buffer.position() != buffer.buffer().begin() && buffer.position()[-1] == '\n')
|
|
buffer.position()[-1] = '\0';
|
|
}
|
|
else
|
|
writeChar('\0', buffer);
|
|
offsets[row] = buffer.count();
|
|
});
|
|
out->write(arg_columns);
|
|
return col_str;
|
|
}
|
|
|
|
private:
|
|
String format_name;
|
|
ContextConstPtr context;
|
|
};
|
|
|
|
template <bool no_newline>
|
|
class FormatRowOverloadResolver : public IFunctionOverloadResolver
|
|
{
|
|
public:
|
|
static constexpr auto name = no_newline ? "formatRowNoNewline" : "formatRow";
|
|
static FunctionOverloadResolverPtr create(ContextConstPtr context) { return std::make_unique<FormatRowOverloadResolver>(context); }
|
|
explicit FormatRowOverloadResolver(ContextConstPtr context_) : context(context_) { }
|
|
String getName() const override { return name; }
|
|
bool isVariadic() const override { return true; }
|
|
size_t getNumberOfArguments() const override { return 0; }
|
|
ColumnNumbers getArgumentsThatAreAlwaysConstant() const override { return {0}; }
|
|
bool useDefaultImplementationForNulls() const override { return false; }
|
|
|
|
FunctionBasePtr buildImpl(const ColumnsWithTypeAndName & arguments, const DataTypePtr & return_type) const override
|
|
{
|
|
if (arguments.size() < 2)
|
|
throw Exception(
|
|
"Function " + getName() + " requires at least two arguments: the format name and its output expression(s)",
|
|
ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH);
|
|
|
|
if (const auto * name_col = checkAndGetColumnConst<ColumnString>(arguments.at(0).column.get()))
|
|
return std::make_unique<FunctionToFunctionBaseAdaptor>(
|
|
std::make_shared<FunctionFormatRow<no_newline>>(name_col->getValue<String>(), context),
|
|
ext::map<DataTypes>(arguments, [](const auto & elem) { return elem.type; }),
|
|
return_type);
|
|
else
|
|
throw Exception("First argument to " + getName() + " must be a format name", ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT);
|
|
}
|
|
|
|
DataTypePtr getReturnTypeImpl(const DataTypes &) const override { return std::make_shared<DataTypeString>(); }
|
|
|
|
private:
|
|
ContextConstPtr context;
|
|
};
|
|
|
|
}
|
|
|
|
void registerFunctionFormatRow(FunctionFactory & factory)
|
|
{
|
|
factory.registerFunction<FormatRowOverloadResolver<true>>();
|
|
factory.registerFunction<FormatRowOverloadResolver<false>>();
|
|
}
|
|
|
|
}
|