ClickHouse/src/Functions/visibleWidth.cpp

85 lines
2.5 KiB
C++
Raw Normal View History

2021-05-17 07:30:42 +00:00
#include <Functions/IFunction.h>
#include <Functions/FunctionFactory.h>
#include <DataTypes/DataTypesNumber.h>
#include <Formats/FormatSettings.h>
#include <Columns/ColumnsNumber.h>
#include <IO/WriteBufferFromString.h>
#include <Common/UTF8Helpers.h>
#include <Common/assert_cast.h>
namespace DB
{
/** visibleWidth(x) - calculates the approximate width when outputting the value in a text form to the console.
* In fact it calculate the number of Unicode code points.
* It does not support zero width and full width characters, combining characters, etc.
*/
class FunctionVisibleWidth : public IFunction
{
public:
static constexpr auto name = "visibleWidth";
2021-06-01 12:20:52 +00:00
static FunctionPtr create(ContextPtr)
{
return std::make_shared<FunctionVisibleWidth>();
}
bool useDefaultImplementationForNulls() const override { return false; }
2019-10-02 17:51:00 +00:00
ColumnNumbers getArgumentsThatDontImplyNullableReturnType(size_t /*number_of_arguments*/) const override { return {0}; }
2021-06-22 16:21:23 +00:00
bool isSuitableForShortCircuitArgumentsExecution(const DataTypesWithConstInfo & /*arguments*/) const override { return true; }
/// Get the name of the function.
String getName() const override
{
return name;
}
size_t getNumberOfArguments() const override
{
return 1;
}
DataTypePtr getReturnTypeImpl(const DataTypes & /*arguments*/) const override
{
return std::make_shared<DataTypeUInt64>();
}
bool useDefaultImplementationForConstants() const override { return true; }
2020-10-14 14:04:50 +00:00
/// Execute the function on the columns.
ColumnPtr executeImpl(const ColumnsWithTypeAndName & arguments, const DataTypePtr &, size_t input_rows_count) const override
{
2020-11-19 07:14:23 +00:00
const auto & src = arguments[0];
size_t size = input_rows_count;
auto res_col = ColumnUInt64::create(size);
auto & res_data = assert_cast<ColumnUInt64 &>(*res_col).getData();
/// For simplicity reasons, function is implemented by serializing into temporary buffer.
String tmp;
FormatSettings format_settings;
2021-03-13 18:05:18 +00:00
auto serialization = src.type->getDefaultSerialization();
for (size_t i = 0; i < size; ++i)
{
{
WriteBufferFromString out(tmp);
2021-03-13 18:05:18 +00:00
serialization->serializeText(*src.column, i, out, format_settings);
}
res_data[i] = UTF8::countCodePoints(reinterpret_cast<const UInt8 *>(tmp.data()), tmp.size());
}
2020-10-19 15:27:41 +00:00
return res_col;
}
};
REGISTER_FUNCTION(VisibleWidth)
{
factory.registerFunction<FunctionVisibleWidth>();
}
}