mirror of
https://github.com/ClickHouse/ClickHouse.git
synced 2024-12-15 02:41:59 +00:00
dbb4f8216f
Conflicts: - src/Functions/GregorianDate.h
423 lines
12 KiB
C++
423 lines
12 KiB
C++
#pragma once
|
|
|
|
#include <base/extended_types.h>
|
|
#include <Common/Exception.h>
|
|
#include <Core/Types.h>
|
|
#include <IO/ReadBuffer.h>
|
|
#include <IO/ReadHelpers.h>
|
|
#include <IO/WriteBufferFromString.h>
|
|
#include <IO/WriteHelpers.h>
|
|
|
|
#include <cstdint>
|
|
|
|
|
|
namespace DB
|
|
{
|
|
namespace ErrorCodes
|
|
{
|
|
extern const int CANNOT_PARSE_INPUT_ASSERTION_FAILED;
|
|
extern const int CANNOT_PARSE_DATE;
|
|
extern const int CANNOT_FORMAT_DATETIME;
|
|
extern const int LOGICAL_ERROR;
|
|
}
|
|
|
|
/** Proleptic Gregorian calendar date. YearT is an integral type
|
|
* which should be at least 32 bits wide, and should preferably
|
|
* be signed.
|
|
*/
|
|
template <typename YearT = int32_t>
|
|
class GregorianDate
|
|
{
|
|
public:
|
|
/** Construct from date in text form 'YYYY-MM-DD' by reading from
|
|
* ReadBuffer.
|
|
*/
|
|
explicit GregorianDate(ReadBuffer & in);
|
|
|
|
/** Construct from Modified Julian Day. The type T is an
|
|
* integral type which should be at least 32 bits wide, and
|
|
* should preferably signed.
|
|
*/
|
|
explicit GregorianDate(is_integer auto modified_julian_day);
|
|
|
|
/** Convert to Modified Julian Day. The type T is an integral type
|
|
* which should be at least 32 bits wide, and should preferably
|
|
* signed.
|
|
*/
|
|
template <is_integer T>
|
|
T toModifiedJulianDay() const;
|
|
|
|
/** Write the date in text form 'YYYY-MM-DD' to a buffer.
|
|
*/
|
|
void write(WriteBuffer & buf) const;
|
|
|
|
/** Convert to a string in text form 'YYYY-MM-DD'.
|
|
*/
|
|
std::string toString() const;
|
|
|
|
YearT year() const noexcept
|
|
{
|
|
return year_;
|
|
}
|
|
|
|
uint8_t month() const noexcept
|
|
{
|
|
return month_;
|
|
}
|
|
|
|
uint8_t day_of_month() const noexcept /// NOLINT
|
|
{
|
|
return day_of_month_;
|
|
}
|
|
|
|
private:
|
|
YearT year_; /// NOLINT
|
|
uint8_t month_; /// NOLINT
|
|
uint8_t day_of_month_; /// NOLINT
|
|
};
|
|
|
|
/** ISO 8601 Ordinal Date. YearT is an integral type which should
|
|
* be at least 32 bits wide, and should preferably signed.
|
|
*/
|
|
template <typename YearT = int32_t>
|
|
class OrdinalDate
|
|
{
|
|
public:
|
|
OrdinalDate(YearT year, uint16_t day_of_year);
|
|
|
|
/** Construct from Modified Julian Day. The type T is an
|
|
* integral type which should be at least 32 bits wide, and
|
|
* should preferably signed.
|
|
*/
|
|
template <is_integer DayT>
|
|
explicit OrdinalDate(DayT modified_julian_day);
|
|
|
|
/** Convert to Modified Julian Day. The type T is an integral
|
|
* type which should be at least 32 bits wide, and should
|
|
* preferably be signed.
|
|
*/
|
|
template <is_integer T>
|
|
T toModifiedJulianDay() const noexcept;
|
|
|
|
YearT year() const noexcept
|
|
{
|
|
return year_;
|
|
}
|
|
|
|
uint16_t dayOfYear() const noexcept
|
|
{
|
|
return day_of_year_;
|
|
}
|
|
|
|
private:
|
|
YearT year_; /// NOLINT
|
|
uint16_t day_of_year_; /// NOLINT
|
|
};
|
|
|
|
/** A (month, day of month) pair that can be converted to and from a day of year,
  * in both the Gregorian and the Julian calendars.
  */
class MonthDay
{
public:
    /// Build the pair directly from a month and a day of that month.
    MonthDay(uint8_t month, uint8_t day_of_month);

    /// Build the pair from a day of year; whether the year is a leap year
    /// decides how the days are distributed over the months.
    MonthDay(bool is_leap_year, uint16_t day_of_year);

    /// Convert the pair back to a day of year, for a leap or a non-leap year.
    uint16_t dayOfYear(bool is_leap_year) const;

    /// Plain accessors for the stored components.
    uint8_t month() const noexcept { return month_; }
    uint8_t day_of_month() const noexcept { return day_of_month_; } /// NOLINT

private:
    uint8_t month_; /// NOLINT
    uint8_t day_of_month_; /// NOLINT
};
|
|
}
|
|
|
|
/* Implementation */
|
|
|
|
namespace gd
|
|
{
|
|
using namespace DB;
|
|
|
|
/// Tell whether `year` is a leap year under the Gregorian rule:
/// divisible by 4, except for centuries that are not divisible by 400.
template <typename YearT>
static inline constexpr bool is_leap_year(YearT year)
{
    if (year % 4 != 0)
        return false;

    return year % 400 == 0 || year % 100 != 0;
}
|
|
|
|
/// Number of days in the given month (1 = January ... 12 = December).
/// Any other month number is treated as a fatal error and terminates the program.
static inline constexpr uint8_t monthLength(bool is_leap_year, uint8_t month)
{
    switch (month)
    {
        case 2:
            return is_leap_year ? 29 : 28;

        case 4:
        case 6:
        case 9:
        case 11:
            return 30;

        case 1:
        case 3:
        case 5:
        case 7:
        case 8:
        case 10:
        case 12:
            return 31;

        default:
            std::terminate();
    }
}
|
|
|
|
/** Integer division rounded toward negative infinity (floor division).
  * The divisor is first converted to the type of the dividend, which is
  * also the type of the result.
  */
template <typename I, typename J>
static inline constexpr I div(I x, J y)
{
    const I divisor = static_cast<I>(y);

    const bool positive_by_negative = x > 0 && divisor < 0;
    const bool negative_by_positive = x < 0 && divisor > 0;

    /// When the signs differ the built-in division rounds toward zero, so move
    /// the dividend one step toward zero and subtract one from the quotient.
    if (positive_by_negative)
        return ((x - 1) / divisor) - 1;

    if (negative_by_positive)
        return ((x + 1) / divisor) - 1;

    return x / divisor;
}
|
|
|
|
/** Integer modulus that pairs with div(): div(x, y) * y + mod(x, y) == x.
  * The divisor is first converted to the type of the dividend, which is
  * also the type of the result.
  */
template <typename I, typename J>
static inline constexpr I mod(I x, J y)
{
    const I divisor = static_cast<I>(y);
    const auto remainder = x % divisor;

    const bool signs_differ = (x > 0 && divisor < 0) || (x < 0 && divisor > 0);
    if (!signs_differ)
        return remainder;

    /// With operands of different signs a non-zero built-in remainder has the
    /// sign of the dividend; shift it by the divisor to match floor division.
    return remainder == 0 ? static_cast<I>(0) : remainder + divisor;
}
|
|
|
|
/** Minimum of two values whose types may differ, in the spirit of std::min().
  * The second operand is converted to the type of the first one, which is
  * also the type of the result.
  */
template <typename I, typename J>
static inline constexpr I min(I x, J y)
{
    const I rhs = static_cast<I>(y);

    if (x < rhs)
        return x;

    return rhs;
}
|
|
|
|
/// Read one character from the buffer and return its value as a decimal digit (0..9).
/// Throws CANNOT_PARSE_INPUT_ASSERTION_FAILED if no character could be read
/// or if the character is not a decimal digit.
static inline char readDigit(ReadBuffer & in)
{
    char symbol;
    const bool got_symbol = in.read(symbol);

    if (!got_symbol)
        throw Exception(
            "Cannot parse input: expected a digit at the end of stream",
            ErrorCodes::CANNOT_PARSE_INPUT_ASSERTION_FAILED);

    const bool is_decimal_digit = symbol >= '0' && symbol <= '9';
    if (!is_decimal_digit)
        throw Exception(
            "Cannot read input: expected a digit but got something else",
            ErrorCodes::CANNOT_PARSE_INPUT_ASSERTION_FAILED);

    return symbol - '0';
}
|
|
}
|
|
|
|
namespace DB
|
|
{
|
|
template <typename YearT>
|
|
GregorianDate<YearT>::GregorianDate(ReadBuffer & in)
|
|
{
|
|
year_ = gd::readDigit(in) * 1000
|
|
+ gd::readDigit(in) * 100
|
|
+ gd::readDigit(in) * 10
|
|
+ gd::readDigit(in);
|
|
|
|
assertChar('-', in);
|
|
|
|
month_ = gd::readDigit(in) * 10
|
|
+ gd::readDigit(in);
|
|
|
|
assertChar('-', in);
|
|
|
|
day_of_month_ = gd::readDigit(in) * 10
|
|
+ gd::readDigit(in);
|
|
|
|
assertEOF(in);
|
|
|
|
if (month_ < 1 || month_ > 12 || day_of_month_ < 1 || day_of_month_ > gd::monthLength(gd::is_leap_year(year_), month_))
|
|
throw Exception("Invalid date: " + toString(), ErrorCodes::CANNOT_PARSE_DATE);
|
|
}
|
|
|
|
template <typename YearT>
|
|
GregorianDate<YearT>::GregorianDate(is_integer auto modified_julian_day)
|
|
{
|
|
const OrdinalDate<YearT> ord(modified_julian_day);
|
|
const MonthDay md(gd::is_leap_year(ord.year()), ord.dayOfYear());
|
|
year_ = ord.year();
|
|
month_ = md.month();
|
|
day_of_month_ = md.day_of_month();
|
|
}
|
|
|
|
template <typename YearT>
|
|
template <is_integer T>
|
|
T GregorianDate<YearT>::toModifiedJulianDay() const
|
|
{
|
|
const MonthDay md(month_, day_of_month_);
|
|
const auto day_of_year = md.dayOfYear(gd::is_leap_year(year_));
|
|
const OrdinalDate<YearT> ord(year_, day_of_year);
|
|
return ord.template toModifiedJulianDay<T>();
|
|
}
|
|
|
|
template <typename YearT>
|
|
void GregorianDate<YearT>::write(WriteBuffer & buf) const
|
|
{
|
|
if (year_ < 0 || year_ > 9999)
|
|
{
|
|
throw Exception(
|
|
"Impossible to stringify: year too big or small: " + DB::toString(year_),
|
|
ErrorCodes::CANNOT_FORMAT_DATETIME);
|
|
}
|
|
else
|
|
{
|
|
auto y = year_;
|
|
writeChar('0' + y / 1000, buf); y %= 1000;
|
|
writeChar('0' + y / 100, buf); y %= 100;
|
|
writeChar('0' + y / 10, buf); y %= 10;
|
|
writeChar('0' + y , buf);
|
|
|
|
writeChar('-', buf);
|
|
|
|
auto m = month_;
|
|
writeChar('0' + m / 10, buf); m %= 10;
|
|
writeChar('0' + m , buf);
|
|
|
|
writeChar('-', buf);
|
|
|
|
auto d = day_of_month_;
|
|
writeChar('0' + d / 10, buf); d %= 10;
|
|
writeChar('0' + d , buf);
|
|
}
|
|
}
|
|
|
|
template <typename YearT>
|
|
std::string GregorianDate<YearT>::toString() const
|
|
{
|
|
WriteBufferFromOwnString buf;
|
|
write(buf);
|
|
return buf.str();
|
|
}
|
|
|
|
template <typename YearT>
|
|
OrdinalDate<YearT>::OrdinalDate(YearT year, uint16_t day_of_year)
|
|
: year_(year)
|
|
, day_of_year_(day_of_year)
|
|
{
|
|
if (day_of_year < 1 || day_of_year > (gd::is_leap_year(year) ? 366 : 365))
|
|
{
|
|
throw Exception(
|
|
"Invalid ordinal date: " + toString(year) + "-" + toString(day_of_year),
|
|
ErrorCodes::LOGICAL_ERROR);
|
|
}
|
|
}
|
|
|
|
template <typename YearT>
|
|
template <is_integer DayT>
|
|
OrdinalDate<YearT>::OrdinalDate(DayT modified_julian_day)
|
|
{
|
|
/// This function supports day number from -678941 to 2973119 (which represent 0000-01-01 and 9999-12-31 respectively).
|
|
|
|
if constexpr (is_signed_v<DayT> && std::numeric_limits<DayT>::lowest() < -678941)
|
|
if (modified_julian_day < -678941)
|
|
throw Exception(
|
|
ErrorCodes::CANNOT_FORMAT_DATETIME,
|
|
"Value cannot be represented as date because it's out of range");
|
|
|
|
if constexpr (std::numeric_limits<DayT>::max() > 2973119)
|
|
if (modified_julian_day > 2973119)
|
|
throw Exception(
|
|
ErrorCodes::CANNOT_FORMAT_DATETIME,
|
|
"Value cannot be represented as date because it's out of range");
|
|
|
|
const auto a = modified_julian_day + 678575;
|
|
const auto quad_cent = gd::div(a, 146097);
|
|
const auto b = gd::mod(a, 146097);
|
|
const auto cent = gd::min(gd::div(b, 36524), 3);
|
|
const auto c = b - cent * 36524;
|
|
const auto quad = gd::div(c, 1461);
|
|
const auto d = gd::mod(c, 1461);
|
|
const auto y = gd::min(gd::div(d, 365), 3);
|
|
|
|
day_of_year_ = d - y * 365 + 1;
|
|
year_ = static_cast<YearT>(quad_cent * 400 + cent * 100 + quad * 4 + y + 1);
|
|
}
|
|
|
|
template <typename YearT>
|
|
template <is_integer T>
|
|
T OrdinalDate<YearT>::toModifiedJulianDay() const noexcept
|
|
{
|
|
const auto y = year_ - 1;
|
|
return day_of_year_
|
|
+ 365 * y
|
|
+ gd::div(y, 4)
|
|
- gd::div(y, 100)
|
|
+ gd::div(y, 400)
|
|
- 678576;
|
|
}
|
|
|
|
/// Build the pair from a month and a day of month.
/// A month outside of 1..12 throws LOGICAL_ERROR.
inline MonthDay::MonthDay(uint8_t month, uint8_t day_of_month)
    : month_(month)
    , day_of_month_(day_of_month)
{
    const bool month_is_valid = month >= 1 && month <= 12;
    if (!month_is_valid)
        throw Exception(
            "Invalid month: " + DB::toString(month),
            ErrorCodes::LOGICAL_ERROR);

    /// The day of month cannot be validated here: whether the year is
    /// a leap year is not known yet.
}
|
|
|
|
/// Build the pair from a day of year.
/// The day must be within 1..365, or 1..366 for a leap year;
/// otherwise LOGICAL_ERROR is thrown.
inline MonthDay::MonthDay(bool is_leap_year, uint16_t day_of_year)
{
    const int days_in_year = is_leap_year ? 366 : 365;
    const bool day_is_valid = day_of_year >= 1 && day_of_year <= days_in_year;
    if (!day_is_valid)
        throw Exception(
            std::string("Invalid day of year: ") +
            (is_leap_year ? "leap, " : "non-leap, ") + DB::toString(day_of_year),
            ErrorCodes::LOGICAL_ERROR);

    /// Walk through the months from January, subtracting the length of every
    /// month that ends before the requested day.
    uint8_t current_month = 1;
    uint16_t remaining_days = day_of_year;
    while (remaining_days > gd::monthLength(is_leap_year, current_month))
    {
        remaining_days -= gd::monthLength(is_leap_year, current_month);
        ++current_month;
    }

    month_ = current_month;
    day_of_month_ = remaining_days;
}
|
|
|
|
inline uint16_t MonthDay::dayOfYear(bool is_leap_year) const
|
|
{
|
|
if (day_of_month_ < 1 || day_of_month_ > gd::monthLength(is_leap_year, month_))
|
|
{
|
|
throw Exception(
|
|
std::string("Invalid day of month: ") +
|
|
(is_leap_year ? "leap, " : "non-leap, ") + DB::toString(month_) +
|
|
"-" + DB::toString(day_of_month_),
|
|
ErrorCodes::LOGICAL_ERROR);
|
|
}
|
|
const auto k = month_ <= 2 ? 0 : is_leap_year ? -1 :-2;
|
|
return (367 * month_ - 362) / 12 + k + day_of_month_;
|
|
}
|
|
}
|