#pragma once #include #include #include #include #include #include #include #include #include namespace DB { class RangeHashedDictionary final : public IDictionaryBase { public: RangeHashedDictionary( const std::string & name, const DictionaryStructure & dict_struct, DictionarySourcePtr source_ptr, const DictionaryLifetime dict_lifetime, bool require_nonempty); RangeHashedDictionary(const RangeHashedDictionary & other); std::exception_ptr getCreationException() const override { return creation_exception; } std::string getName() const override { return name; } std::string getTypeName() const override { return "RangeHashed"; } size_t getBytesAllocated() const override { return bytes_allocated; } size_t getQueryCount() const override { return query_count.load(std::memory_order_relaxed); } double getHitRate() const override { return 1.0; } size_t getElementCount() const override { return element_count; } double getLoadFactor() const override { return static_cast(element_count) / bucket_count; } bool isCached() const override { return false; } std::unique_ptr clone() const override { return std::make_unique(*this); } const IDictionarySource * getSource() const override { return source_ptr.get(); } const DictionaryLifetime & getLifetime() const override { return dict_lifetime; } const DictionaryStructure & getStructure() const override { return dict_struct; } std::chrono::time_point getCreationTime() const override { return creation_time; } bool isInjective(const std::string & attribute_name) const override { return dict_struct.attributes[&getAttribute(attribute_name) - attributes.data()].injective; } #define DECLARE_MULTIPLE_GETTER(TYPE)\ void get##TYPE(\ const std::string & attribute_name, const PaddedPODArray & ids, const PaddedPODArray & dates,\ PaddedPODArray & out) const; DECLARE_MULTIPLE_GETTER(UInt8) DECLARE_MULTIPLE_GETTER(UInt16) DECLARE_MULTIPLE_GETTER(UInt32) DECLARE_MULTIPLE_GETTER(UInt64) DECLARE_MULTIPLE_GETTER(UInt128) DECLARE_MULTIPLE_GETTER(Int8) DECLARE_MULTIPLE_GETTER(Int16) DECLARE_MULTIPLE_GETTER(Int32) DECLARE_MULTIPLE_GETTER(Int64) DECLARE_MULTIPLE_GETTER(Float32) DECLARE_MULTIPLE_GETTER(Float64) #undef DECLARE_MULTIPLE_GETTER void getString( const std::string & attribute_name, const PaddedPODArray & ids, const PaddedPODArray & dates, ColumnString * out) const; BlockInputStreamPtr getBlockInputStream(const Names & column_names, size_t max_block_size) const override; struct Range : std::pair { using std::pair::pair; static bool isCorrectDate(const UInt16 date) { return 0 < date && date <= DATE_LUT_MAX_DAY_NUM; } bool contains(const UInt16 date) const { const auto & left = first; const auto & right = second; if (left <= date && date <= right) return true; const auto has_left_bound = isCorrectDate(left); const auto has_right_bound = isCorrectDate(right); if ((!has_left_bound || left <= date) && (!has_right_bound || date <= right)) return true; return false; } }; private: template struct Value final { Range range; T value; }; template using Values = std::vector>; template using Collection = HashMap>; template using Ptr = std::unique_ptr>; struct Attribute final { public: AttributeUnderlyingType type; std::tuple null_values; std::tuple, Ptr, Ptr, Ptr, Ptr, Ptr, Ptr, Ptr, Ptr, Ptr, Ptr, Ptr> maps; std::unique_ptr string_arena; }; void createAttributes(); void loadData(); template void addAttributeSize(const Attribute & attribute); void calculateBytesAllocated(); template void createAttributeImpl(Attribute & attribute, const Field & null_value); Attribute createAttributeWithType(const AttributeUnderlyingType type, const Field & null_value); template void getItems( const Attribute & attribute, const PaddedPODArray & ids, const PaddedPODArray & dates, PaddedPODArray & out) const; template void getItemsImpl( const Attribute & attribute, const PaddedPODArray & ids, const PaddedPODArray & dates, PaddedPODArray & out) const; template void setAttributeValueImpl(Attribute & attribute, const Key id, const Range & range, const T value); void setAttributeValue(Attribute & attribute, const Key id, const Range & range, const Field & value); const Attribute & getAttribute(const std::string & attribute_name) const; const Attribute & getAttributeWithType(const std::string & name, const AttributeUnderlyingType type) const; void getIdsAndDates(PaddedPODArray & ids, PaddedPODArray & start_dates, PaddedPODArray & end_dates) const; template void getIdsAndDates(const Attribute & attribute, PaddedPODArray & ids, PaddedPODArray & start_dates, PaddedPODArray & end_dates) const; const std::string name; const DictionaryStructure dict_struct; const DictionarySourcePtr source_ptr; const DictionaryLifetime dict_lifetime; const bool require_nonempty; std::map attribute_index_by_name; std::vector attributes; size_t bytes_allocated = 0; size_t element_count = 0; size_t bucket_count = 0; mutable std::atomic query_count{0}; std::chrono::time_point creation_time; std::exception_ptr creation_exception; }; }