#pragma once #include #include #include #include #include #include #include #include #include #include #include namespace DB { using BlockPtr = std::shared_ptr; class ComplexKeyHashedDictionary final : public IDictionaryBase { public: ComplexKeyHashedDictionary( const std::string & name, const DictionaryStructure & dict_struct, DictionarySourcePtr source_ptr, const DictionaryLifetime dict_lifetime, bool require_nonempty, BlockPtr saved_block = nullptr); ComplexKeyHashedDictionary(const ComplexKeyHashedDictionary & other); std::string getKeyDescription() const { return key_description; }; std::exception_ptr getCreationException() const override { return creation_exception; } std::string getName() const override { return name; } std::string getTypeName() const override { return "ComplexKeyHashed"; } size_t getBytesAllocated() const override { return bytes_allocated; } size_t getQueryCount() const override { return query_count.load(std::memory_order_relaxed); } double getHitRate() const override { return 1.0; } size_t getElementCount() const override { return element_count; } double getLoadFactor() const override { return static_cast(element_count) / bucket_count; } bool isCached() const override { return false; } std::unique_ptr clone() const override { return std::make_unique(*this); } const IDictionarySource * getSource() const override { return source_ptr.get(); } const DictionaryLifetime & getLifetime() const override { return dict_lifetime; } const DictionaryStructure & getStructure() const override { return dict_struct; } std::chrono::time_point getCreationTime() const override { return creation_time; } bool isInjective(const std::string & attribute_name) const override { return dict_struct.attributes[&getAttribute(attribute_name) - attributes.data()].injective; } #define DECLARE(TYPE)\ void get##TYPE(\ const std::string & attribute_name, const Columns & key_columns, const DataTypes & key_types,\ PaddedPODArray & out) const; DECLARE(UInt8) DECLARE(UInt16) DECLARE(UInt32) DECLARE(UInt64) DECLARE(UInt128) DECLARE(Int8) DECLARE(Int16) DECLARE(Int32) DECLARE(Int64) DECLARE(Float32) DECLARE(Float64) #undef DECLARE void getString( const std::string & attribute_name, const Columns & key_columns, const DataTypes & key_types, ColumnString * out) const; #define DECLARE(TYPE)\ void get##TYPE(\ const std::string & attribute_name, const Columns & key_columns, const DataTypes & key_types,\ const PaddedPODArray & def, PaddedPODArray & out) const; DECLARE(UInt8) DECLARE(UInt16) DECLARE(UInt32) DECLARE(UInt64) DECLARE(UInt128) DECLARE(Int8) DECLARE(Int16) DECLARE(Int32) DECLARE(Int64) DECLARE(Float32) DECLARE(Float64) #undef DECLARE void getString( const std::string & attribute_name, const Columns & key_columns, const DataTypes & key_types, const ColumnString * const def, ColumnString * const out) const; #define DECLARE(TYPE)\ void get##TYPE(\ const std::string & attribute_name, const Columns & key_columns, const DataTypes & key_types,\ const TYPE def, PaddedPODArray & out) const; DECLARE(UInt8) DECLARE(UInt16) DECLARE(UInt32) DECLARE(UInt64) DECLARE(UInt128) DECLARE(Int8) DECLARE(Int16) DECLARE(Int32) DECLARE(Int64) DECLARE(Float32) DECLARE(Float64) #undef DECLARE void getString( const std::string & attribute_name, const Columns & key_columns, const DataTypes & key_types, const String & def, ColumnString * const out) const; void has(const Columns & key_columns, const DataTypes & key_types, PaddedPODArray & out) const; BlockInputStreamPtr getBlockInputStream(const Names & column_names, size_t max_block_size) const override; private: template using ContainerType = HashMapWithSavedHash; template using ContainerPtrType = std::unique_ptr>; struct Attribute final { AttributeUnderlyingType type; std::tuple< UInt8, UInt16, UInt32, UInt64, UInt128, Int8, Int16, Int32, Int64, Float32, Float64, String> null_values; std::tuple< ContainerPtrType, ContainerPtrType, ContainerPtrType, ContainerPtrType, ContainerPtrType, ContainerPtrType, ContainerPtrType, ContainerPtrType, ContainerPtrType, ContainerPtrType, ContainerPtrType, ContainerPtrType> maps; std::unique_ptr string_arena; }; void createAttributes(); void blockToAttributes(const Block & block); void updateData(); void loadData(); template void addAttributeSize(const Attribute & attribute); void calculateBytesAllocated(); template void createAttributeImpl(Attribute & attribute, const Field & null_value); Attribute createAttributeWithType(const AttributeUnderlyingType type, const Field & null_value); template void getItemsNumber( const Attribute & attribute, const Columns & key_columns, ValueSetter && set_value, DefaultGetter && get_default) const; template void getItemsImpl( const Attribute & attribute, const Columns & key_columns, ValueSetter && set_value, DefaultGetter && get_default) const; template bool setAttributeValueImpl(Attribute & attribute, const StringRef key, const T value); bool setAttributeValue(Attribute & attribute, const StringRef key, const Field & value); const Attribute & getAttribute(const std::string & attribute_name) const; static StringRef placeKeysInPool( const size_t row, const Columns & key_columns, StringRefs & keys, Arena & pool); template void has(const Attribute & attribute, const Columns & key_columns, PaddedPODArray & out) const; std::vector getKeys() const; template std::vector getKeys(const Attribute & attribute) const; const std::string name; const DictionaryStructure dict_struct; const DictionarySourcePtr source_ptr; const DictionaryLifetime dict_lifetime; const bool require_nonempty; const std::string key_description{dict_struct.getKeyDescription()}; std::map attribute_index_by_name; std::vector attributes; Arena keys_pool; size_t bytes_allocated = 0; size_t element_count = 0; size_t bucket_count = 0; mutable std::atomic query_count{0}; std::chrono::time_point creation_time; std::exception_ptr creation_exception; BlockPtr saved_block; }; }