ClickHouse/dbms/Common/HashTable/TwoLevelStringHashTable.h

#pragma once

#include <Common/HashTable/StringHashTable.h>

/** Two-level string hash table: an array of NUM_BUCKETS independent `ImplTable` instances.
  *
  * Every key is routed to exactly one bucket, selected from bits of its hash value
  * (see getBucketFromHash). Inside the bucket, the key goes to one of the sub-tables
  * m0 / m1 / m2 / m3 / ms of the implementation table depending on the key length
  * (see dispatch).
  *
  * Template parameters:
  *   SubMaps         - forwarded to the default ImplTable (StringHashTable<SubMaps>).
  *   ImplTable       - the per-bucket table type; must expose sub-tables m0, m1, m2, m3, ms
  *                     and the nested EmplaceCallable / FindCallable types used below.
  *   BITS_FOR_BUCKET - log2 of the number of buckets.
  */
template <typename SubMaps, typename ImplTable = StringHashTable<SubMaps>, size_t BITS_FOR_BUCKET = 8>
class TwoLevelStringHashTable : private boost::noncopyable
{
protected:
    using HashValue = size_t;
    using Self = TwoLevelStringHashTable;

public:
    using Key = StringRef;
    using Impl = ImplTable;

    static constexpr size_t NUM_BUCKETS = 1ULL << BITS_FOR_BUCKET;
    static constexpr size_t MAX_BUCKET = NUM_BUCKETS - 1;

    /// getBucketFromHash shifts by (32 - BITS_FOR_BUCKET); a larger value would make that shift count negative.
    static_assert(BITS_FOR_BUCKET <= 32, "BITS_FOR_BUCKET must not exceed 32");

    // TODO: currently hashing contains redundant computations when doing distributed or external aggregations
    /// Returns the hash value that dispatch() computes for the key `x` (0 for the empty key).
    /// No sub-table is modified: the callback only passes the hash value through.
    size_t hash(const Key & x) const
    {
        return dispatch(*this, x, [](const auto &, const auto &, size_t hash_value) { return hash_value; });
    }

    /// Functor form of hash().
    size_t operator()(const Key & x) const { return hash(x); }

    /// Bucket number of a hash value: the BITS_FOR_BUCKET bits located directly below bit 32.
    /// NOTE Bad for hash tables with more than 2^32 cells.
    static size_t getBucketFromHash(size_t hash_value) { return (hash_value >> (32 - BITS_FOR_BUCKET)) & MAX_BUCKET; }

    using key_type = typename Impl::key_type;
    using mapped_type = typename Impl::mapped_type;
    using value_type = typename Impl::value_type;
    using cell_type = typename Impl::cell_type;

    using LookupResult = typename Impl::LookupResult;
    using ConstLookupResult = typename Impl::ConstLookupResult;

    /// The buckets. Indexed by the result of getBucketFromHash.
    Impl impls[NUM_BUCKETS];

    TwoLevelStringHashTable() {}

    /// Builds the two-level table from a table `src` that has the sub-tables m0, m1, m2, m3 and ms.
    /// The zero (empty-key) value, if present, goes to bucket 0. Every other cell is placed into the
    /// bucket selected by the hash value that the cell reports via getHash().
    template <typename Source>
    TwoLevelStringHashTable(const Source & src)
    {
        if (src.m0.hasZero())
            impls[0].m0.setHasZero(*src.m0.zeroValue());

        for (auto & v : src.m1)
        {
            size_t hash_value = v.getHash(src.m1);
            size_t buck = getBucketFromHash(hash_value);
            impls[buck].m1.insertUniqueNonZero(&v, hash_value);
        }
        for (auto & v : src.m2)
        {
            size_t hash_value = v.getHash(src.m2);
            size_t buck = getBucketFromHash(hash_value);
            impls[buck].m2.insertUniqueNonZero(&v, hash_value);
        }
        for (auto & v : src.m3)
        {
            size_t hash_value = v.getHash(src.m3);
            size_t buck = getBucketFromHash(hash_value);
            impls[buck].m3.insertUniqueNonZero(&v, hash_value);
        }
        for (auto & v : src.ms)
        {
            size_t hash_value = v.getHash(src.ms);
            size_t buck = getBucketFromHash(hash_value);
            impls[buck].ms.insertUniqueNonZero(&v, hash_value);
        }
    }

    // This function is mostly the same as StringHashTable::dispatch, but with
    // added bucket computation. See the comments there.
    //
    // Selects the bucket and the sub-table for the key and returns
    // func(sub_table, key, hash_value):
    //   - empty key        -> impls[0].m0, VoidKey, hash value 0;
    //   - 1..8 bytes       -> m1 with the key packed into a StringKey8;
    //   - 9..16 bytes      -> m2 with the key packed into a StringKey16;
    //   - 17..24 bytes     -> m3 with the key packed into a StringKey24;
    //   - longer keys      -> ms with the key holder forwarded as is.
    // For every case except the last one keyHolderDiscardKey is called before func
    // (presumably because the packed copy makes the original key bytes unnecessary).
    template <typename Self, typename Func, typename KeyHolder>
    static auto ALWAYS_INLINE dispatch(Self & self, KeyHolder && key_holder, Func && func)
    {
        const StringRef & x = keyHolderGetKey(key_holder);
        const size_t sz = x.size;
        if (sz == 0)
        {
            keyHolderDiscardKey(key_holder);
            return func(self.impls[0].m0, VoidKey{}, 0);
        }

        const char * p = x.data;
        // pending bits that needs to be shifted out:
        // 8 * (number of bytes missing to pad the key length up to a multiple of 8)
        const char s = (-sz & 7) * 8;
        // The packed keys share storage with the raw 64-bit words that are filled below.
        union
        {
            StringKey8 k8;
            StringKey16 k16;
            StringKey24 k24;
            UInt64 n[3];
        };
        StringHashTableHash hash;
        // Number of the 8-byte word that holds the last byte of the key.
        switch ((sz - 1) >> 3)
        {
            case 0:
            {
                // first half page
                // NOTE(review): presumably with this address bit clear an 8-byte read starting at `p`
                // cannot run past the end of a 4 KiB page - confirm against StringHashTable::dispatch.
                if ((reinterpret_cast<uintptr_t>(p) & 2048) == 0)
                {
                    memcpy(&n[0], p, 8);
                    // Keep only the low (64 - s) bits, i.e. the bytes that belong to the key (little-endian layout).
                    // The mask is explicitly 64-bit: `unsigned long` may be only 32 bits wide,
                    // which would truncate the mask and make shifts by 32 or more undefined.
                    n[0] &= ~0ULL >> s;
                }
                else
                {
                    // Read the 8 bytes that end at the end of the key and shift out the bytes preceding the key.
                    const char * lp = x.data + x.size - 8;
                    memcpy(&n[0], lp, 8);
                    n[0] >>= s;
                }
                auto res = hash(k8);
                auto buck = getBucketFromHash(res);
                keyHolderDiscardKey(key_holder);
                return func(self.impls[buck].m1, k8, res);
            }
            case 1:
            {
                // First 8 bytes as is; the last 8 bytes of the key go to the second word,
                // with the part overlapping the first word shifted out.
                memcpy(&n[0], p, 8);
                const char * lp = x.data + x.size - 8;
                memcpy(&n[1], lp, 8);
                n[1] >>= s;
                auto res = hash(k16);
                auto buck = getBucketFromHash(res);
                keyHolderDiscardKey(key_holder);
                return func(self.impls[buck].m2, k16, res);
            }
            case 2:
            {
                // First 16 bytes as is; the last 8 bytes of the key go to the third word,
                // with the part overlapping the second word shifted out.
                memcpy(&n[0], p, 16);
                const char * lp = x.data + x.size - 8;
                memcpy(&n[2], lp, 8);
                n[2] >>= s;
                auto res = hash(k24);
                auto buck = getBucketFromHash(res);
                keyHolderDiscardKey(key_holder);
                return func(self.impls[buck].m3, k24, res);
            }
            default:
            {
                // Keys longer than 24 bytes are hashed as a StringRef; the key holder is passed on untouched.
                auto res = hash(x);
                auto buck = getBucketFromHash(res);
                return func(self.impls[buck].ms, std::forward<KeyHolder>(key_holder), res);
            }
        }
    }

    /// Runs Impl::EmplaceCallable{it, inserted} on the sub-table selected for the key.
    /// `it` and `inserted` are handed to that callable by reference and are expected to be filled by it.
    template <typename KeyHolder>
    void ALWAYS_INLINE emplace(KeyHolder && key_holder, LookupResult & it, bool & inserted)
    {
        dispatch(*this, key_holder, typename Impl::EmplaceCallable{it, inserted});
    }

    /// Runs Impl::FindCallable on the sub-table selected for the key `x` and returns its result.
    LookupResult ALWAYS_INLINE find(const Key x)
    {
        return dispatch(*this, x, typename Impl::FindCallable{});
    }

    /// Const overload of find().
    ConstLookupResult ALWAYS_INLINE find(const Key x) const
    {
        return dispatch(*this, x, typename Impl::FindCallable{});
    }

    /// Writes all buckets to `wb` one after another, in bucket order.
    void write(DB::WriteBuffer & wb) const
    {
        for (const auto & impl : impls)
            impl.write(wb);
    }

    /// Writes all buckets to `wb` in text form, in bucket order, separated by ','.
    void writeText(DB::WriteBuffer & wb) const
    {
        for (size_t i = 0; i < NUM_BUCKETS; ++i)
        {
            if (i != 0)
                DB::writeChar(',', wb);
            impls[i].writeText(wb);
        }
    }

    /// Reads all buckets from `rb` one after another, in bucket order (counterpart of write()).
    void read(DB::ReadBuffer & rb)
    {
        for (auto & impl : impls)
            impl.read(rb);
    }

    /// Reads all buckets from `rb` in text form, expecting ',' between buckets (counterpart of writeText()).
    void readText(DB::ReadBuffer & rb)
    {
        for (size_t i = 0; i < NUM_BUCKETS; ++i)
        {
            if (i != 0)
                DB::assertChar(',', rb);
            impls[i].readText(rb);
        }
    }

    /// Sum of size() over all buckets.
    size_t size() const
    {
        size_t res = 0;
        for (const auto & impl : impls)
            res += impl.size();

        return res;
    }

    /// True if every bucket reports empty().
    bool empty() const
    {
        for (const auto & impl : impls)
            if (!impl.empty())
                return false;

        return true;
    }

    /// Sum of getBufferSizeInBytes() over all buckets.
    size_t getBufferSizeInBytes() const
    {
        size_t res = 0;
        for (const auto & impl : impls)
            res += impl.getBufferSizeInBytes();

        return res;
    }
};
Introduce String Hash Map. It speeds up aggregation over short string keys. Use it as a default aggregation method for string keys. 2019-08-20 17:38:56 +00:00			`#pragma once`

			`#include <Common/HashTable/StringHashTable.h>`

			`template <typename SubMaps, typename ImplTable = StringHashTable<SubMaps>, size_t BITS_FOR_BUCKET = 8>`
			`class TwoLevelStringHashTable : private boost::noncopyable`
			`{`
			`protected:`
			`using HashValue = size_t;`
			`using Self = TwoLevelStringHashTable;`

			`public:`
			`using Key = StringRef;`
			`using Impl = ImplTable;`

			`static constexpr size_t NUM_BUCKETS = 1ULL << BITS_FOR_BUCKET;`
			`static constexpr size_t MAX_BUCKET = NUM_BUCKETS - 1;`

			`// TODO: currently hashing contains redundant computations when doing distributed or external aggregations`
			`size_t hash(const Key & x) const`
			`{`
Unify hash tables interface. 2019-10-29 15:16:51 +00:00			`return const_cast<Self &>(this).dispatch(this, x, [&](const auto &, const auto &, size_t hash) { return hash; });`
Introduce String Hash Map. It speeds up aggregation over short string keys. Use it as a default aggregation method for string keys. 2019-08-20 17:38:56 +00:00			`}`

			`size_t operator()(const Key & x) const { return hash(x); }`

			`/// NOTE Bad for hash tables with more than 2^32 cells.`
			`static size_t getBucketFromHash(size_t hash_value) { return (hash_value >> (32 - BITS_FOR_BUCKET)) & MAX_BUCKET; }`

			`public:`
			`using key_type = typename Impl::key_type;`
Unify hash tables interface. 2019-10-29 15:16:51 +00:00			`using mapped_type = typename Impl::mapped_type;`
Introduce String Hash Map. It speeds up aggregation over short string keys. Use it as a default aggregation method for string keys. 2019-08-20 17:38:56 +00:00			`using value_type = typename Impl::value_type;`
Unify hash tables interface. 2019-10-29 15:16:51 +00:00			`using cell_type = typename Impl::cell_type;`

Introduce String Hash Map. It speeds up aggregation over short string keys. Use it as a default aggregation method for string keys. 2019-08-20 17:38:56 +00:00			`using LookupResult = typename Impl::LookupResult;`
Unify hash tables interface. 2019-10-29 15:16:51 +00:00			`using ConstLookupResult = typename Impl::ConstLookupResult;`
Introduce String Hash Map. It speeds up aggregation over short string keys. Use it as a default aggregation method for string keys. 2019-08-20 17:38:56 +00:00
			`Impl impls[NUM_BUCKETS];`

			`TwoLevelStringHashTable() {}`

			`template <typename Source>`
			`TwoLevelStringHashTable(const Source & src)`
			`{`
			`if (src.m0.hasZero())`
			`impls[0].m0.setHasZero(*src.m0.zeroValue());`

			`for (auto & v : src.m1)`
			`{`
			`size_t hash_value = v.getHash(src.m1);`
			`size_t buck = getBucketFromHash(hash_value);`
			`impls[buck].m1.insertUniqueNonZero(&v, hash_value);`
			`}`
			`for (auto & v : src.m2)`
			`{`
			`size_t hash_value = v.getHash(src.m2);`
			`size_t buck = getBucketFromHash(hash_value);`
			`impls[buck].m2.insertUniqueNonZero(&v, hash_value);`
			`}`
			`for (auto & v : src.m3)`
			`{`
			`size_t hash_value = v.getHash(src.m3);`
			`size_t buck = getBucketFromHash(hash_value);`
			`impls[buck].m3.insertUniqueNonZero(&v, hash_value);`
			`}`
			`for (auto & v : src.ms)`
			`{`
			`size_t hash_value = v.getHash(src.ms);`
			`size_t buck = getBucketFromHash(hash_value);`
			`impls[buck].ms.insertUniqueNonZero(&v, hash_value);`
			`}`
			`}`

Port the latest dispatch() improvements. 2019-10-22 10:43:52 +00:00			`// This function is mostly the same as StringHashTable::dispatch, but with`
			`// added bucket computation. See the comments there.`
Unify hash tables interface. 2019-10-29 15:16:51 +00:00			`template <typename Self, typename Func, typename KeyHolder>`
			`static auto ALWAYS_INLINE dispatch(Self & self, KeyHolder && key_holder, Func && func)`
Introduce String Hash Map. It speeds up aggregation over short string keys. Use it as a default aggregation method for string keys. 2019-08-20 17:38:56 +00:00			`{`
			`const StringRef & x = keyHolderGetKey(key_holder);`
Port the latest dispatch() improvements. 2019-10-22 10:43:52 +00:00			`const size_t sz = x.size;`
			`if (sz == 0)`
			`{`
			`keyHolderDiscardKey(key_holder);`
Unify hash tables interface. 2019-10-29 15:16:51 +00:00			`return func(self.impls[0].m0, VoidKey{}, 0);`
Port the latest dispatch() improvements. 2019-10-22 10:43:52 +00:00			`}`

Introduce String Hash Map. It speeds up aggregation over short string keys. Use it as a default aggregation method for string keys. 2019-08-20 17:38:56 +00:00			`const char * p = x.data;`
			`// pending bits that needs to be shifted out`
Port the latest dispatch() improvements. 2019-10-22 10:43:52 +00:00			`const char s = (-sz & 7) * 8;`
Introduce String Hash Map. It speeds up aggregation over short string keys. Use it as a default aggregation method for string keys. 2019-08-20 17:38:56 +00:00			`union`
			`{`
			`StringKey8 k8;`
			`StringKey16 k16;`
			`StringKey24 k24;`
			`UInt64 n[3];`
			`};`
			`StringHashTableHash hash;`
Port the latest dispatch() improvements. 2019-10-22 10:43:52 +00:00			`switch ((sz - 1) >> 3)`
Introduce String Hash Map. It speeds up aggregation over short string keys. Use it as a default aggregation method for string keys. 2019-08-20 17:38:56 +00:00			`{`
			`case 0:`
Port the latest dispatch() improvements. 2019-10-22 10:43:52 +00:00			`{`
Introduce String Hash Map. It speeds up aggregation over short string keys. Use it as a default aggregation method for string keys. 2019-08-20 17:38:56 +00:00			`// first half page`
			`if ((reinterpret_cast<uintptr_t>(p) & 2048) == 0)`
			`{`
			`memcpy(&n[0], p, 8);`
			`n[0] &= -1ul >> s;`
			`}`
			`else`
			`{`
			`const char * lp = x.data + x.size - 8;`
			`memcpy(&n[0], lp, 8);`
			`n[0] >>= s;`
			`}`
Port the latest dispatch() improvements. 2019-10-22 10:43:52 +00:00			`auto res = hash(k8);`
			`auto buck = getBucketFromHash(res);`
Introduce String Hash Map. It speeds up aggregation over short string keys. Use it as a default aggregation method for string keys. 2019-08-20 17:38:56 +00:00			`keyHolderDiscardKey(key_holder);`
Unify hash tables interface. 2019-10-29 15:16:51 +00:00			`return func(self.impls[buck].m1, k8, res);`
Introduce String Hash Map. It speeds up aggregation over short string keys. Use it as a default aggregation method for string keys. 2019-08-20 17:38:56 +00:00			`}`
Port the latest dispatch() improvements. 2019-10-22 10:43:52 +00:00			`case 1:`
			`{`
Introduce String Hash Map. It speeds up aggregation over short string keys. Use it as a default aggregation method for string keys. 2019-08-20 17:38:56 +00:00			`memcpy(&n[0], p, 8);`
			`const char * lp = x.data + x.size - 8;`
			`memcpy(&n[1], lp, 8);`
			`n[1] >>= s;`
Port the latest dispatch() improvements. 2019-10-22 10:43:52 +00:00			`auto res = hash(k16);`
			`auto buck = getBucketFromHash(res);`
Introduce String Hash Map. It speeds up aggregation over short string keys. Use it as a default aggregation method for string keys. 2019-08-20 17:38:56 +00:00			`keyHolderDiscardKey(key_holder);`
Unify hash tables interface. 2019-10-29 15:16:51 +00:00			`return func(self.impls[buck].m2, k16, res);`
Introduce String Hash Map. It speeds up aggregation over short string keys. Use it as a default aggregation method for string keys. 2019-08-20 17:38:56 +00:00			`}`
Port the latest dispatch() improvements. 2019-10-22 10:43:52 +00:00			`case 2:`
			`{`
Introduce String Hash Map. It speeds up aggregation over short string keys. Use it as a default aggregation method for string keys. 2019-08-20 17:38:56 +00:00			`memcpy(&n[0], p, 16);`
			`const char * lp = x.data + x.size - 8;`
			`memcpy(&n[2], lp, 8);`
			`n[2] >>= s;`
Port the latest dispatch() improvements. 2019-10-22 10:43:52 +00:00			`auto res = hash(k24);`
			`auto buck = getBucketFromHash(res);`
Introduce String Hash Map. It speeds up aggregation over short string keys. Use it as a default aggregation method for string keys. 2019-08-20 17:38:56 +00:00			`keyHolderDiscardKey(key_holder);`
Unify hash tables interface. 2019-10-29 15:16:51 +00:00			`return func(self.impls[buck].m3, k24, res);`
Introduce String Hash Map. It speeds up aggregation over short string keys. Use it as a default aggregation method for string keys. 2019-08-20 17:38:56 +00:00			`}`
Port the latest dispatch() improvements. 2019-10-22 10:43:52 +00:00			`default:`
			`{`
			`auto res = hash(x);`
			`auto buck = getBucketFromHash(res);`
Unify hash tables interface. 2019-10-29 15:16:51 +00:00			`return func(self.impls[buck].ms, std::forward<KeyHolder>(key_holder), res);`
Introduce String Hash Map. It speeds up aggregation over short string keys. Use it as a default aggregation method for string keys. 2019-08-20 17:38:56 +00:00			`}`
			`}`
			`}`

			`template <typename KeyHolder>`
			`void ALWAYS_INLINE emplace(KeyHolder && key_holder, LookupResult & it, bool & inserted)`
			`{`
Unify hash tables interface. 2019-10-29 15:16:51 +00:00			`dispatch(*this, key_holder, typename Impl::EmplaceCallable{it, inserted});`
			`}`

			`LookupResult ALWAYS_INLINE find(const Key x)`
			`{`
			`return dispatch(*this, x, typename Impl::FindCallable{});`
Introduce String Hash Map. It speeds up aggregation over short string keys. Use it as a default aggregation method for string keys. 2019-08-20 17:38:56 +00:00			`}`

Unify hash tables interface. 2019-10-29 15:16:51 +00:00			`ConstLookupResult ALWAYS_INLINE find(const Key x) const`
Introduce String Hash Map. It speeds up aggregation over short string keys. Use it as a default aggregation method for string keys. 2019-08-20 17:38:56 +00:00			`{`
Unify hash tables interface. 2019-10-29 15:16:51 +00:00			`return dispatch(*this, x, typename Impl::FindCallable{});`
Introduce String Hash Map. It speeds up aggregation over short string keys. Use it as a default aggregation method for string keys. 2019-08-20 17:38:56 +00:00			`}`

			`void write(DB::WriteBuffer & wb) const`
			`{`
			`for (size_t i = 0; i < NUM_BUCKETS; ++i)`
			`impls[i].write(wb);`
			`}`

			`void writeText(DB::WriteBuffer & wb) const`
			`{`
			`for (size_t i = 0; i < NUM_BUCKETS; ++i)`
			`{`
			`if (i != 0)`
			`DB::writeChar(',', wb);`
			`impls[i].writeText(wb);`
			`}`
			`}`

			`void read(DB::ReadBuffer & rb)`
			`{`
			`for (size_t i = 0; i < NUM_BUCKETS; ++i)`
			`impls[i].read(rb);`
			`}`

			`void readText(DB::ReadBuffer & rb)`
			`{`
			`for (size_t i = 0; i < NUM_BUCKETS; ++i)`
			`{`
			`if (i != 0)`
			`DB::assertChar(',', rb);`
			`impls[i].readText(rb);`
			`}`
			`}`

			`size_t size() const`
			`{`
			`size_t res = 0;`
			`for (size_t i = 0; i < NUM_BUCKETS; ++i)`
			`res += impls[i].size();`

			`return res;`
			`}`

			`bool empty() const`
			`{`
			`for (size_t i = 0; i < NUM_BUCKETS; ++i)`
			`if (!impls[i].empty())`
			`return false;`

			`return true;`
			`}`

			`size_t getBufferSizeInBytes() const`
			`{`
			`size_t res = 0;`
			`for (size_t i = 0; i < NUM_BUCKETS; ++i)`
			`res += impls[i].getBufferSizeInBytes();`

			`return res;`
			`}`
			`};`