fix bug in minMap and maxMap with zero values

2024-11-23 08:02:02 +00:00 · 2020-11-03 10:22:51 +00:00 · 2020-11-03 10:22:51 +00:00 · 2534ea3426
commit 2534ea3426
parent 8a68ee2547
3 changed files with 42 additions and 25 deletions
--- a/src/AggregateFunctions/AggregateFunctionSumMap.h
+++ b/src/AggregateFunctions/AggregateFunctionSumMap.h
@ -56,7 +56,7 @@ struct AggregateFunctionMapData
  * minMap and maxMap share the same idea, but calculate min and max correspondingly.
  */

-template <typename T, typename Derived, typename Visitor, bool overflow, bool tuple_argument>
+template <typename T, typename Derived, typename Visitor, bool overflow, bool tuple_argument, bool compact>
 class AggregateFunctionMapBase : public IAggregateFunctionDataHelper<
    AggregateFunctionMapData<NearestFieldType<T>>, Derived>
 {
@ -255,23 +255,27 @@ public:
    {
        // Final step does compaction of keys that have zero values, this mutates the state
        auto & merged_maps = this->data(place).merged_maps;
-        for (auto it = merged_maps.cbegin(); it != merged_maps.cend();)
-        {
-            // Key is not compacted if it has at least one non-zero value
-            bool erase = true;
-            for (size_t col = 0; col < values_types.size(); ++col)
-            {
-                if (it->second[col] != values_types[col]->getDefault())
-                {
-                    erase = false;
-                    break;
-                }
-            }

-            if (erase)
-                it = merged_maps.erase(it);
-            else
-                ++it;
+        if constexpr (compact)
+        {
+            for (auto it = merged_maps.cbegin(); it != merged_maps.cend();)
+            {
+                // Key is not compacted if it has at least one non-zero value
+                bool erase = true;
+                for (size_t col = 0; col < values_types.size(); ++col)
+                {
+                    if (it->second[col] != values_types[col]->getDefault())
+                    {
+                        erase = false;
+                        break;
+                    }
+                }
+
+                if (erase)
+                    it = merged_maps.erase(it);
+                else
+                    ++it;
+            }
        }

        size_t size = merged_maps.size();
@ -314,11 +318,11 @@ public:

 template <typename T, bool overflow, bool tuple_argument>
 class AggregateFunctionSumMap final :
-    public AggregateFunctionMapBase<T, AggregateFunctionSumMap<T, overflow, tuple_argument>, FieldVisitorSum, overflow, tuple_argument>
+    public AggregateFunctionMapBase<T, AggregateFunctionSumMap<T, overflow, tuple_argument>, FieldVisitorSum, overflow, tuple_argument, true>
 {
 private:
    using Self = AggregateFunctionSumMap<T, overflow, tuple_argument>;
-    using Base = AggregateFunctionMapBase<T, Self, FieldVisitorSum, overflow, tuple_argument>;
+    using Base = AggregateFunctionMapBase<T, Self, FieldVisitorSum, overflow, tuple_argument, true>;

 public:
    AggregateFunctionSumMap(const DataTypePtr & keys_type_,
@ -342,11 +346,12 @@ class AggregateFunctionSumMapFiltered final :
        AggregateFunctionSumMapFiltered<T, overflow, tuple_argument>,
        FieldVisitorSum,
        overflow,
-        tuple_argument>
+        tuple_argument,
+        true>
 {
 private:
    using Self = AggregateFunctionSumMapFiltered<T, overflow, tuple_argument>;
-    using Base = AggregateFunctionMapBase<T, Self, FieldVisitorSum, overflow, tuple_argument>;
+    using Base = AggregateFunctionMapBase<T, Self, FieldVisitorSum, overflow, tuple_argument, true>;

    /// ARCADIA_BUILD disallow unordered_set for big ints for some reason
    static constexpr const bool allow_hash = !OverBigInt<T>;
@ -474,11 +479,11 @@ public:

 template <typename T, bool tuple_argument>
 class AggregateFunctionMinMap final :
-    public AggregateFunctionMapBase<T, AggregateFunctionMinMap<T, tuple_argument>, FieldVisitorMin, true, tuple_argument>
+    public AggregateFunctionMapBase<T, AggregateFunctionMinMap<T, tuple_argument>, FieldVisitorMin, true, tuple_argument, false>
 {
 private:
    using Self = AggregateFunctionMinMap<T, tuple_argument>;
-    using Base = AggregateFunctionMapBase<T, Self, FieldVisitorMin, true, tuple_argument>;
+    using Base = AggregateFunctionMapBase<T, Self, FieldVisitorMin, true, tuple_argument, false>;

 public:
    AggregateFunctionMinMap(const DataTypePtr & keys_type_,
@ -498,11 +503,11 @@ public:

 template <typename T, bool tuple_argument>
 class AggregateFunctionMaxMap final :
-    public AggregateFunctionMapBase<T, AggregateFunctionMaxMap<T, tuple_argument>, FieldVisitorMax, true, tuple_argument>
+    public AggregateFunctionMapBase<T, AggregateFunctionMaxMap<T, tuple_argument>, FieldVisitorMax, true, tuple_argument, false>
 {
 private:
    using Self = AggregateFunctionMaxMap<T, tuple_argument>;
-    using Base = AggregateFunctionMapBase<T, Self, FieldVisitorMax, true, tuple_argument>;
+    using Base = AggregateFunctionMapBase<T, Self, FieldVisitorMax, true, tuple_argument, false>;

 public:
    AggregateFunctionMaxMap(const DataTypePtr & keys_type_,
--- a/tests/queries/0_stateless/01280_min_map_max_map.reference
+++ b/tests/queries/0_stateless/01280_min_map_max_map.reference
@ -22,3 +22,8 @@
 (['1970-01-01 03:00:01'],[2])
 ([1.01],[2])
 (['a'],[2])
+([1,2],[0,0])
+([1,2],[0,0])
+(['A','B'],['',''])
+(['A','B'],['',''])
+([],[])
--- a/tests/queries/0_stateless/01280_min_map_max_map.sql
+++ b/tests/queries/0_stateless/01280_min_map_max_map.sql
@ -31,3 +31,10 @@ select maxMap(val, cnt) from values ('val Array(Date), cnt Array(Int16)',  ([1],
 select maxMap(val, cnt) from values ('val Array(DateTime(\'Europe/Moscow\')), cnt Array(Int32)',  ([1], [1]), ([1], [2]));
 select maxMap(val, cnt) from values ('val Array(Decimal(10, 2)), cnt Array(Int16)',  (['1.01'], [1]), (['1.01'], [2]));
 select maxMap(val, cnt) from values ('val Array(Enum16(\'a\'=1)), cnt Array(Int16)',  (['a'], [1]), (['a'], [2]));
+
+-- bugfix, minMap and maxMap should not remove values with zero and empty strings but this behavior should not affect sumMap
+select minMap(val, cnt) from values ('val Array(UInt64), cnt Array(UInt64)',  ([1], [0]), ([2], [0]));
+select maxMap(val, cnt) from values ('val Array(UInt64), cnt Array(UInt64)',  ([1], [0]), ([2], [0]));
+select minMap(val, cnt) from values ('val Array(String), cnt Array(String)',  (['A'], ['']), (['B'], ['']));
+select minMap(val, cnt) from values ('val Array(String), cnt Array(String)',  (['A'], ['']), (['B'], ['']));
+select sumMap(val, cnt) from values ('val Array(UInt64), cnt Array(UInt64)',  ([1], [0]), ([2], [0]));