From 3a38d4ed50c62f5fcf6a083f307b99f27e2e07ad Mon Sep 17 00:00:00 2001
From: ogorbacheva <ogorbacheva@yandex-team.ru>
Date: Tue, 22 Jan 2019 14:01:05 +0300
Subject: [PATCH 01/63] Doc fix: delete VerticalRaw format and remove escaping
 from Pretty and Vertical formats

---
 docs/en/interfaces/formats.md | 44 ++++++++++++++---------------------
 1 file changed, 18 insertions(+), 26 deletions(-)

diff --git a/docs/en/interfaces/formats.md b/docs/en/interfaces/formats.md
index c47e75142df..54d839a99d3 100644
--- a/docs/en/interfaces/formats.md
+++ b/docs/en/interfaces/formats.md
@@ -14,7 +14,6 @@ The table below lists supported formats and how they can be used in `INSERT` and
 | [CSVWithNames](#csvwithnames) | ✔ | ✔ |
 | [Values](#values) | ✔ | ✔ |
 | [Vertical](#vertical) | ✗ | ✔ |
-| [VerticalRaw](#verticalraw) | ✗ | ✔ |
 | [JSON](#json) | ✗ | ✔ |
 | [JSONCompact](#jsoncompact) | ✗ | ✔ |
 | [JSONEachRow](#jsoneachrow) | ✔ | ✔ |
@@ -355,6 +354,19 @@ SELECT * FROM t_null
 └───┴──────┘
 ```
 
+Rows are not escaped in `Pretty` format:
+
+``` sql
+:) SELECT 'String with \'quotes\' and \t character' AS Test_escaping
+FORMAT Pretty
+
+┏━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━┓
+┃ Test_escaping                             ┃
+┡━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━┩
+│ String with 'quotes' and 	 character      │
+└───────────────────────────────────────────┘
+```
+
 To avoid dumping too much data to the terminal, only the first 10,000 rows are printed. If the number of rows is greater than or equal to 10,000, the message "Showed first 10 000" is printed.
 This format is only appropriate for outputting a query result, but not for parsing (retrieving data to insert in a table).
 
@@ -461,38 +473,18 @@ Row 1:
 x: 1
 y: ᴺᵁᴸᴸ
 ```
-
-This format is only appropriate for outputting a query result, but not for parsing (retrieving data to insert in a table).
-
-## VerticalRaw {#verticalraw}
-
-Differs from `Vertical` format in that the rows are not escaped.
-This format is only appropriate for outputting a query result, but not for parsing (retrieving data to insert in a table).
-
-Examples:
-
-```
-:) SHOW CREATE TABLE geonames FORMAT VerticalRaw;
-Row 1:
-──────
-statement: CREATE TABLE default.geonames ( geonameid UInt32, date Date DEFAULT CAST('2017-12-08' AS Date)) ENGINE = MergeTree(date, geonameid, 8192)
-
-:) SELECT 'string with \'quotes\' and \t with some special \n characters' AS test FORMAT VerticalRaw;
-Row 1:
-──────
-test: string with 'quotes' and   with some special
- characters
-```
-
-Compare with the Vertical format:
+Rows are not escaped in `Vertical` format: 
 
 ```
 :) SELECT 'string with \'quotes\' and \t with some special \n characters' AS test FORMAT Vertical;
 Row 1:
 ──────
-test: string with \'quotes\' and \t with some special \n characters
+test: string with 'quotes' and 	 with some special 
+ characters
 ```
 
+This format is only appropriate for outputting a query result, but not for parsing (retrieving data to insert in a table).
+
 ## XML {#xml}
 
 XML format is suitable only for output, not for parsing. Example:

From fd7c1589bb573475a3d007ebd73227f5359eff26 Mon Sep 17 00:00:00 2001
From: ogorbacheva <ogorbacheva@yandex-team.ru>
Date: Tue, 22 Jan 2019 14:10:55 +0300
Subject: [PATCH 02/63] Doc fix: editing text about escaping

---
 docs/en/interfaces/formats.md | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/docs/en/interfaces/formats.md b/docs/en/interfaces/formats.md
index 54d839a99d3..cdb1422b480 100644
--- a/docs/en/interfaces/formats.md
+++ b/docs/en/interfaces/formats.md
@@ -357,11 +357,11 @@ SELECT * FROM t_null
 Rows are not escaped in `Pretty` format:
 
 ``` sql
-:) SELECT 'String with \'quotes\' and \t character' AS Test_escaping
-FORMAT Pretty
+:) SELECT 'String with \'quotes\' and \t character' AS Escaping_test
+FORMAT Pretty;
 
 ┏━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━┓
-┃ Test_escaping                             ┃
+┃ Escaping_test                             ┃
 ┡━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━┩
 │ String with 'quotes' and 	 character      │
 └───────────────────────────────────────────┘

From a650e1ed08095bccbb3608243d20d7d7e86e662f Mon Sep 17 00:00:00 2001
From: ogorbacheva <ogorbacheva@yandex-team.ru>
Date: Tue, 22 Jan 2019 15:07:34 +0300
Subject: [PATCH 03/63] Doc fix: fix example in pretty format

---
 docs/en/interfaces/formats.md | 18 +++++++++++-------
 1 file changed, 11 insertions(+), 7 deletions(-)

diff --git a/docs/en/interfaces/formats.md b/docs/en/interfaces/formats.md
index cdb1422b480..9c888eaa3ad 100644
--- a/docs/en/interfaces/formats.md
+++ b/docs/en/interfaces/formats.md
@@ -345,11 +345,13 @@ Each result block is output as a separate table. This is necessary so that block
 [NULL](../query_language/syntax.md) is output as `ᴺᵁᴸᴸ`.
 
 ``` sql
-SELECT * FROM t_null
+SELECT * FROM t_null FORMAT Pretty;
 ```
 
 ```
-┌─x─┬────y─┐
+┏━━━┳━━━━━━┓
+┃ x ┃ y    ┃
+┡━━━╇━━━━━━┩
 │ 1 │ ᴺᵁᴸᴸ │
 └───┴──────┘
 ```
@@ -359,12 +361,14 @@ Rows are not escaped in `Pretty` format:
 ``` sql
 :) SELECT 'String with \'quotes\' and \t character' AS Escaping_test
 FORMAT Pretty;
+```
 
-┏━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━┓
-┃ Escaping_test                             ┃
-┡━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━┩
-│ String with 'quotes' and 	 character      │
-└───────────────────────────────────────────┘
+```
+┏━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━┓
+┃ Escaping_test                            ┃
+┡━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━┩
+│ String with 'quotes' and      character  │
+└──────────────────────────────────────────┘
 ```
 
 To avoid dumping too much data to the terminal, only the first 10,000 rows are printed. If the number of rows is greater than or equal to 10,000, the message "Showed first 10 000" is printed.

From 996263490c9314e68e7ce65cfff8367a392eec73 Mon Sep 17 00:00:00 2001
From: ogorbacheva <ogorbacheva@yandex-team.ru>
Date: Tue, 22 Jan 2019 15:59:25 +0300
Subject: [PATCH 04/63] Doc fix: fix example in pretty format

---
 docs/en/interfaces/formats.md | 32 ++++++++++++++++----------------
 1 file changed, 16 insertions(+), 16 deletions(-)

diff --git a/docs/en/interfaces/formats.md b/docs/en/interfaces/formats.md
index 9c888eaa3ad..1d32406af34 100644
--- a/docs/en/interfaces/formats.md
+++ b/docs/en/interfaces/formats.md
@@ -344,37 +344,34 @@ Each result block is output as a separate table. This is necessary so that block
 
 [NULL](../query_language/syntax.md) is output as `ᴺᵁᴸᴸ`.
 
+Example (shown for the [PrettyCompact](#prettycompact) format):
+
 ``` sql
-SELECT * FROM t_null FORMAT Pretty;
+SELECT * FROM t_null FORMAT 
 ```
 
-```
-┏━━━┳━━━━━━┓
-┃ x ┃ y    ┃
-┡━━━╇━━━━━━┩
+``` text
+┌─x─┬─y────┐
 │ 1 │ ᴺᵁᴸᴸ │
 └───┴──────┘
 ```
 
-Rows are not escaped in `Pretty` format:
+Rows are not escaped in Pretty* format. Example is shown for the [PrettyCompact](#prettycompact) format:
 
 ``` sql
-:) SELECT 'String with \'quotes\' and \t character' AS Escaping_test
-FORMAT Pretty;
+SELECT 'String with \'quotes\' and \t character' AS Escaping_test
 ```
 
-```
-┏━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━┓
-┃ Escaping_test                            ┃
-┡━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━┩
-│ String with 'quotes' and      character  │
+``` 
+┌─Escaping_test────────────────────────────┐
+│ String with 'quotes' and 	 character     │
 └──────────────────────────────────────────┘
 ```
 
 To avoid dumping too much data to the terminal, only the first 10,000 rows are printed. If the number of rows is greater than or equal to 10,000, the message "Showed first 10 000" is printed.
 This format is only appropriate for outputting a query result, but not for parsing (retrieving data to insert in a table).
 
-The Pretty format supports outputting total values (when using WITH TOTALS) and extremes (when 'extremes' is set to 1). In these cases, total values and extreme values are output after the main data, in separate tables. Example (shown for the PrettyCompact format):
+The Pretty format supports outputting total values (when using WITH TOTALS) and extremes (when 'extremes' is set to 1). In these cases, total values and extreme values are output after the main data, in separate tables. Example (shown for the [PrettyCompact](#prettycompact) format):
 
 ``` sql
 SELECT EventDate, count() AS c FROM test.hits GROUP BY EventDate WITH TOTALS ORDER BY EventDate FORMAT PrettyCompact
@@ -477,10 +474,13 @@ Row 1:
 x: 1
 y: ᴺᵁᴸᴸ
 ```
-Rows are not escaped in `Vertical` format: 
+Rows are not escaped in Vertical format: 
+
+``` sql
+SELECT 'string with \'quotes\' and \t with some special \n characters' AS test FORMAT Vertical
+```
 
 ```
-:) SELECT 'string with \'quotes\' and \t with some special \n characters' AS test FORMAT Vertical;
 Row 1:
 ──────
 test: string with 'quotes' and 	 with some special 

From 0ce656856a01a2e0977b1660de57fcbc55adc409 Mon Sep 17 00:00:00 2001
From: ogorbacheva <ogorbacheva@yandex-team.ru>
Date: Tue, 22 Jan 2019 16:05:40 +0300
Subject: [PATCH 05/63] Doc fix: last fixes

---
 docs/en/interfaces/formats.md | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/docs/en/interfaces/formats.md b/docs/en/interfaces/formats.md
index 1d32406af34..24522507b71 100644
--- a/docs/en/interfaces/formats.md
+++ b/docs/en/interfaces/formats.md
@@ -347,10 +347,10 @@ Each result block is output as a separate table. This is necessary so that block
 Example (shown for the [PrettyCompact](#prettycompact) format):
 
 ``` sql
-SELECT * FROM t_null FORMAT 
+SELECT * FROM t_null 
 ```
 
-``` text
+```
 ┌─x─┬─y────┐
 │ 1 │ ᴺᵁᴸᴸ │
 └───┴──────┘

From 64eb46fa6bf910575cbac40c0bf64273bc19ae4e Mon Sep 17 00:00:00 2001
From: ogorbacheva <ogorbacheva@yandex-team.ru>
Date: Tue, 22 Jan 2019 16:14:43 +0300
Subject: [PATCH 06/63] Doc fix: last fixes

---
 docs/en/interfaces/formats.md | 14 +++++++-------
 1 file changed, 7 insertions(+), 7 deletions(-)

diff --git a/docs/en/interfaces/formats.md b/docs/en/interfaces/formats.md
index 24522507b71..5e0c9801ff0 100644
--- a/docs/en/interfaces/formats.md
+++ b/docs/en/interfaces/formats.md
@@ -347,11 +347,11 @@ Each result block is output as a separate table. This is necessary so that block
 Example (shown for the [PrettyCompact](#prettycompact) format):
 
 ``` sql
-SELECT * FROM t_null 
+SELECT * FROM t_null
 ```
 
 ```
-┌─x─┬─y────┐
+┌─x─┬────y─┐
 │ 1 │ ᴺᵁᴸᴸ │
 └───┴──────┘
 ```
@@ -363,9 +363,9 @@ SELECT 'String with \'quotes\' and \t character' AS Escaping_test
 ```
 
 ``` 
-┌─Escaping_test────────────────────────────┐
-│ String with 'quotes' and 	 character     │
-└──────────────────────────────────────────┘
+┌─Escaping_test────────────────────────┐
+│ String with 'quotes' and 	 character │
+└──────────────────────────────────────┘
 ```
 
 To avoid dumping too much data to the terminal, only the first 10,000 rows are printed. If the number of rows is greater than or equal to 10,000, the message "Showed first 10 000" is printed.
@@ -402,7 +402,7 @@ Extremes:
 
 ## PrettyCompact {#prettycompact}
 
-Differs from `Pretty` in that the grid is drawn between rows and the result is more compact.
+Differs from [Pretty](#pretty) in that the grid is drawn between rows and the result is more compact.
 This format is used by default in the command-line client in interactive mode.
 
 ## PrettyCompactMonoBlock {#prettycompactmonoblock}
@@ -483,7 +483,7 @@ SELECT 'string with \'quotes\' and \t with some special \n characters' AS test F
 ```
 Row 1:
 ──────
-test: string with 'quotes' and 	 with some special 
+test: string with 'quotes' and 	 with some special
  characters
 ```
 

From 632398640646111d9753ecdff4d2d256da31c28e Mon Sep 17 00:00:00 2001
From: ogorbacheva <ogorbacheva@yandex-team.ru>
Date: Tue, 22 Jan 2019 16:17:24 +0300
Subject: [PATCH 07/63] Doc fix

---
 docs/en/interfaces/formats.md | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/docs/en/interfaces/formats.md b/docs/en/interfaces/formats.md
index 5e0c9801ff0..eddefaa9394 100644
--- a/docs/en/interfaces/formats.md
+++ b/docs/en/interfaces/formats.md
@@ -356,7 +356,7 @@ SELECT * FROM t_null
 └───┴──────┘
 ```
 
-Rows are not escaped in Pretty* format. Example is shown for the [PrettyCompact](#prettycompact) format:
+Rows are not escaped in Pretty* formats. Example is shown for the [PrettyCompact](#prettycompact) format:
 
 ``` sql
 SELECT 'String with \'quotes\' and \t character' AS Escaping_test

From 58a5a9dc0cdf5d1ff563fd33b68cba36f1a99dbe Mon Sep 17 00:00:00 2001
From: "Mikhail f. Shiryaev" <mr.felixoid@gmail.com>
Date: Sat, 16 Feb 2019 18:04:55 +0100
Subject: [PATCH 08/63] Fix "only_from_localhost" example

---
 dbms/programs/server/users.d/allow_only_from_localhost.xml | 1 -
 1 file changed, 1 deletion(-)

diff --git a/dbms/programs/server/users.d/allow_only_from_localhost.xml b/dbms/programs/server/users.d/allow_only_from_localhost.xml
index aad3a696521..bce5858ad41 100644
--- a/dbms/programs/server/users.d/allow_only_from_localhost.xml
+++ b/dbms/programs/server/users.d/allow_only_from_localhost.xml
@@ -4,7 +4,6 @@
         <default>
             <networks replace="replace">
                 <ip>::1</ip>
-                <ip>0.0.0.0</ip>
                 <ip>127.0.0.1</ip>
             </networks>
         </default>

From 88d63a0b3ad43fccb6eb429a995546eee47e6fd9 Mon Sep 17 00:00:00 2001
From: "Mikhail f. Shiryaev" <mr.felixoid@gmail.com>
Date: Sun, 17 Feb 2019 21:56:27 +0100
Subject: [PATCH 09/63] Use pair of patterns to make combined RollupRules

---
 .../GraphiteRollupSortedBlockInputStream.cpp  | 90 +++++++++++++++----
 .../GraphiteRollupSortedBlockInputStream.h    | 39 ++++++--
 .../MergeTree/registerStorageMergeTree.cpp    | 29 ++++--
 .../Storages/System/StorageSystemGraphite.cpp | 19 +++-
 4 files changed, 145 insertions(+), 32 deletions(-)

diff --git a/dbms/src/DataStreams/GraphiteRollupSortedBlockInputStream.cpp b/dbms/src/DataStreams/GraphiteRollupSortedBlockInputStream.cpp
index dc30a3e7a07..6c1983568bb 100644
--- a/dbms/src/DataStreams/GraphiteRollupSortedBlockInputStream.cpp
+++ b/dbms/src/DataStreams/GraphiteRollupSortedBlockInputStream.cpp
@@ -23,8 +23,11 @@ GraphiteRollupSortedBlockInputStream::GraphiteRollupSortedBlockInputStream(
 
     for (const auto & pattern : params.patterns)
     {
-        max_size_of_aggregate_state = std::max(max_size_of_aggregate_state, pattern.function->sizeOfData());
-        max_alignment_of_aggregate_state = std::max(max_alignment_of_aggregate_state, pattern.function->alignOfData());
+        if (pattern.function)
+        {
+            max_size_of_aggregate_state = std::max(max_size_of_aggregate_state, pattern.function->sizeOfData());
+            max_alignment_of_aggregate_state = std::max(max_alignment_of_aggregate_state, pattern.function->alignOfData());
+        }
     }
 
     place_for_aggregate_state.reset(max_size_of_aggregate_state, max_alignment_of_aggregate_state);
@@ -41,13 +44,61 @@ GraphiteRollupSortedBlockInputStream::GraphiteRollupSortedBlockInputStream(
 }
 
 
-const Graphite::Pattern * GraphiteRollupSortedBlockInputStream::selectPatternForPath(StringRef path) const
+Graphite::RollupRule GraphiteRollupSortedBlockInputStream::selectPatternForPath(StringRef path) const
 {
+    const Graphite::Pattern * first_match = &undef_pattern;
+
     for (const auto & pattern : params.patterns)
         if (!pattern.regexp || pattern.regexp->match(path.data, path.size))
-            return &pattern;
+        {
+            if (!pattern.regexp)
+            {
+                /// Default pattern
+                if (first_match->type == first_match->TypeUndef && pattern.type == pattern.TypeAll)
+                {
+                    /// There is only default pattern for both retention and aggregation
+                    return std::pair(&pattern, &pattern);
+                }
+                if (pattern.type != first_match->type)
+                {
+                    if (first_match->type == first_match->TypeRetention)
+                    {
+                        return std::pair(first_match, &pattern);
+                    }
+                    if (first_match->type == first_match->TypeAggregation)
+                    {
+                        return std::pair(&pattern, first_match);
+                    }
+                }
+            }
+            else
+            {
+                /// General pattern with matched path
+                if (pattern.type == pattern.TypeAll)
+                {
+                   /// Only for not default patterns with both function and retention parameters
+                   return std::pair(&pattern, &pattern);
+                }
+                if (first_match->type == first_match->TypeUndef)
+                {
+                    first_match = &pattern;
+                    continue;
+                }
+                if (pattern.type != first_match->type)
+                {
+                    if (first_match->type == first_match->TypeRetention)
+                    {
+                        return std::pair(first_match, &pattern);
+                    }
+                    if (first_match->type == first_match->TypeAggregation)
+                    {
+                        return std::pair(&pattern, first_match);
+                    }
+                }
+            }
+        }
 
-    return nullptr;
+    return {nullptr, nullptr};
 }
 
 
@@ -142,14 +193,15 @@ void GraphiteRollupSortedBlockInputStream::merge(MutableColumns & merged_columns
             if (started_rows)
                 accumulateRow(current_subgroup_newest_row);
 
-            const Graphite::Pattern * next_pattern = current_pattern;
+            Graphite::RollupRule next_rule = current_rule;
             if (new_path)
-                next_pattern = selectPatternForPath(next_path);
+                next_rule = selectPatternForPath(next_path);
 
+            const Graphite::RetentionPattern * retention_pattern = std::get<0>(next_rule);
             time_t next_time_rounded;
-            if (next_pattern)
+            if (retention_pattern)
             {
-                UInt32 precision = selectPrecision(next_pattern->retentions, next_row_time);
+                UInt32 precision = selectPrecision(retention_pattern->retentions, next_row_time);
                 next_time_rounded = roundTimeToPrecision(date_lut, next_row_time, precision);
             }
             else
@@ -177,7 +229,7 @@ void GraphiteRollupSortedBlockInputStream::merge(MutableColumns & merged_columns
                 /// At this point previous row has been fully processed, so we can advance the loop
                 /// (substitute current_* values for next_*, advance the cursor).
 
-                startNextGroup(merged_columns, next_cursor, next_pattern);
+                startNextGroup(merged_columns, next_cursor, next_rule);
                 ++started_rows;
 
                 current_time_rounded = next_time_rounded;
@@ -229,8 +281,10 @@ void GraphiteRollupSortedBlockInputStream::merge(MutableColumns & merged_columns
 
 template <typename TSortCursor>
 void GraphiteRollupSortedBlockInputStream::startNextGroup(MutableColumns & merged_columns, TSortCursor & cursor,
-                                                          const Graphite::Pattern * next_pattern)
+                                                          Graphite::RollupRule next_rule)
 {
+    const Graphite::AggregationPattern * aggregation_pattern = std::get<1>(next_rule);
+
     /// Copy unmodified column values (including path column).
     for (size_t i = 0, size = unmodified_column_numbers.size(); i < size; ++i)
     {
@@ -238,13 +292,13 @@ void GraphiteRollupSortedBlockInputStream::startNextGroup(MutableColumns & merge
         merged_columns[j]->insertFrom(*cursor->all_columns[j], cursor->pos);
     }
 
-    if (next_pattern)
+    if (aggregation_pattern)
     {
-        next_pattern->function->create(place_for_aggregate_state.data());
+        aggregation_pattern->function->create(place_for_aggregate_state.data());
         aggregate_state_created = true;
     }
 
-    current_pattern = next_pattern;
+    current_rule = next_rule;
 }
 
 
@@ -255,10 +309,11 @@ void GraphiteRollupSortedBlockInputStream::finishCurrentGroup(MutableColumns & m
     merged_columns[version_column_num]->insertFrom(
         *(*current_subgroup_newest_row.columns)[version_column_num], current_subgroup_newest_row.row_num);
 
+    const Graphite::AggregationPattern * aggregation_pattern = std::get<1>(current_rule);
     if (aggregate_state_created)
     {
-        current_pattern->function->insertResultInto(place_for_aggregate_state.data(), *merged_columns[value_column_num]);
-        current_pattern->function->destroy(place_for_aggregate_state.data());
+        aggregation_pattern->function->insertResultInto(place_for_aggregate_state.data(), *merged_columns[value_column_num]);
+        aggregation_pattern->function->destroy(place_for_aggregate_state.data());
         aggregate_state_created = false;
     }
     else
@@ -269,8 +324,9 @@ void GraphiteRollupSortedBlockInputStream::finishCurrentGroup(MutableColumns & m
 
 void GraphiteRollupSortedBlockInputStream::accumulateRow(RowRef & row)
 {
+    const Graphite::AggregationPattern * aggregation_pattern = std::get<1>(current_rule);
     if (aggregate_state_created)
-        current_pattern->function->add(place_for_aggregate_state.data(), &(*row.columns)[value_column_num], row.row_num, nullptr);
+        aggregation_pattern->function->add(place_for_aggregate_state.data(), &(*row.columns)[value_column_num], row.row_num, nullptr);
 }
 
 }
diff --git a/dbms/src/DataStreams/GraphiteRollupSortedBlockInputStream.h b/dbms/src/DataStreams/GraphiteRollupSortedBlockInputStream.h
index e18522d6d25..bb2f81fc81f 100644
--- a/dbms/src/DataStreams/GraphiteRollupSortedBlockInputStream.h
+++ b/dbms/src/DataStreams/GraphiteRollupSortedBlockInputStream.h
@@ -27,11 +27,24 @@ namespace DB
   *
   * Each row in a table correspond to one value of one sensor.
   *
+  * A pattern should contain a function, a retention scheme, or both of them. The order of patterns matters as well:
+  *   * Aggregation OR retention patterns should be first
+  *   * Then aggregation AND retention full patterns have to be placed
+  *   * default pattern without regexp must be the last
+  *
   * Rollup rules are specified in the following way:
   *
   * pattern
   *     regexp
   *     function
+  * pattern
+  *     regexp
+  *     age -> precision
+  *     age -> precision
+  *     ...
+  * pattern
+  *     regexp
+  *     function
   *     age -> precision
   *     age -> precision
   *     ...
@@ -54,6 +67,10 @@ namespace DB
   *
   * <graphite_rollup>
   *     <pattern>
+  *         <regexp>\.max$</regexp>
+  *         <function>max</function>
+  *     </pattern>
+  *     <pattern>
   *         <regexp>click_cost</regexp>
   *         <function>any</function>
   *         <retention>
@@ -98,9 +115,12 @@ namespace Graphite
         std::shared_ptr<OptimizedRegularExpression> regexp;
         AggregateFunctionPtr function;
         Retentions retentions;    /// Must be ordered by 'age' descending.
+        enum { TypeUndef, TypeRetention, TypeAggregation, TypeAll } type = TypeAll; /// The type of defined pattern, filled automatically
     };
 
     using Patterns = std::vector<Pattern>;
+    using RetentionPattern = Pattern;
+    using AggregationPattern = Pattern;
 
     struct Params
     {
@@ -110,6 +130,8 @@ namespace Graphite
         String version_column_name;
         Graphite::Patterns patterns;
     };
+
+    using RollupRule = std::pair<const RetentionPattern *, const AggregationPattern *>;
 }
 
 /** Merges several sorted streams into one.
@@ -135,7 +157,7 @@ public:
     ~GraphiteRollupSortedBlockInputStream() override
     {
         if (aggregate_state_created)
-            current_pattern->function->destroy(place_for_aggregate_state.data());
+            std::get<1>(current_rule)->function->destroy(place_for_aggregate_state.data());
     }
 
 protected:
@@ -186,11 +208,18 @@ private:
     time_t current_time = 0;
     time_t current_time_rounded = 0;
 
-    const Graphite::Pattern * current_pattern = nullptr;
+    Graphite::RollupRule current_rule = {nullptr, nullptr};
     AlignedBuffer place_for_aggregate_state;
-    bool aggregate_state_created = false; /// Invariant: if true then current_pattern is not NULL.
+    bool aggregate_state_created = false; /// Invariant: if true then the aggregation pattern in current_rule is not NULL.
 
-    const Graphite::Pattern * selectPatternForPath(StringRef path) const;
+    const Graphite::Pattern undef_pattern =
+    { /// temporary empty pattern for selectPatternForPath
+        nullptr,
+        nullptr,
+        DB::Graphite::Retentions(),
+        undef_pattern.TypeUndef,
+    };
+    Graphite::RollupRule selectPatternForPath(StringRef path) const;
     UInt32 selectPrecision(const Graphite::Retentions & retentions, time_t time) const;
 
 
@@ -198,7 +227,7 @@ private:
 
     /// Insert the values into the resulting columns, which will not be changed in the future.
     template <typename TSortCursor>
-    void startNextGroup(MutableColumns & merged_columns, TSortCursor & cursor, const Graphite::Pattern * next_pattern);
+    void startNextGroup(MutableColumns & merged_columns, TSortCursor & cursor, Graphite::RollupRule next_pattern);
 
     /// Insert the calculated `time`, `value`, `version` values into the resulting columns by the last group of rows.
     void finishCurrentGroup(MutableColumns & merged_columns);
diff --git a/dbms/src/Storages/MergeTree/registerStorageMergeTree.cpp b/dbms/src/Storages/MergeTree/registerStorageMergeTree.cpp
index 1958b489023..103be508564 100644
--- a/dbms/src/Storages/MergeTree/registerStorageMergeTree.cpp
+++ b/dbms/src/Storages/MergeTree/registerStorageMergeTree.cpp
@@ -126,17 +126,32 @@ static void appendGraphitePattern(
             throw Exception("Unknown element in config: " + key, ErrorCodes::UNKNOWN_ELEMENT_IN_CONFIG);
     }
 
-    if (!pattern.function)
-        throw Exception("Aggregate function is mandatory for retention patterns in GraphiteMergeTree",
+    if (!pattern.function && pattern.retentions.empty())
+        throw Exception("At least one of an aggregate function or retention rules is mandatory for rollup patterns in GraphiteMergeTree",
             ErrorCodes::NO_ELEMENTS_IN_CONFIG);
 
-    if (pattern.function->allocatesMemoryInArena())
-        throw Exception("Aggregate function " + pattern.function->getName() + " isn't supported in GraphiteMergeTree",
-                        ErrorCodes::NOT_IMPLEMENTED);
+    if (!pattern.function)
+    {
+        pattern.type = pattern.TypeRetention;
+    }
+    else if (pattern.retentions.empty())
+    {
+        pattern.type = pattern.TypeAggregation;
+    }
+    else
+    {
+        pattern.type = pattern.TypeAll;
+    }
+
+    if (pattern.type & pattern.TypeAggregation) /// TypeAggregation or TypeAll
+        if (pattern.function->allocatesMemoryInArena())
+            throw Exception("Aggregate function " + pattern.function->getName() + " isn't supported in GraphiteMergeTree",
+                            ErrorCodes::NOT_IMPLEMENTED);
 
     /// retention should be in descending order of age.
-    std::sort(pattern.retentions.begin(), pattern.retentions.end(),
-        [] (const Graphite::Retention & a, const Graphite::Retention & b) { return a.age > b.age; });
+    if (pattern.type & pattern.TypeRetention) /// TypeRetention or TypeAll
+        std::sort(pattern.retentions.begin(), pattern.retentions.end(),
+            [] (const Graphite::Retention & a, const Graphite::Retention & b) { return a.age > b.age; });
 
     patterns.emplace_back(pattern);
 }
diff --git a/dbms/src/Storages/System/StorageSystemGraphite.cpp b/dbms/src/Storages/System/StorageSystemGraphite.cpp
index 8cd466c050e..d75eb71841e 100644
--- a/dbms/src/Storages/System/StorageSystemGraphite.cpp
+++ b/dbms/src/Storages/System/StorageSystemGraphite.cpp
@@ -148,13 +148,26 @@ void StorageSystemGraphite::fillData(MutableColumns & res_columns, const Context
         const auto patterns = readPatterns(config, section);
         for (const auto & pattern : patterns)
         {
-            for (const auto & ret : pattern.retentions)
+            if (!pattern.retentions.empty())
+            {
+                for (const auto & ret : pattern.retentions)
+                {
+                    res_columns[0]->insert(section);
+                    res_columns[1]->insert(pattern.regexp);
+                    res_columns[2]->insert(pattern.function);
+                    res_columns[3]->insert(ret.age);
+                    res_columns[4]->insert(ret.precision);
+                    res_columns[5]->insert(pattern.priority);
+                    res_columns[6]->insert(pattern.is_default);
+                }
+            }
+            else
             {
                 res_columns[0]->insert(section);
                 res_columns[1]->insert(pattern.regexp);
                 res_columns[2]->insert(pattern.function);
-                res_columns[3]->insert(ret.age);
-                res_columns[4]->insert(ret.precision);
+                res_columns[3]->insert(0);
+                res_columns[4]->insert(0);
                 res_columns[5]->insert(pattern.priority);
                 res_columns[6]->insert(pattern.is_default);
             }

From bc00ae383a99e641c46b5da6528775972ba3a4c8 Mon Sep 17 00:00:00 2001
From: "Mikhail f. Shiryaev" <mr.felixoid@gmail.com>
Date: Wed, 20 Feb 2019 17:16:46 +0100
Subject: [PATCH 10/63] Update documentation for GraphiteMergeTree rollup

---
 .../table_engines/graphitemergetree.md        |  13 +-
 .../table_engines/graphitemergetree.md        |  19 +-
 .../table_engines/graphitemergetree.md        | 149 +----------
 docs/zh/operations/table_engines/mergetree.md | 236 +-----------------
 4 files changed, 25 insertions(+), 392 deletions(-)
 mode change 100644 => 120000 docs/zh/operations/table_engines/graphitemergetree.md
 mode change 100644 => 120000 docs/zh/operations/table_engines/mergetree.md

diff --git a/docs/en/operations/table_engines/graphitemergetree.md b/docs/en/operations/table_engines/graphitemergetree.md
index 5e30a67c645..4231fb00f43 100644
--- a/docs/en/operations/table_engines/graphitemergetree.md
+++ b/docs/en/operations/table_engines/graphitemergetree.md
@@ -75,6 +75,13 @@ Rollup configuration structure:
 
 ```
 required-columns
+pattern
+    regexp
+    function
+pattern
+    regexp
+    age + precision
+    ...
 pattern
     regexp
     function
@@ -88,15 +95,13 @@ default
     ...
 ```
 
-When processing a row, ClickHouse checks the rules in the `pattern` section. If the metric name matches the `regexp`, the rules from the `pattern`section are applied; otherwise, the rules from the `default` section are used.
-
-The rules are defined with fields `function` and `age + precision`.
+When processing a row, ClickHouse checks the rules in the `pattern` sections. Each `pattern` section can contain a `function` parameter for aggregation, `retention` parameters, or both. If the metric name matches the `regexp`, the rules from the `pattern` section (or sections) are applied; otherwise, the rules from the `default` section are used.
 
 Fields for `pattern` and `default` sections:
 
 - `regexp`– A pattern for the metric name.
 - `age` – The minimum age of the data in seconds.
-- `precision`– How precisely to define the age of the data in seconds.
+- `precision`– How precisely to define the age of the data in seconds. Should be a divisor of 86400 (the number of seconds in a day).
 - `function` – The name of the aggregating function to apply to data whose age falls within the range `[age, age + precision]`.
 
 The `required-columns`:
diff --git a/docs/ru/operations/table_engines/graphitemergetree.md b/docs/ru/operations/table_engines/graphitemergetree.md
index 816fddff7f2..9c9afc9c9a6 100644
--- a/docs/ru/operations/table_engines/graphitemergetree.md
+++ b/docs/ru/operations/table_engines/graphitemergetree.md
@@ -72,12 +72,19 @@ CREATE TABLE [IF NOT EXISTS] [db.]table_name [ON CLUSTER cluster]
 
 ## Конфигурация rollup
 
-Настройки для прореживания данных задаются параметром [graphite_rollup](../server_settings/settings.md#server_settings-graphite_rollup) Имя параметра может быть любым. Можно создать несколько конфигураций и использовать их для разных таблиц.
+Настройки для прореживания данных задаются параметром [graphite_rollup](../server_settings/settings.md#server_settings-graphite_rollup). Имя параметра может быть любым. Можно создать несколько конфигураций и использовать их для разных таблиц.
 
 Структура конфигурации rollup:
 
 ```
 required-columns
+pattern
+    regexp
+    function
+pattern
+    regexp
+    age + precision
+    ...
 pattern
     regexp
     function
@@ -91,15 +98,13 @@ default
     ...
 ```
 
-При обработке строки ClickHouse проверяет правила в разделе `pattern`. Если имя метрики соответствует шаблону `regexp`, то  применяются правила из раздела `pattern`, в противном случае из раздела `default`.
-
-Правила определяются с помощью полей `function` и `age + precision`.
+При обработке строки ClickHouse проверяет правила в разделах `pattern`. Каждый из разделов `pattern` может содержать параметр `function` для агрегации, правила `retention` для прореживания или оба эти параметра. Если имя метрики соответствует шаблону `regexp`, то применяются правила из раздела (или разделов) `pattern`, в противном случае из раздела `default`.
 
 Поля для разделов `pattenrn` и `default`:
 
 - `regexp` – шаблон имени метрики.
 - `age` – минимальный возраст данных в секундах.
-- `precision` – точность определения возраста данных в секундах.
+- `precision` – точность определения возраста данных в секундах. Значение должно быть делителем числа 86400 (количество секунд в сутках).
 - `function` – имя агрегирующей функции, которую следует применить к данным, чей возраст оказался в интервале `[age, age + precision]`.
 
 `required-columns`:
@@ -117,6 +122,10 @@ default
     <time_column_name>Time</time_column_name>
     <value_column_name>Value</value_column_name>
     <version_column_name>Version</version_column_name>
+    <pattern>
+        <regexp>\.count$</regexp>
+        <function>sum</function>
+    </pattern>
     <pattern>
         <regexp>click_cost</regexp>
         <function>any</function>
diff --git a/docs/zh/operations/table_engines/graphitemergetree.md b/docs/zh/operations/table_engines/graphitemergetree.md
deleted file mode 100644
index fa15ab4daaf..00000000000
--- a/docs/zh/operations/table_engines/graphitemergetree.md
+++ /dev/null
@@ -1,148 +0,0 @@
-
-# GraphiteMergeTree
-
-This engine is designed for rollup (thinning and aggregating/averaging) [Graphite](http://graphite.readthedocs.io/en/latest/index.html) data. It may be helpful to developers who want to use ClickHouse as a data store for Graphite.
-
-You can use any ClickHouse table engine to store the Graphite data if you don't need rollup, but if you need a rollup use `GraphiteMergeTree`. The engine reduces the volume of storage and increases the efficiency of queries from Graphite.
-
-The engine inherits properties from [MergeTree](mergetree.md).
-
-## Creating a Table
-
-```sql
-CREATE TABLE [IF NOT EXISTS] [db.]table_name [ON CLUSTER cluster]
-(
-    Path String,
-    Time DateTime,
-    Value <Numeric_type>,
-    Version <Numeric_type>
-    ...
-) ENGINE = GraphiteMergeTree(config_section)
-[PARTITION BY expr]
-[ORDER BY expr]
-[SAMPLE BY expr]
-[SETTINGS name=value, ...]
-```
-
-For a description of request parameters, see [request description](../../query_language/create.md).
-
-A table for the Graphite date should have the following columns:
-
-- Column with the metric name (Graphite sensor). Data type: `String`.
-- Column with the time for measuring the metric. Data type: `DateTime`.
-- Column with the value of the metric. Data type: any numeric.
-- Column with the version of the metric with the same name and time of measurement. Data type: any numeric.
-
-    ClickHouse saves the rows with the highest version or the last written if versions are the same. Other rows are deleted during the merge of data parts.
-
-The names of these columns should be set in the rollup configuration.
-
-**GraphiteMergeTree parameters**
-
-- `config_section` — Name of the section in the configuration file, where are the rules of rollup set.
-
-**Query clauses**
-
-When creating a `GraphiteMergeTree` table, the same [clauses](mergetree.md) are required, as when creating a `MergeTree` table.
-
-<details markdown="1"><summary>Deprecated Method for Creating a Table</summary>
-
-!!! attention
-    Do not use this method in new projects and, if possible, switch the old projects to the method described above.
-
-```sql
-CREATE TABLE [IF NOT EXISTS] [db.]table_name [ON CLUSTER cluster]
-(
-    EventDate Date,
-    Path String,
-    Time DateTime,
-    Value <Numeric_type>,
-    Version <Numeric_type>
-    ...
-) ENGINE [=] GraphiteMergeTree(date-column [, sampling_expression], (primary, key), index_granularity, config_section)
-```
-
-All of the parameters excepting `config_section` have the same meaning as in `MergeTree`.
-
-- `config_section` — Name of the section in the configuration file, where are the rules of rollup set.
-</details>
-
-## Rollup configuration
-
-The settings for rollup are defined by the [graphite_rollup](../server_settings/settings.md) parameter in the server configuration. The name of the parameter could be any. You can create several configurations and use them for different tables.
-
-Rollup configuration structure:
-
-```
-required-columns
-pattern
-    regexp
-    function
-    age + precision
-    ...
-pattern
-    ...
-default
-    function
-    age + precision
-    ...
-```
-
-When processing a row, ClickHouse checks the rules in the `pattern` section. If the metric name matches the `regexp`, the rules from the `pattern`section are applied; otherwise, the rules from the `default` section are used.
-
-The rules are defined with fields `function` and `age + precision`.
-
-Fields for `pattern` and `default` sections:
-
-- `regexp`– A pattern for the metric name.
-- `age` – The minimum age of the data in seconds.
-- `precision`– How precisely to define the age of the data in seconds.
-- `function` – The name of the aggregating function to apply to data whose age falls within the range `[age, age + precision]`.
-
-The `required-columns`:
-
-- `path_column_name` — Column with the metric name (Graphite sensor).
-- `time_column_name` — Column with the time for measuring the metric.
-- `value_column_name` — Column with the value of the metric at the time set in `time_column_name`.
-- `version_column_name` — Column with the version timestamp of the metric with the same name and time remains in the database.
-
-
-Example of settings:
-
-```xml
-<graphite_rollup>
-    <path_column_name>Path</path_column_name>
-    <time_column_name>Time</time_column_name>
-    <value_column_name>Value</value_column_name>
-    <version_column_name>Version</version_column_name>
-    <pattern>
-        <regexp>click_cost</regexp>
-        <function>any</function>
-        <retention>
-            <age>0</age>
-            <precision>5</precision>
-        </retention>
-        <retention>
-            <age>86400</age>
-            <precision>60</precision>
-        </retention>
-    </pattern>
-    <default>
-        <function>max</function>
-        <retention>
-            <age>0</age>
-            <precision>60</precision>
-        </retention>
-        <retention>
-            <age>3600</age>
-            <precision>300</precision>
-        </retention>
-        <retention>
-            <age>86400</age>
-            <precision>3600</precision>
-        </retention>
-    </default>
-</graphite_rollup>
-```
-
-[Original article](https://clickhouse.yandex/docs/en/operations/table_engines/graphitemergetree/) <!--hide-->
diff --git a/docs/zh/operations/table_engines/graphitemergetree.md b/docs/zh/operations/table_engines/graphitemergetree.md
new file mode 120000
index 00000000000..654425d050a
--- /dev/null
+++ b/docs/zh/operations/table_engines/graphitemergetree.md
@@ -0,0 +1 @@
+../../../en/operations/table_engines/graphitemergetree.md
\ No newline at end of file
diff --git a/docs/zh/operations/table_engines/mergetree.md b/docs/zh/operations/table_engines/mergetree.md
deleted file mode 100644
index abac921f9df..00000000000
--- a/docs/zh/operations/table_engines/mergetree.md
+++ /dev/null
@@ -1,235 +0,0 @@
-# MergeTree {#table_engines-mergetree}
-
-The `MergeTree` engine and other engines of this family (`*MergeTree`) are the most robust ClickHousе table engines.
-
-The basic idea for `MergeTree` engines family is the following. When you have tremendous amount of a data that should be inserted into the table, you should write them quickly part by part and then merge parts by some rules in background. This method is much more efficient than constantly rewriting data in the storage at the insert.
-
-Main features:
-
-- Stores data sorted by primary key.
-
-    This allows you to create a small sparse index that helps find data faster.
-
-- This allows you to use partitions if the [partitioning key](custom_partitioning_key.md) is specified.
-
-    ClickHouse supports certain operations with partitions that are more effective than general operations on the same data with the same result. ClickHouse also automatically cuts off the partition data where the partitioning key is specified in the query. This also increases the query performance.
-
-- Data replication support.
-
-    The family of `ReplicatedMergeTree` tables is used for this. For more information, see the [Data replication](replication.md) section.
-
-- Data sampling support.
-
-    If necessary, you can set the data sampling method in the table.
-
-!!! info
-    The [Merge](merge.md) engine does not belong to the `*MergeTree` family.
-
-
-## Creating a Table
-
-```
-CREATE TABLE [IF NOT EXISTS] [db.]table_name [ON CLUSTER cluster]
-(
-    name1 [type1] [DEFAULT|MATERIALIZED|ALIAS expr1],
-    name2 [type2] [DEFAULT|MATERIALIZED|ALIAS expr2],
-    ...
-) ENGINE = MergeTree()
-[PARTITION BY expr]
-[ORDER BY expr]
-[PRIMARY KEY expr]
-[SAMPLE BY expr]
-[SETTINGS name=value, ...]
-```
-
-For a description of request parameters, see [request description](../../query_language/create.md).
-
-**Query clauses**
-
-- `ENGINE` - Name and parameters of the engine. `ENGINE = MergeTree()`. `MergeTree` engine does not have parameters.
-
-- `PARTITION BY` — The [partitioning key](custom_partitioning_key.md).
-
-    For partitioning by month, use the `toYYYYMM(date_column)` expression, where `date_column` is a column with a date of the type [Date](../../data_types/date.md). The partition names here have the `"YYYYMM"` format.
-
-- `ORDER BY` — The sorting key.
-
-    A tuple of columns or arbitrary expressions. Example: `ORDER BY (CounterID, EventDate)`.
-
-- `PRIMARY KEY` - The primary key if it [differs from the sorting key](mergetree.md).
-
-    By default the primary key is the same as the sorting key (which is specified by the `ORDER BY` clause).
-    Thus in most cases it is unnecessary to specify a separate `PRIMARY KEY` clause.
-
-- `SAMPLE BY` — An expression for sampling.
-
-    If a sampling expression is used, the primary key must contain it. Example:  
-    `SAMPLE BY intHash32(UserID) ORDER BY (CounterID, EventDate, intHash32(UserID))`.
-
-- `SETTINGS` — Additional parameters that control the behavior of the `MergeTree`:
-    - `index_granularity` — The granularity of an index. The number of data rows between the "marks" of an index. By default, 8192.
-
-**Example of sections setting**
-
-```
-ENGINE MergeTree() PARTITION BY toYYYYMM(EventDate) ORDER BY (CounterID, EventDate, intHash32(UserID)) SAMPLE BY intHash32(UserID) SETTINGS index_granularity=8192
-```
-
-In the example, we set partitioning by month.
-
-We also set an expression for sampling as a hash by the user ID. This allows you to pseudorandomize the data in the table for each `CounterID` and `EventDate`. If, when selecting the data, you define a [SAMPLE](../../query_language/select.md#select-sample-clause) clause, ClickHouse will return an evenly pseudorandom data sample for a subset of users.
-
-`index_granularity` could be omitted because 8192 is the default value.
-
-<details markdown="1"><summary>Deprecated Method for Creating a Table</summary>
-
-!!! attention
-    Do not use this method in new projects and, if possible, switch the old projects to the method described above.
-
-```
-CREATE TABLE [IF NOT EXISTS] [db.]table_name [ON CLUSTER cluster]
-(
-    name1 [type1] [DEFAULT|MATERIALIZED|ALIAS expr1],
-    name2 [type2] [DEFAULT|MATERIALIZED|ALIAS expr2],
-    ...
-) ENGINE [=] MergeTree(date-column [, sampling_expression], (primary, key), index_granularity)
-```
-
-**MergeTree() parameters**
-
-- `date-column` — The name of a column of the type [Date](../../data_types/date.md). ClickHouse automatically creates partitions by month on the basis of this column. The partition names are in the `"YYYYMM"` format.
-- `sampling_expression` — an expression for sampling.
-- `(primary, key)` — primary key. Type — [Tuple()](../../data_types/tuple.md- `index_granularity` — The granularity of an index. The number of data rows between the "marks" of an index. The value 8192 is appropriate for most tasks.
-
-**Example**
-
-```
-MergeTree(EventDate, intHash32(UserID), (CounterID, EventDate, intHash32(UserID)), 8192)
-```
-
-The `MergeTree` engine is configured in the same way as in the example above for the main engine configuration method.
-</details>
-
-## Data Storage
-
-A table consists of data *parts* sorted by primary key.
-
-When data is inserted in a table, separate data parts are created and each of them is lexicographically sorted by primary key. For example, if the primary key is `(CounterID, Date)`, the data in the part is sorted by `CounterID`, and within each `CounterID`, it is ordered by `Date`.
-
-Data belonging to different partitions are separated into different parts. In the background, ClickHouse merges data parts for more efficient storage. Parts belonging to different partitions are not merged. The merge mechanism does not guarantee that all rows with the same primary key will be in the same data part.
-
-For each data part, ClickHouse creates an index file that contains the primary key value for each index row ("mark"). Index row numbers are defined as `n * index_granularity`. The maximum value `n` is equal to the integer part of dividing the total number of rows by the `index_granularity`. For each column, the "marks" are also written for the same index rows as the primary key. These "marks" allow you to find the data directly in the columns.
-
-You can use a single large table and continually add data to it in small chunks – this is what the `MergeTree` engine is intended for.
-
-## Primary Keys and Indexes in Queries
-
-Let's take the `(CounterID, Date)` primary key. In this case, the sorting and index can be illustrated as follows:
-
-```
-Whole data:     [-------------------------------------------------------------------------]
-CounterID:      [aaaaaaaaaaaaaaaaaabbbbcdeeeeeeeeeeeeefgggggggghhhhhhhhhiiiiiiiiikllllllll]
-Date:           [1111111222222233331233211111222222333211111112122222223111112223311122333]
-Marks:           |      |      |      |      |      |      |      |      |      |      |
-                a,1    a,2    a,3    b,3    e,2    e,3    g,1    h,2    i,1    i,3    l,3
-Marks numbers:   0      1      2      3      4      5      6      7      8      9      10
-```
-
-If the data query specifies:
-
-- `CounterID in ('a', 'h')`, the server reads the data in the ranges of marks `[0, 3)` and `[6, 8)`.
-- `CounterID IN ('a', 'h') AND Date = 3`, the server reads the data in the ranges of marks `[1, 3)` and `[7, 8)`.
-- `Date = 3`, the server reads the data in the range of marks `[1, 10]`.
-
-The examples above show that it is always more effective to use an index than a full scan.
-
-A sparse index allows extra strings to be read. When reading a single range of the primary key, up to `index_granularity * 2` extra rows in each data block can be read. In most cases, ClickHouse performance does not degrade when `index_granularity = 8192`.
-
-Sparse indexes allow you to work with a very large number of table rows, because such indexes are always stored in the computer's RAM.
-
-ClickHouse does not require a unique primary key. You can insert multiple rows with the same primary key.
-
-### Selecting the Primary Key
-
-The number of columns in the primary key is not explicitly limited. Depending on the data structure, you can include more or fewer columns in the primary key. This may:
-
-- Improve the performance of an index.
-
-    If the primary key is `(a, b)`, then adding another column `c` will improve the performance if the following conditions are met:
-    - There are queries with a condition on column `c`.
-    - Long data ranges (several times longer than the `index_granularity`) with identical values for `(a, b)` are common. In other words, when adding another column allows you to skip quite long data ranges.
-
-- Improve data compression.
-
-    ClickHouse sorts data by primary key, so the higher the consistency, the better the compression.
-
-- Provide additional logic when data parts merging in the [CollapsingMergeTree](collapsingmergetree.md#table_engine-collapsingmergetree) and [SummingMergeTree](summingmergetree.md) engines.
-
-    In this case it makes sense to specify the *sorting key* that is different from the primary key.
-
-A long primary key will negatively affect the insert performance and memory consumption, but extra columns in the primary key do not affect ClickHouse performance during `SELECT` queries.
-
-
-### Choosing the Primary Key that differs from the Sorting Key
-
-It is possible to specify the primary key (the expression, values of which are written into the index file
-for each mark) that is different from the sorting key (the expression for sorting the rows in data parts).
-In this case the primary key expression tuple must be a prefix of the sorting key expression tuple.
-
-This feature is helpful when using the [SummingMergeTree](summingmergetree.md) and
-[AggregatingMergeTree](aggregatingmergetree.md) table engines. In a common case when using these engines the
-table has two types of columns: *dimensions* and *measures*. Typical queries aggregate values of measure
-columns with arbitrary `GROUP BY` and filtering by dimensions. As SummingMergeTree and AggregatingMergeTree
-aggregate rows with the same value of the sorting key, it is natural to add all dimensions to it. As a result
-the key expression consists of a long list of columns and this list must be frequently updated with newly
-added dimensions.
-
-In this case it makes sense to leave only a few columns in the primary key that will provide efficient
-range scans and add the remaining dimension columns to the sorting key tuple.
-
-[ALTER of the sorting key](../../query_language/alter.md) is a
-lightweight operation because when a new column is simultaneously added to the table and to the sorting key
-data parts need not be changed (they remain sorted by the new sorting key expression).
-
-### Use of Indexes and Partitions in Queries
-
-For`SELECT` queries, ClickHouse analyzes whether an index can be used. An index can be used if the `WHERE/PREWHERE` clause has an expression (as one of the conjunction elements, or entirely) that represents an equality or inequality comparison operation, or if it has `IN` or `LIKE` with a fixed prefix on columns or expressions that are in the primary key or partitioning key, or on certain partially repetitive functions of these columns, or logical relationships of these expressions.
-
-Thus, it is possible to quickly run queries on one or many ranges of the primary key. In this example, queries will be fast when run for a specific tracking tag; for a specific tag and date range; for a specific tag and date; for multiple tags with a date range, and so on.
-
-Let's look at the engine configured as follows:
-
-```
-ENGINE MergeTree() PARTITION BY toYYYYMM(EventDate) ORDER BY (CounterID, EventDate) SETTINGS index_granularity=8192
-```
-
-In this case, in queries:
-
-``` sql
-SELECT count() FROM table WHERE EventDate = toDate(now()) AND CounterID = 34
-SELECT count() FROM table WHERE EventDate = toDate(now()) AND (CounterID = 34 OR CounterID = 42)
-SELECT count() FROM table WHERE ((EventDate >= toDate('2014-01-01') AND EventDate <= toDate('2014-01-31')) OR EventDate = toDate('2014-05-01')) AND CounterID IN (101500, 731962, 160656) AND (CounterID = 101500 OR EventDate != toDate('2014-05-01'))
-```
-
-ClickHouse will use the primary key index to trim improper data and the monthly partitioning key to trim partitions that are in improper date ranges.
-
-The queries above show that the index is used even for complex expressions. Reading from the table is organized so that using the index can't be slower than a full scan.
-
-In the example below, the index can't be used.
-
-``` sql
-SELECT count() FROM table WHERE CounterID = 34 OR URL LIKE '%upyachka%'
-```
-
-To check whether ClickHouse can use the index when running a query, use the settings [force_index_by_date](../settings/settings.md#settings-force_index_by_date) and [force_primary_key](../settings/settings.md).
-
-The key for partitioning by month allows reading only those data blocks which contain dates from the proper range. In this case, the data block may contain data for many dates (up to an entire month). Within a block, data is sorted by primary key, which might not contain the date as the first column. Because of this, using a query with only a date condition that does not specify the primary key prefix will cause more data to be read than for a single date.
-
-## Concurrent Data Access
-
-For concurrent table access, we use multi-versioning. In other words, when a table is simultaneously read and updated, data is read from a set of parts that is current at the time of the query. There are no lengthy locks. Inserts do not get in the way of read operations.
-
-Reading from a table is automatically parallelized.
-
-
-[Original article](https://clickhouse.yandex/docs/en/operations/table_engines/mergetree/) <!--hide-->
diff --git a/docs/zh/operations/table_engines/mergetree.md b/docs/zh/operations/table_engines/mergetree.md
new file mode 120000
index 00000000000..cc6ac1e5297
--- /dev/null
+++ b/docs/zh/operations/table_engines/mergetree.md
@@ -0,0 +1 @@
+../../../en/operations/table_engines/mergetree.md
\ No newline at end of file

From a1ed5d8eae70cccde8935ee1b05a16a8a62f094c Mon Sep 17 00:00:00 2001
From: "Mikhail f. Shiryaev" <mr.felixoid@gmail.com>
Date: Wed, 20 Feb 2019 17:45:51 +0100
Subject: [PATCH 11/63] Apply pep8 to test_graphite_merge_tree

---
 .../test_graphite_merge_tree/test.py          | 102 +++++++++++-------
 1 file changed, 64 insertions(+), 38 deletions(-)

diff --git a/dbms/tests/integration/test_graphite_merge_tree/test.py b/dbms/tests/integration/test_graphite_merge_tree/test.py
index a2e7b5cc0f7..ff37be9371c 100644
--- a/dbms/tests/integration/test_graphite_merge_tree/test.py
+++ b/dbms/tests/integration/test_graphite_merge_tree/test.py
@@ -8,31 +8,38 @@ from helpers.test_tools import TSV
 
 
 cluster = ClickHouseCluster(__file__)
-instance = cluster.add_instance('instance', main_configs=['configs/graphite_rollup.xml'])
+instance = cluster.add_instance('instance',
+                                main_configs=['configs/graphite_rollup.xml'])
+q = instance.query
+
 
 @pytest.fixture(scope="module")
 def started_cluster():
     try:
         cluster.start()
-        instance.query('CREATE DATABASE test')
+        q('CREATE DATABASE test')
 
         yield cluster
 
     finally:
         cluster.shutdown()
 
+
 @pytest.fixture
 def graphite_table(started_cluster):
-    instance.query('''
+    q('''
 DROP TABLE IF EXISTS test.graphite;
 CREATE TABLE test.graphite
     (metric String, value Float64, timestamp UInt32, date Date, updated UInt32)
-    ENGINE = GraphiteMergeTree(date, (metric, timestamp), 8192, 'graphite_rollup');
+    ENGINE = GraphiteMergeTree('graphite_rollup')
+    PARTITION BY toYYYYMM(date)
+    ORDER BY (metric, timestamp)
+    SETTINGS index_granularity=8192;
 ''')
 
     yield
 
-    instance.query('DROP TABLE test.graphite')
+    q('DROP TABLE test.graphite')
 
 
 def test_rollup_versions(graphite_table):
@@ -40,13 +47,14 @@ def test_rollup_versions(graphite_table):
     rounded_timestamp = timestamp - timestamp % 60
     date = datetime.date.today().isoformat()
 
-    q = instance.query
-
-    # Insert rows with timestamps relative to the current time so that the first retention clause is active.
+    # Insert rows with timestamps relative to the current time so that the
+    # first retention clause is active.
     # Two parts are created.
     q('''
-INSERT INTO test.graphite (metric, value, timestamp, date, updated) VALUES ('one_min.x1', 100, {timestamp}, '{date}', 1);
-INSERT INTO test.graphite (metric, value, timestamp, date, updated) VALUES ('one_min.x1', 200, {timestamp}, '{date}', 2);
+INSERT INTO test.graphite (metric, value, timestamp, date, updated)
+      VALUES ('one_min.x1', 100, {timestamp}, '{date}', 1);
+INSERT INTO test.graphite (metric, value, timestamp, date, updated)
+      VALUES ('one_min.x1', 200, {timestamp}, '{date}', 2);
 '''.format(timestamp=timestamp, date=date))
 
     expected1 = '''\
@@ -54,7 +62,9 @@ one_min.x1	100	{timestamp}	{date}	1
 one_min.x1	200	{timestamp}	{date}	2
 '''.format(timestamp=timestamp, date=date)
 
-    assert TSV(q('SELECT * FROM test.graphite ORDER BY updated')) == TSV(expected1)
+    assert TSV(
+        q('SELECT * FROM test.graphite ORDER BY updated')
+    ) == TSV(expected1)
 
     q('OPTIMIZE TABLE test.graphite')
 
@@ -67,8 +77,6 @@ one_min.x1	200	{timestamp}	{date}	2
 
 
 def test_rollup_aggregation(graphite_table):
-    q = instance.query
-
     # This query essentially emulates what rollup does.
     result1 = q('''
 SELECT avg(v), max(upd)
@@ -91,7 +99,8 @@ FROM (SELECT timestamp,
 '''
     assert TSV(result1) == TSV(expected1)
 
-    # Timestamp 1111111111 is in sufficiently distant past so that the last retention clause is active.
+    # Timestamp 1111111111 is in sufficiently distant past
+    # so that the last retention clause is active.
     result2 = q('''
 INSERT INTO test.graphite
     SELECT 'one_min.x' AS metric,
@@ -114,7 +123,7 @@ one_min.x	999634.9918367347	1111444200	2017-02-02	499999
 
 
 def test_rollup_aggregation_2(graphite_table):
-    result = instance.query('''
+    result = q('''
 INSERT INTO test.graphite
     SELECT 'one_min.x' AS metric,
            toFloat64(number) AS value,
@@ -136,7 +145,7 @@ one_min.x	24	1111110600	2017-02-02	100
 
 
 def test_multiple_paths_and_versions(graphite_table):
-    result = instance.query('''
+    result = q('''
 INSERT INTO test.graphite
     SELECT 'one_min.x' AS metric,
            toFloat64(number) AS value,
@@ -163,7 +172,9 @@ OPTIMIZE TABLE test.graphite PARTITION 201702 FINAL;
 SELECT * FROM test.graphite;
 ''')
 
-    with open(p.join(p.dirname(__file__), 'test_multiple_paths_and_versions.reference')) as reference:
+    with open(p.join(p.dirname(__file__),
+                     'test_multiple_paths_and_versions.reference')
+              ) as reference:
         assert TSV(result) == TSV(reference)
 
 
@@ -177,14 +188,18 @@ def test_multiple_output_blocks(graphite_table):
 
         for j in range(3):
             cur_time = rolled_up_time + 100 * j
-            to_insert += 'one_min.x1	{}	{}	2001-09-09	1\n'.format(10 * j, cur_time)
-            to_insert += 'one_min.x1	{}	{}	2001-09-09	2\n'.format(10 * (j + 1), cur_time)
+            to_insert += 'one_min.x1	{}	{}	2001-09-09	1\n'.format(
+                10 * j, cur_time
+            )
+            to_insert += 'one_min.x1	{}	{}	2001-09-09	2\n'.format(
+                10 * (j + 1), cur_time
+            )
 
         expected += 'one_min.x1	20	{}	2001-09-09	2\n'.format(rolled_up_time)
 
-    instance.query('INSERT INTO test.graphite FORMAT TSV', to_insert)
+    q('INSERT INTO test.graphite FORMAT TSV', to_insert)
 
-    result = instance.query('''
+    result = q('''
 OPTIMIZE TABLE test.graphite PARTITION 200109 FINAL;
 
 SELECT * FROM test.graphite;
@@ -200,14 +215,14 @@ zzzzzzzz	100	1000000001	2001-09-09	1
 zzzzzzzz	200	1000000001	2001-09-09	2
 '''
 
-    instance.query('INSERT INTO test.graphite FORMAT TSV', to_insert)
+    q('INSERT INTO test.graphite FORMAT TSV', to_insert)
 
     expected = '''\
 one_min.x1	100	999999600	2001-09-09	1
 zzzzzzzz	200	1000000001	2001-09-09	2
 '''
 
-    result = instance.query('''
+    result = q('''
 OPTIMIZE TABLE test.graphite PARTITION 200109 FINAL;
 
 SELECT * FROM test.graphite;
@@ -215,27 +230,38 @@ SELECT * FROM test.graphite;
 
     assert TSV(result) == TSV(expected)
 
+
 def test_path_dangling_pointer(graphite_table):
-    instance.query('''
+    q('''
 DROP TABLE IF EXISTS test.graphite2;
 CREATE TABLE test.graphite2
-  (metric String, value Float64, timestamp UInt32, date Date, updated UInt32)
-  ENGINE = GraphiteMergeTree(date, (metric, timestamp), 1, 'graphite_rollup');
-  ''')
+    (metric String, value Float64, timestamp UInt32, date Date, updated UInt32)
+    ENGINE = GraphiteMergeTree('graphite_rollup')
+    PARTITION BY toYYYYMM(date)
+    ORDER BY (metric, timestamp)
+    SETTINGS index_granularity=1;
+    ''')
 
-    path = 'abcd' * 4000000 # 16MB
-    instance.query('INSERT INTO test.graphite2 FORMAT TSV', "{}\t0.0\t0\t2018-01-01\t100\n".format(path))
-    instance.query('INSERT INTO test.graphite2 FORMAT TSV', "{}\t0.0\t0\t2018-01-01\t101\n".format(path))
+    path = 'abcd' * 4000000  # 16MB
+    q('INSERT INTO test.graphite2 FORMAT TSV',
+      "{}\t0.0\t0\t2018-01-01\t100\n".format(path))
+    q('INSERT INTO test.graphite2 FORMAT TSV',
+      "{}\t0.0\t0\t2018-01-01\t101\n".format(path))
     for version in range(10):
-        instance.query('INSERT INTO test.graphite2 FORMAT TSV', "{}\t0.0\t0\t2018-01-01\t{}\n".format(path, version))
+        q('INSERT INTO test.graphite2 FORMAT TSV',
+          "{}\t0.0\t0\t2018-01-01\t{}\n".format(path, version))
 
     while True:
-      instance.query('OPTIMIZE TABLE test.graphite2 PARTITION 201801 FINAL')
-      parts = int(instance.query("SELECT count() FROM system.parts WHERE active AND database='test' AND table='graphite2'"))
-      if parts == 1:
-        break
-      print "Parts", parts
+        q('OPTIMIZE TABLE test.graphite2 PARTITION 201801 FINAL')
+        parts = int(q("SELECT count() FROM system.parts "
+                      "WHERE active AND database='test' "
+                      "AND table='graphite2'"))
+        if parts == 1:
+            break
+        print('Parts', parts)
 
-    assert TSV(instance.query("SELECT value, timestamp, date, updated FROM test.graphite2")) == TSV("0\t0\t2018-01-01\t101\n")
+    assert TSV(
+        q("SELECT value, timestamp, date, updated FROM test.graphite2")
+    ) == TSV("0\t0\t2018-01-01\t101\n")
 
-    instance.query('DROP TABLE test.graphite2')
\ No newline at end of file
+    q('DROP TABLE test.graphite2')

From 4cfe93a4d0df5e88f1f41e9a135092dbf2f90879 Mon Sep 17 00:00:00 2001
From: "Mikhail f. Shiryaev" <mr.felixoid@gmail.com>
Date: Thu, 21 Feb 2019 22:34:08 +0100
Subject: [PATCH 12/63] Add necessary integration tests

---
 .../configs/graphite_rollup.xml               |  72 ++++++++++
 .../test_graphite_merge_tree/test.py          | 133 ++++++++++++++++++
 2 files changed, 205 insertions(+)

diff --git a/dbms/tests/integration/test_graphite_merge_tree/configs/graphite_rollup.xml b/dbms/tests/integration/test_graphite_merge_tree/configs/graphite_rollup.xml
index 1390d151731..6d1907f3da7 100644
--- a/dbms/tests/integration/test_graphite_merge_tree/configs/graphite_rollup.xml
+++ b/dbms/tests/integration/test_graphite_merge_tree/configs/graphite_rollup.xml
@@ -5,6 +5,29 @@
         <time_column_name>timestamp</time_column_name>
         <value_column_name>value</value_column_name>
         <version_column_name>updated</version_column_name>
+        <pattern>
+            <regexp>\.count$</regexp>
+            <function>sum</function>
+        </pattern>
+        <pattern>
+            <regexp>\.max$</regexp>
+            <function>max</function>
+        </pattern>
+        <pattern>
+          <regexp>^five_min\.</regexp>
+          <retention>
+              <age>0</age>
+              <precision>300</precision>
+          </retention>
+          <retention>
+              <age>5184000</age>
+              <precision>3600</precision>
+          </retention>
+          <retention>
+              <age>31536000</age>
+              <precision>14400</precision>
+          </retention>
+        </pattern>
         <pattern>
             <regexp>^one_min</regexp>
             <function>avg</function>
@@ -22,4 +45,53 @@
             </retention>
         </pattern>
     </graphite_rollup>
+    <graphite_rollup_with_default>
+        <path_column_name>metric</path_column_name>
+        <time_column_name>timestamp</time_column_name>
+        <value_column_name>value</value_column_name>
+        <version_column_name>updated</version_column_name>
+        <pattern>
+            <regexp>\.count$</regexp>
+            <function>sum</function>
+        </pattern>
+        <pattern>
+            <regexp>\.max$</regexp>
+            <function>max</function>
+        </pattern>
+        <default>
+            <function>any</function>
+            <retention>
+                <age>0</age>
+                <precision>60</precision>
+            </retention>
+            <retention>
+                <age>7776000</age>
+                <precision>300</precision>
+            </retention>
+            <retention>
+                <age>31536000</age>
+                <precision>600</precision>
+            </retention>
+        </default>
+    </graphite_rollup_with_default>
+    <graphite_rollup_broken>
+        <path_column_name>metric</path_column_name>
+        <time_column_name>timestamp</time_column_name>
+        <value_column_name>value</value_column_name>
+        <version_column_name>updated</version_column_name>
+        <default>
+            <retention>
+                <age>0</age>
+                <precision>60</precision>
+            </retention>
+            <retention>
+                <age>7776000</age>
+                <precision>300</precision>
+            </retention>
+            <retention>
+                <age>31536000</age>
+                <precision>600</precision>
+            </retention>
+        </default>
+    </graphite_rollup_broken>
 </yandex>
diff --git a/dbms/tests/integration/test_graphite_merge_tree/test.py b/dbms/tests/integration/test_graphite_merge_tree/test.py
index ff37be9371c..8e98c97e077 100644
--- a/dbms/tests/integration/test_graphite_merge_tree/test.py
+++ b/dbms/tests/integration/test_graphite_merge_tree/test.py
@@ -265,3 +265,136 @@ CREATE TABLE test.graphite2
     ) == TSV("0\t0\t2018-01-01\t101\n")
 
     q('DROP TABLE test.graphite2')
+
+
+def test_combined_rules(graphite_table):
+    # 1487970000 ~ Sat 25 Feb 00:00:00 MSK 2017
+    to_insert = 'INSERT INTO test.graphite VALUES '
+    expected_unmerged = ''
+    for i in range(384):
+        to_insert += "('five_min.count', {v}, {t}, toDate({t}), 1), ".format(
+            v=1, t=1487970000+(i*300)
+        )
+        to_insert += "('five_min.max', {v}, {t}, toDate({t}), 1), ".format(
+            v=i, t=1487970000+(i*300)
+        )
+        expected_unmerged += ("five_min.count\t{v1}\t{t}\n"
+                              "five_min.max\t{v2}\t{t}\n").format(
+                                  v1=1, v2=i,
+                                  t=1487970000+(i*300)
+                              )
+
+    q(to_insert)
+    assert TSV(q('SELECT metric, value, timestamp FROM test.graphite'
+               ' ORDER BY (timestamp, metric)')) == TSV(expected_unmerged)
+
+    q('OPTIMIZE TABLE test.graphite PARTITION 201702 FINAL')
+    expected_merged = '''
+        five_min.count	48	1487970000	2017-02-25	1
+        five_min.count	48	1487984400	2017-02-25	1
+        five_min.count	48	1487998800	2017-02-25	1
+        five_min.count	48	1488013200	2017-02-25	1
+        five_min.count	48	1488027600	2017-02-25	1
+        five_min.count	48	1488042000	2017-02-25	1
+        five_min.count	48	1488056400	2017-02-26	1
+        five_min.count	48	1488070800	2017-02-26	1
+        five_min.max	47	1487970000	2017-02-25	1
+        five_min.max	95	1487984400	2017-02-25	1
+        five_min.max	143	1487998800	2017-02-25	1
+        five_min.max	191	1488013200	2017-02-25	1
+        five_min.max	239	1488027600	2017-02-25	1
+        five_min.max	287	1488042000	2017-02-25	1
+        five_min.max	335	1488056400	2017-02-26	1
+        five_min.max	383	1488070800	2017-02-26	1
+    '''
+    assert TSV(q('SELECT * FROM test.graphite'
+                 ' ORDER BY (metric, timestamp)')) == TSV(expected_merged)
+
+
+def test_combined_rules_with_default(graphite_table):
+    q('''
+DROP TABLE IF EXISTS test.graphite;
+CREATE TABLE test.graphite
+    (metric String, value Float64, timestamp UInt32, date Date, updated UInt32)
+    ENGINE = GraphiteMergeTree('graphite_rollup_with_default')
+    PARTITION BY toYYYYMM(date)
+    ORDER BY (metric, timestamp)
+    SETTINGS index_granularity=1;
+      ''')
+    # 1487970000 ~ Sat 25 Feb 00:00:00 MSK 2017
+    to_insert = 'INSERT INTO test.graphite VALUES '
+    expected_unmerged = ''
+    for i in range(100):
+        to_insert += "('top_level.count', {v}, {t}, toDate({t}), 1), ".format(
+            v=1, t=1487970000+(i*60)
+        )
+        to_insert += "('top_level.max', {v}, {t}, toDate({t}), 1), ".format(
+            v=i, t=1487970000+(i*60)
+        )
+        expected_unmerged += ("top_level.count\t{v1}\t{t}\n"
+                              "top_level.max\t{v2}\t{t}\n").format(
+                                  v1=1, v2=i,
+                                  t=1487970000+(i*60)
+                              )
+
+    q(to_insert)
+    assert TSV(q('SELECT metric, value, timestamp FROM test.graphite'
+                 ' ORDER BY (timestamp, metric)')) == TSV(expected_unmerged)
+
+    q('OPTIMIZE TABLE test.graphite PARTITION 201702 FINAL')
+    expected_merged = '''
+        top_level.count	10	1487970000	2017-02-25	1
+        top_level.count	10	1487970600	2017-02-25	1
+        top_level.count	10	1487971200	2017-02-25	1
+        top_level.count	10	1487971800	2017-02-25	1
+        top_level.count	10	1487972400	2017-02-25	1
+        top_level.count	10	1487973000	2017-02-25	1
+        top_level.count	10	1487973600	2017-02-25	1
+        top_level.count	10	1487974200	2017-02-25	1
+        top_level.count	10	1487974800	2017-02-25	1
+        top_level.count	10	1487975400	2017-02-25	1
+        top_level.max	9	1487970000	2017-02-25	1
+        top_level.max	19	1487970600	2017-02-25	1
+        top_level.max	29	1487971200	2017-02-25	1
+        top_level.max	39	1487971800	2017-02-25	1
+        top_level.max	49	1487972400	2017-02-25	1
+        top_level.max	59	1487973000	2017-02-25	1
+        top_level.max	69	1487973600	2017-02-25	1
+        top_level.max	79	1487974200	2017-02-25	1
+        top_level.max	89	1487974800	2017-02-25	1
+        top_level.max	99	1487975400	2017-02-25	1
+    '''
+    assert TSV(q('SELECT * FROM test.graphite'
+                 ' ORDER BY (metric, timestamp)')) == TSV(expected_merged)
+
+
+def test_broken_partial_rollup(graphite_table):
+    q('''
+DROP TABLE IF EXISTS test.graphite;
+CREATE TABLE test.graphite
+    (metric String, value Float64, timestamp UInt32, date Date, updated UInt32)
+    ENGINE = GraphiteMergeTree('graphite_rollup_broken')
+    PARTITION BY toYYYYMM(date)
+    ORDER BY (metric, timestamp)
+    SETTINGS index_granularity=1;
+      ''')
+    to_insert = '''\
+one_min.x1	100	1000000000	2001-09-09	1
+zzzzzzzz	100	1000000001	2001-09-09	1
+zzzzzzzz	200	1000000001	2001-09-09	2
+'''
+
+    q('INSERT INTO test.graphite FORMAT TSV', to_insert)
+
+    expected = '''\
+one_min.x1	100	1000000000	2001-09-09	1
+zzzzzzzz	200	1000000001	2001-09-09	2
+'''
+
+    result = q('''
+OPTIMIZE TABLE test.graphite PARTITION 200109 FINAL;
+
+SELECT * FROM test.graphite;
+''')
+
+    assert TSV(result) == TSV(expected)

From e79235f93257cf08be11f8a128e5fa48c4876933 Mon Sep 17 00:00:00 2001
From: "Mikhail f. Shiryaev" <mr.felixoid@gmail.com>
Date: Thu, 28 Feb 2019 09:52:33 +0100
Subject: [PATCH 13/63] Fix typo in parameter name

---
 docs/ru/operations/table_engines/graphitemergetree.md | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/docs/ru/operations/table_engines/graphitemergetree.md b/docs/ru/operations/table_engines/graphitemergetree.md
index 9c9afc9c9a6..37420f317cd 100644
--- a/docs/ru/operations/table_engines/graphitemergetree.md
+++ b/docs/ru/operations/table_engines/graphitemergetree.md
@@ -100,7 +100,7 @@ default
 
 При обработке строки ClickHouse проверяет правила в разделах `pattern`. Каждый из разделов `pattern` может содержать параметр `function` для аггрегации, правила `retention` для прореживания или оба эти параметра. Если имя метрики соответствует шаблону `regexp`, то применяются правила из раздела (или разделов) `pattern`, в противном случае из раздела `default`.
 
-Поля для разделов `pattenrn` и `default`:
+Поля для разделов `pattern` и `default`:
 
 - `regexp` – шаблон имени метрики.
 - `age` – минимальный возраст данных в секундах.

From 3dac4f018b22614093170f644235e9bc52062c59 Mon Sep 17 00:00:00 2001
From: BayoNet <da-daos@yandex.ru>
Date: Thu, 28 Feb 2019 12:06:10 +0300
Subject: [PATCH 14/63] DOCAPI-5441: The tcp_port_secure setting description is
 added.

---
 docs/en/operations/server_settings/settings.md     | 14 ++++++++++++--
 docs/en/operations/troubleshooting.md              |  4 ++--
 .../dicts/external_dicts_dict_sources.md           |  2 +-
 docs/en/query_language/table_functions/remote.md   |  2 +-
 4 files changed, 16 insertions(+), 6 deletions(-)

diff --git a/docs/en/operations/server_settings/settings.md b/docs/en/operations/server_settings/settings.md
index f339fb6ce28..be1b35f038b 100644
--- a/docs/en/operations/server_settings/settings.md
+++ b/docs/en/operations/server_settings/settings.md
@@ -196,7 +196,7 @@ For more details, see [GraphiteMergeTree](../../operations/table_engines/graphit
 
 The port for connecting to the server over HTTP(s).
 
-If `https_port` is specified, [openSSL](#openssl) must be configured.
+If `https_port` is specified, [openSSL](#server_settings-openssl) must be configured.
 
 If `http_port` is specified, the openSSL configuration is ignored even if it is set.
 
@@ -430,7 +430,7 @@ For more information, see the MergeTreeSettings.h header file.
 ```
 
 
-## openSSL
+## openSSL {#server_settings-openssl}
 
 SSL client/server configuration.
 
@@ -609,6 +609,16 @@ Port for communicating with clients over the TCP protocol.
 <tcp_port>9000</tcp_port>
 ```
 
+## tcp_port_secure {#server_settings-tcp_port_secure}
+
+Port for communicating with clients over the secure connection by TCP protocol. Use it with [OpenSSL](#server_settings-openssl) settings.
+
+**Example**
+
+```xml
+<tcp_port>9440</tcp_port>
+```
+
 
 ## tmp_path
 
diff --git a/docs/en/operations/troubleshooting.md b/docs/en/operations/troubleshooting.md
index 445cd67bb7c..fdfff6b26b2 100644
--- a/docs/en/operations/troubleshooting.md
+++ b/docs/en/operations/troubleshooting.md
@@ -111,8 +111,8 @@ Check:
 
     Check:
 
-    - The `tcp_port_secure` setting.
-    - Settings for SSL sertificates.
+    - The [tcp_port_secure](server_settings/settings.md#server_settings-tcp_port_secure) setting.
+    - Settings for [SSL certificates](server_settings/settings.md#server_settings-openssl).
 
      Use proper parameters while connecting. For example, use the `port_secure` parameter with `clickhouse_client`.
 
diff --git a/docs/en/query_language/dicts/external_dicts_dict_sources.md b/docs/en/query_language/dicts/external_dicts_dict_sources.md
index f26967c2d0f..8fb2145ecaf 100644
--- a/docs/en/query_language/dicts/external_dicts_dict_sources.md
+++ b/docs/en/query_language/dicts/external_dicts_dict_sources.md
@@ -88,7 +88,7 @@ Example of settings:
 </source>
 ```
 
-In order for ClickHouse to access an HTTPS resource, you must [configure openSSL](../../operations/server_settings/settings.md) in the server configuration.
+In order for ClickHouse to access an HTTPS resource, you must [configure openSSL](../../operations/server_settings/settings.md#server_settings-openssl) in the server configuration.
 
 Setting fields:
 
diff --git a/docs/en/query_language/table_functions/remote.md b/docs/en/query_language/table_functions/remote.md
index 06d9876f1c7..3b9263d959c 100644
--- a/docs/en/query_language/table_functions/remote.md
+++ b/docs/en/query_language/table_functions/remote.md
@@ -72,6 +72,6 @@ The `remote` table function can be useful in the following cases:
 If the user is not specified, `default` is used.
 If the password is not specified, an empty password is used.
 
-`remoteSecure` - same as `remote` but with secured connection. Default port - `tcp_port_secure` from config or 9440.
+`remoteSecure` - same as `remote` but with secured connection. Default port — [tcp_port_secure](../../operations/server_settings/settings.md#server_settings-tcp_port_secure) from config or 9440.
 
 [Original article](https://clickhouse.yandex/docs/en/query_language/table_functions/remote/) <!--hide-->

From ae8e84c532f2dd536498e7b57772a36c704af5e7 Mon Sep 17 00:00:00 2001
From: "Mikhail f. Shiryaev" <mr.felixoid@gmail.com>
Date: Thu, 28 Feb 2019 10:44:30 +0100
Subject: [PATCH 15/63] Add note about patterns order to docs

---
 docs/en/operations/table_engines/graphitemergetree.md | 9 ++++++++-
 docs/ru/operations/table_engines/graphitemergetree.md | 8 +++++++-
 2 files changed, 15 insertions(+), 2 deletions(-)

diff --git a/docs/en/operations/table_engines/graphitemergetree.md b/docs/en/operations/table_engines/graphitemergetree.md
index 4231fb00f43..cd0e17652ae 100644
--- a/docs/en/operations/table_engines/graphitemergetree.md
+++ b/docs/en/operations/table_engines/graphitemergetree.md
@@ -95,7 +95,14 @@ default
     ...
 ```
 
-When processing a row, ClickHouse checks the rules in the `pattern` sections. Each of `pattern` sections could contain `function` parameter for aggregation, `retention` parameters or both. If the metric name matches the `regexp`, the rules from the `pattern` section (or sections) are applied; otherwise, the rules from the `default` section are used.
+**Important:** Patterns should be listed in the following order:
+
+1. Patterns *without* `function` *or* `retention`.
+1. Patterns *with* both `function` *and* `retention`.
+1. Pattern `default`.
+
+
+When processing a row, ClickHouse checks the rules in the `pattern` sections. Each `pattern` section (including `default`) can contain a `function` parameter for aggregation, `retention` parameters, or both. If the metric name matches the `regexp`, the rules from the `pattern` section (or sections) are applied; otherwise, the rules from the `default` section are used.
 
 Fields for `pattern` and `default` sections:
 
diff --git a/docs/ru/operations/table_engines/graphitemergetree.md b/docs/ru/operations/table_engines/graphitemergetree.md
index 37420f317cd..169df60b0d3 100644
--- a/docs/ru/operations/table_engines/graphitemergetree.md
+++ b/docs/ru/operations/table_engines/graphitemergetree.md
@@ -98,7 +98,13 @@ default
     ...
 ```
 
-При обработке строки ClickHouse проверяет правила в разделах `pattern`. Каждый из разделов `pattern` может содержать параметр `function` для аггрегации, правила `retention` для прореживания или оба эти параметра. Если имя метрики соответствует шаблону `regexp`, то применяются правила из раздела (или разделов) `pattern`, в противном случае из раздела `default`.
+**Важно**: порядок разделов `pattern` должен быть следующим:
+
+1. Разделы *без* параметра `function` *или* `retention`.
+1. Разделы *с* параметрами `function` *и* `retention`.
+1. Раздел `default`.
+
+При обработке строки ClickHouse проверяет правила в разделах `pattern`. Каждый из разделов `pattern` (включая `default`) может содержать параметр `function` для аггрегации, правила `retention` для прореживания или оба эти параметра. Если имя метрики соответствует шаблону `regexp`, то применяются правила из раздела (или разделов) `pattern`, в противном случае из раздела `default`.
 
 Поля для разделов `pattern` и `default`:
 

From 455ca955e569b5e6a23605c828a90686f1ca4567 Mon Sep 17 00:00:00 2001
From: BayoNet <da-daos@yandex.ru>
Date: Thu, 28 Feb 2019 14:20:27 +0300
Subject: [PATCH 16/63] DOCAPI-5203: Added the descriptions for direct I/O
 settings for MergeTree merge and SELECT queries.

---
 dbms/src/Interpreters/Settings.h              |  2 +-
 .../en/operations/server_settings/settings.md |  2 +-
 docs/en/operations/settings/settings.md       | 28 +++++++++++++++++++
 3 files changed, 30 insertions(+), 2 deletions(-)

diff --git a/dbms/src/Interpreters/Settings.h b/dbms/src/Interpreters/Settings.h
index 42e60a2353e..0b0f630b49f 100644
--- a/dbms/src/Interpreters/Settings.h
+++ b/dbms/src/Interpreters/Settings.h
@@ -103,7 +103,7 @@ struct Settings
     \
     M(SettingUInt64, optimize_min_equality_disjunction_chain_length, 3, "The minimum length of the expression `expr = x1 OR ... expr = xN` for optimization ") \
     \
-    M(SettingUInt64, min_bytes_to_use_direct_io, 0, "The minimum number of bytes for input/output operations is bypassing the page cache. 0 - disabled.") \
+    M(SettingUInt64, min_bytes_to_use_direct_io, 0, "The minimum number of bytes for reading the data with O_DIRECT option during SELECT queries execution. 0 - disabled.") \
     \
     M(SettingBool, force_index_by_date, 0, "Throw an exception if there is a partition key in a table, and it is not used.") \
     M(SettingBool, force_primary_key, 0, "Throw an exception if there is primary key in a table, and it is not used.") \
diff --git a/docs/en/operations/server_settings/settings.md b/docs/en/operations/server_settings/settings.md
index f339fb6ce28..db09323bab9 100644
--- a/docs/en/operations/server_settings/settings.md
+++ b/docs/en/operations/server_settings/settings.md
@@ -417,7 +417,7 @@ The value 0 means that you can delete all tables without any restrictions.
 
 ## merge_tree {#server_settings-merge_tree}
 
-Fine tuning for tables in the [ MergeTree](../../operations/table_engines/mergetree.md).
+Fine tuning for tables in the [MergeTree](../../operations/table_engines/mergetree.md).
 
 For more information, see the MergeTreeSettings.h header file.
 
diff --git a/docs/en/operations/settings/settings.md b/docs/en/operations/settings/settings.md
index e30758fc943..2fa8f37e404 100644
--- a/docs/en/operations/settings/settings.md
+++ b/docs/en/operations/settings/settings.md
@@ -175,6 +175,34 @@ Any positive integer.
 
 **Default value**: 1048576.
 
+## min_merge_bytes_to_use_direct_io {#settings-min_merge_bytes_to_use_direct_io}
+
+The threshold for using direct I/O interface of the storage disk.
+
+ClickHouse uses this setting when merging data parts of the [MergeTree](../table_engines/mergetree.md)-family tables. During the merge, ClickHouse calculates summary storage volume of all the data to be merged. If the volume exceeds `min_merge_bytes_to_use_direct_io` bytes, than ClickHouse reads and writes the data using direct I/O interface (`O_DIRECT` option) to the storage disk.
+
+**Possible values**
+
+Positive integer.
+
+0 — The direct I/O is disabled.
+
+**Default value**: `10 * 1024 * 1024 * 1024` bytes.
+
+## min_bytes_to_use_direct_io {#settings-min_bytes_to_use_direct_io}
+
+The threshold for using direct I/O interface of the storage disk.
+
+ClickHouse uses this setting when selecting the data from tables. If summary storage volume of all the data to be read exceeds `min_bytes_to_use_direct_io` bytes, than ClickHouse reads the data from the storage disk directly with `O_DIRECT` option.
+
+**Possible values**
+
+Positive integer.
+
+0 — The direct I/O is disabled.
+
+**Default value**: 0.
+
 ## log_queries
 
 Setting up query logging.

From 0613cd26bcec37389bc8bd0b871f269de332fa48 Mon Sep 17 00:00:00 2001
From: BayoNet <da-daos@yandex.ru>
Date: Thu, 28 Feb 2019 19:53:11 +0300
Subject: [PATCH 17/63] DOCAPI-5441. Some restructurization for
 tcp_port_secure.

---
 docs/en/operations/server_settings/settings.md | 9 ++++++---
 1 file changed, 6 insertions(+), 3 deletions(-)

diff --git a/docs/en/operations/server_settings/settings.md b/docs/en/operations/server_settings/settings.md
index be1b35f038b..952aae6979a 100644
--- a/docs/en/operations/server_settings/settings.md
+++ b/docs/en/operations/server_settings/settings.md
@@ -613,13 +613,16 @@ Port for communicating with clients over the TCP protocol.
 
 Port for communicating with clients over the secure connection by TCP protocol. Use it with [OpenSSL](#server_settings-openssl) settings.
 
-**Example**
+**Possible values**
+
+Positive integer.
+
+**Default value**
 
 ```xml
-<tcp_port>9440</tcp_port>
+<tcp_port_secure>9440</tcp_port_secure>
 ```
 
-
 ## tmp_path
 
 Path to temporary data for processing large queries.

From 47c82b6c08ddfc5af6ec2e64134928a7c9d6ccfc Mon Sep 17 00:00:00 2001
From: BayoNet <da-daos@yandex.ru>
Date: Mon, 4 Mar 2019 17:01:07 +0300
Subject: [PATCH 18/63] DOCAPI-5441: tcp_port_secure topic fix.

---
 docs/en/operations/server_settings/settings.md | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/docs/en/operations/server_settings/settings.md b/docs/en/operations/server_settings/settings.md
index 952aae6979a..d21b0379a90 100644
--- a/docs/en/operations/server_settings/settings.md
+++ b/docs/en/operations/server_settings/settings.md
@@ -611,7 +611,7 @@ Port for communicating with clients over the TCP protocol.
 
 ## tcp_port_secure {#server_settings-tcp_port_secure}
 
-Port for communicating with clients over the secure connection by TCP protocol. Use it with [OpenSSL](#server_settings-openssl) settings.
+TCP port for secure communication with clients. Use it with [OpenSSL](#server_settings-openssl) settings.
 
 **Possible values**
 

From 646ba6726f3b5c48fe1065a61f8e31d21342b836 Mon Sep 17 00:00:00 2001
From: BayoNet <da-daos@yandex.ru>
Date: Mon, 4 Mar 2019 17:37:56 +0300
Subject: [PATCH 19/63] DOCAPI-5203: Clarification of direct I/O settings
 descriptions.

---
 docs/en/operations/settings/settings.md | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/docs/en/operations/settings/settings.md b/docs/en/operations/settings/settings.md
index 2fa8f37e404..ff31b267d1d 100644
--- a/docs/en/operations/settings/settings.md
+++ b/docs/en/operations/settings/settings.md
@@ -177,7 +177,7 @@ Any positive integer.
 
 ## min_merge_bytes_to_use_direct_io {#settings-min_merge_bytes_to_use_direct_io}
 
-The threshold for using direct I/O interface of the storage disk.
+The minimum data volume for a merge operation that is required to use direct I/O access to the storage disk.
 
 ClickHouse uses this setting when merging data parts of the [MergeTree](../table_engines/mergetree.md)-family tables. During the merge, ClickHouse calculates summary storage volume of all the data to be merged. If the volume exceeds `min_merge_bytes_to_use_direct_io` bytes, than ClickHouse reads and writes the data using direct I/O interface (`O_DIRECT` option) to the storage disk.
 
@@ -191,9 +191,9 @@ Positive integer.
 
 ## min_bytes_to_use_direct_io {#settings-min_bytes_to_use_direct_io}
 
-The threshold for using direct I/O interface of the storage disk.
+The minimum data volume to be read from storage that is required to use direct I/O access to the storage disk.
 
-ClickHouse uses this setting when selecting the data from tables. If summary storage volume of all the data to be read exceeds `min_bytes_to_use_direct_io` bytes, than ClickHouse reads the data from the storage disk directly with `O_DIRECT` option.
+ClickHouse uses this setting when selecting the data from tables. If the total storage volume of all the data to be read exceeds `min_bytes_to_use_direct_io` bytes, then ClickHouse reads the data from the storage disk with the `O_DIRECT` option.
 
 **Possible values**
 

From fe6c988c5543a6813a3403b44078d0b4da3772fd Mon Sep 17 00:00:00 2001
From: ogorbacheva <ogorbacheva@yandex-team.ru>
Date: Mon, 4 Mar 2019 17:52:12 +0300
Subject: [PATCH 20/63] Doc fixes

---
 docs/en/operations/backup.md                  |  4 +-
 docs/ru/interfaces/formats.md                 | 44 +++++++++----------
 docs/ru/operations/settings/settings.md       |  2 +-
 .../table_engines/collapsingmergetree.md      |  2 +-
 .../operations/table_engines/replication.md   |  2 +-
 5 files changed, 26 insertions(+), 28 deletions(-)

diff --git a/docs/en/operations/backup.md b/docs/en/operations/backup.md
index fddcaba78f7..f9b0d134815 100644
--- a/docs/en/operations/backup.md
+++ b/docs/en/operations/backup.md
@@ -1,6 +1,6 @@
 # Data Backup 
 
-While [replication](table_engines/replication.md#table_engines-replication) provides protection from hardware failures, it does not protect against human errors: accidentally deleting data, deleting the wrong table or on the wrong cluster, software bugs leading to incorrect data processing or data corruption. In many cases commands like these will affect all replicas. ClickHouse has built-in safeguards to prevent some of mistakes, for example by default [you can't just drop tables with MergeTree-like engine containing more than 50Gb of data](https://github.com/yandex/ClickHouse/blob/v18.14.18-stable/dbms/programs/server/config.xml), but they don't cover all possible cases and can be circumvented.
+While [replication](table_engines/replication.md) provides protection from hardware failures, it does not protect against human errors: accidentally deleting data, deleting the wrong table or on the wrong cluster, software bugs leading to incorrect data processing or data corruption. In many cases commands like these will affect all replicas. ClickHouse has built-in safeguards to prevent some types of mistakes, for example, by default [you can't just drop tables with a MergeTree-like engine containing more than 50Gb of data](https://github.com/yandex/ClickHouse/blob/v18.14.18-stable/dbms/programs/server/config.xml), but they don't cover all possible cases and can be circumvented.
 
 So in order to effectively mitigate possible human errors, you should carefully prepare your backup and restore strategy **in advance**. 
 
@@ -35,4 +35,4 @@ There's a third-party tool to automate this approach: [clickhouse-backup](https:
 
 [Console client](../interfaces/cli.md) can be used to run queries like `SELECT * FROM my_table;` to dump the tables into files using any of the [supported serialization formats](../interfaces/formats.md#formats). Though if you are using ClickHouse as intended and have large enough volumes of data, this will hardly be practical.
 
-[Original article](https://clickhouse.yandex/docs/en/operations/access_rights/) <!--hide-->
\ No newline at end of file
+[Original article](https://clickhouse.yandex/docs/en/operations/backup/) <!--hide-->
diff --git a/docs/ru/interfaces/formats.md b/docs/ru/interfaces/formats.md
index 303ed85cd73..e345ef651d3 100644
--- a/docs/ru/interfaces/formats.md
+++ b/docs/ru/interfaces/formats.md
@@ -14,7 +14,6 @@ ClickHouse может принимать (`INSERT`) и отдавать (`SELECT
 [CSVWithNames](#csvwithnames) | ✔ | ✔ |
 [Values](#values) | ✔ | ✔ |
 [Vertical](#vertical) | ✗ | ✔ |
-[VerticalRaw](#verticalraw) | ✗ | ✔ |
 [JSON](#json) | ✗ | ✔ |
 [JSONCompact](#jsoncompact) | ✗ | ✔ |
 [JSONEachRow](#jsoneachrow) | ✔ | ✔ |
@@ -353,10 +352,22 @@ SELECT * FROM t_null
 └───┴──────┘
 ```
 
+В форматах `Pretty*` строки выводятся без экранирования. Ниже приведен пример для формата [PrettyCompact](#prettycompact):
+
+``` sql
+SELECT 'String with \'quotes\' and \t character' AS Escaping_test
+```
+
+``` 
+┌─Escaping_test────────────────────────┐
+│ String with 'quotes' and 	 character │
+└──────────────────────────────────────┘
+```
+
 Для защиты от вываливания слишком большого количества данных в терминал, выводится только первые 10 000 строк. Если строк больше или равно 10 000, то будет написано "Showed first 10 000."
 Этот формат подходит только для вывода результата выполнения запроса, но не для парсинга (приёма данных для вставки в таблицу).
 
-Формат Pretty поддерживает вывод тотальных значений (при использовании WITH TOTALS) и экстремальных значений (при настройке extremes выставленной в 1). В этих случаях, после основных данных выводятся тотальные значения, и экстремальные значения, в отдельных табличках. Пример (показан для формата PrettyCompact):
+Формат `Pretty` поддерживает вывод тотальных значений (при использовании WITH TOTALS) и экстремальных значений (при настройке extremes выставленной в 1). В этих случаях, после основных данных выводятся тотальные значения, и экстремальные значения, в отдельных табличках. Пример (показан для формата [PrettyCompact](#prettycompact)):
 
 ``` sql
 SELECT EventDate, count() AS c FROM test.hits GROUP BY EventDate WITH TOTALS ORDER BY EventDate FORMAT PrettyCompact
@@ -387,7 +398,7 @@ Extremes:
 
 ## PrettyCompact {#prettycompact}
 
-Отличается от `Pretty` тем, что не рисуется сетка между строками - результат более компактный.
+Отличается от [Pretty](#pretty) тем, что не рисуется сетка между строками - результат более компактный.
 Этот формат используется по умолчанию в клиенте командной строки в интерактивном режиме.
 
 ## PrettyCompactMonoBlock {#prettycompactmonoblock}
@@ -432,6 +443,7 @@ FixedString представлены просто как последовате
 Array представлены как длина в формате varint (unsigned [LEB128](https://en.wikipedia.org/wiki/LEB128)), а затем элементы массива, подряд.
 
 Для поддержки [NULL](../query_language/syntax.md#null-literal) перед каждым значением типа [Nullable](../data_types/nullable.md
+
 ## Values
 
 Выводит каждую строку в скобках. Строки разделены запятыми. После последней строки запятой нет. Значения внутри скобок также разделены запятыми. Числа выводятся в десятичном виде без кавычек. Массивы выводятся в квадратных скобках. Строки, даты, даты-с-временем выводятся в кавычках. Правила экранирования и особенности парсинга аналогичны формату [TabSeparated](#tabseparated). При форматировании, лишние пробелы не ставятся, а при парсинге - допустимы и пропускаются (за исключением пробелов внутри значений типа массив, которые недопустимы). [NULL](../query_language/syntax.md) представляется как `NULL`.
@@ -458,34 +470,20 @@ x: 1
 y: ᴺᵁᴸᴸ
 ```
 
-Этот формат подходит только для вывода результата выполнения запроса, но не для парсинга (приёма данных для вставки в таблицу).
+В формате `Vertical` строки выводятся без экранирования. Например:
 
-## VerticalRaw {#verticalraw}
-
-Отличается от формата `Vertical` тем, что строки выводятся без экранирования.
-Этот формат подходит только для вывода результата выполнения запроса, но не для парсинга (приёма данных для вставки в таблицу).
-
-Примеры:
+``` sql
+SELECT 'string with \'quotes\' and \t with some special \n characters' AS test FORMAT Vertical
 ```
-:) SHOW CREATE TABLE geonames FORMAT VerticalRaw;
-Row 1:
-──────
-statement: CREATE TABLE default.geonames ( geonameid UInt32, date Date DEFAULT CAST('2017-12-08' AS Date)) ENGINE = MergeTree(date, geonameid, 8192)
 
-:) SELECT 'string with \'quotes\' and \t with some special \n characters' AS test FORMAT VerticalRaw;
+```
 Row 1:
 ──────
-test: string with 'quotes' and   with some special
+test: string with 'quotes' and 	 with some special
  characters
 ```
 
-Для сравнения - формат Vertical:
-```
-:) SELECT 'string with \'quotes\' and \t with some special \n characters' AS test FORMAT Vertical;
-Row 1:
-──────
-test: string with \'quotes\' and \t with some special \n characters
-```
+Этот формат подходит только для вывода результата выполнения запроса, но не для парсинга (приёма данных для вставки в таблицу).
 
 ## XML {#xml}
 
diff --git a/docs/ru/operations/settings/settings.md b/docs/ru/operations/settings/settings.md
index ed1395a1aaf..c174507859b 100644
--- a/docs/ru/operations/settings/settings.md
+++ b/docs/ru/operations/settings/settings.md
@@ -118,7 +118,7 @@ ClickHouse применяет настройку в тех случаях, ко
 
 Это намного больше, чем `max_block_size`. Это сделано, потому что некоторые движки таблиц (`*MergeTree`) будут на каждый вставляемый блок формировать кусок данных на диске, что является довольно большой сущностью. Также, в таблицах типа `*MergeTree`, данные сортируются при вставке, и достаточно большой размер блока позволяет отсортировать больше данных в оперативке.
 
-## max_replica_delay_for_distributed_queries {#settings_settings_max_replica_delay_for_distributed_queries}
+## max_replica_delay_for_distributed_queries {#settings-max_replica_delay_for_distributed_queries}
 
 Отключает отстающие реплики при распределенных запросах. Смотрите "[Репликация](../../operations/table_engines/replication.md)".
 
diff --git a/docs/ru/operations/table_engines/collapsingmergetree.md b/docs/ru/operations/table_engines/collapsingmergetree.md
index cc938de2af3..f09d84cf8e8 100644
--- a/docs/ru/operations/table_engines/collapsingmergetree.md
+++ b/docs/ru/operations/table_engines/collapsingmergetree.md
@@ -54,7 +54,7 @@ CREATE TABLE [IF NOT EXISTS] [db.]table_name [ON CLUSTER cluster]
 
 </details>
 
-## Сворачивание (удаление) строк {table_engine-collapsingmergetree-collapsing}
+## Сворачивание (удаление) строк {#table_engine-collapsingmergetree-collapsing}
 
 ### Данные
 
diff --git a/docs/ru/operations/table_engines/replication.md b/docs/ru/operations/table_engines/replication.md
index fe61e3a232c..efe5a2257b3 100644
--- a/docs/ru/operations/table_engines/replication.md
+++ b/docs/ru/operations/table_engines/replication.md
@@ -67,7 +67,7 @@
 
 Система следит за синхронностью данных на репликах и умеет восстанавливаться после сбоя. Восстановление после сбоя автоматическое (в случае небольших различий в данных) или полуавтоматическое (когда данные отличаются слишком сильно, что может свидетельствовать об ошибке конфигурации).
 
-## Создание реплицируемых таблиц
+## Создание реплицируемых таблиц {#creating-replicated-tables}
 
 В начало имени движка таблицы добавляется `Replicated`. Например, `ReplicatedMergeTree`.
 

From 4bae599fcdcac0394917c26d1d201fcd4a8c9479 Mon Sep 17 00:00:00 2001
From: BayoNet <da-daos@yandex.ru>
Date: Mon, 4 Mar 2019 18:34:35 +0300
Subject: [PATCH 21/63] DOCAPI-5203: The direct I/O settings are moved to right
 places.

---
 docs/en/operations/settings/settings.md       | 14 --------------
 docs/en/operations/table_engines/mergetree.md |  2 ++
 2 files changed, 2 insertions(+), 14 deletions(-)

diff --git a/docs/en/operations/settings/settings.md b/docs/en/operations/settings/settings.md
index ff31b267d1d..8f3e0d525ef 100644
--- a/docs/en/operations/settings/settings.md
+++ b/docs/en/operations/settings/settings.md
@@ -175,20 +175,6 @@ Any positive integer.
 
 **Default value**: 1048576.
 
-## min_merge_bytes_to_use_direct_io {#settings-min_merge_bytes_to_use_direct_io}
-
-The minimum data volume for merge operation required for using of the direct I/O interface of the storage disk.
-
-ClickHouse uses this setting when merging data parts of the [MergeTree](../table_engines/mergetree.md)-family tables. During the merge, ClickHouse calculates summary storage volume of all the data to be merged. If the volume exceeds `min_merge_bytes_to_use_direct_io` bytes, than ClickHouse reads and writes the data using direct I/O interface (`O_DIRECT` option) to the storage disk.
-
-**Possible values**
-
-Positive integer.
-
-0 — The direct I/O is disabled.
-
-**Default value**: `10 * 1024 * 1024 * 1024` bytes.
-
 ## min_bytes_to_use_direct_io {#settings-min_bytes_to_use_direct_io}
 
 The minimum data volume to be read from storage required for using of the direct I/O interface of the storage disk.
diff --git a/docs/en/operations/table_engines/mergetree.md b/docs/en/operations/table_engines/mergetree.md
index 7d86776d27b..3658392c70c 100644
--- a/docs/en/operations/table_engines/mergetree.md
+++ b/docs/en/operations/table_engines/mergetree.md
@@ -70,6 +70,8 @@ For a description of request parameters, see [request description](../../query_l
 
 - `SETTINGS` — Additional parameters that control the behavior of the `MergeTree`:
     - `index_granularity` — The granularity of an index. The number of data rows between the "marks" of an index. By default, 8192. The list of all available parameters you can see in [MergeTreeSettings.h](https://github.com/yandex/ClickHouse/blob/master/dbms/src/Storages/MergeTree/MergeTreeSettings.h).
+    - `min_merge_bytes_to_use_direct_io` — The minimum data volume for merge operation required for using of the direct I/O interface of the storage disk. During the merging of the data parts, ClickHouse calculates summary storage volume of all the data to be merged. If the volume exceeds `min_merge_bytes_to_use_direct_io` bytes, thеn ClickHouse reads and writes the data using direct I/O interface (`O_DIRECT` option) to the storage disk. If `min_merge_bytes_to_use_direct_io = 0`, then the direct I/O is disabled. Default value: `10 * 1024 * 1024 * 1024` bytes.
+
 
 **Example of sections setting**
 

From 9fde4594c92a9f4d975ed299298c7c9564729e4e Mon Sep 17 00:00:00 2001
From: BayoNet <da-daos@yandex.ru>
Date: Mon, 4 Mar 2019 19:27:00 +0300
Subject: [PATCH 22/63] DOCAPI-5758: New parameter kafka_skip_broken_messages
 in the Kafka engine description.

---
 docs/en/operations/table_engines/kafka.md | 63 ++++++++++++++---------
 1 file changed, 40 insertions(+), 23 deletions(-)

diff --git a/docs/en/operations/table_engines/kafka.md b/docs/en/operations/table_engines/kafka.md
index 3927e472e50..87322afb48e 100644
--- a/docs/en/operations/table_engines/kafka.md
+++ b/docs/en/operations/table_engines/kafka.md
@@ -9,38 +9,38 @@ Kafka lets you:
 - Process streams as they become available.
 
 
-Old format:
+## Creating a Table {#table_engine-kafka-creating-a-table}
 
 ```
-Kafka(kafka_broker_list, kafka_topic_list, kafka_group_name, kafka_format
-      [, kafka_row_delimiter, kafka_schema, kafka_num_consumers])
+CREATE TABLE [IF NOT EXISTS] [db.]table_name [ON CLUSTER cluster]
+(
+    name1 [type1] [DEFAULT|MATERIALIZED|ALIAS expr1],
+    name2 [type2] [DEFAULT|MATERIALIZED|ALIAS expr2],
+    ...
+) ENGINE = Kafka()
+SETTINGS
+    kafka_broker_list = 'host:port',
+    kafka_topic_list = 'topic1,topic2,...',
+    kafka_group_name = 'group_name',
+    kafka_format = 'data_format'[,]
+    [kafka_row_delimiter = 'delimiter_symbol',]
+    [kafka_schema = '',]
+    [kafka_num_consumers = N,]
+    [kafka_skip_broken_messages = <0|1>]
 ```
-
-New format:
-
-```
-Kafka SETTINGS
-  kafka_broker_list = 'localhost:9092',
-  kafka_topic_list = 'topic1,topic2',
-  kafka_group_name = 'group1',
-  kafka_format = 'JSONEachRow',
-  kafka_row_delimiter = '\n',
-  kafka_schema = '',
-  kafka_num_consumers = 2
-```
-
 Required parameters:
 
-- `kafka_broker_list` – A comma-separated list of brokers (`localhost:9092`).
-- `kafka_topic_list` – A list of Kafka topics (`my_topic`).
-- `kafka_group_name` – A group of Kafka consumers (`group1`). Reading margins are tracked for each group separately. If you don't want messages to be duplicated in the cluster, use the same group name everywhere.
-- `kafka_format` – Message format. Uses the same notation as the SQL ` FORMAT` function, such as ` JSONEachRow`. For more information, see the "Formats" section.
+- `kafka_broker_list` – A comma-separated list of brokers (for example, `localhost:9092`).
+- `kafka_topic_list` – A list of Kafka topics.
+- `kafka_group_name` – A group of Kafka consumers. Reading margins are tracked for each group separately. If you don't want messages to be duplicated in the cluster, use the same group name everywhere.
+- `kafka_format` – Message format. Uses the same notation as the SQL `FORMAT` function, such as `JSONEachRow`. For more information, see the [Formats](../../interfaces/formats.md) section.
 
 Optional parameters:
 
-- `kafka_row_delimiter` - Character-delimiter of records (rows), which ends the message.
-- `kafka_schema` – An optional parameter that must be used if the format requires a schema definition. For example, [Cap'n Proto](https://capnproto.org/) requires the path to the schema file and the name of the root `schema.capnp:Message` object.
+- `kafka_row_delimiter` – Delimiter character, which ends the message.
+- `kafka_schema` – Parameter that must be used if the format requires a schema definition. For example, [Cap'n Proto](https://capnproto.org/) requires the path to the schema file and the name of the root `schema.capnp:Message` object.
 - `kafka_num_consumers` – The number of consumers per table. Default: `1`. Specify more consumers if the throughput of one consumer is insufficient. The total number of consumers should not exceed the number of partitions in the topic, since only one consumer can be assigned per partition.
+- `kafka_skip_broken_messages` – Kafka message parser mode. If `kafka_skip_broken_messages = 1`, the engine skips Kafka messages that can't be parsed (one message corresponds to one row of data).
 
 Examples:
 
@@ -72,6 +72,23 @@ Examples:
                        kafka_num_consumers = 4;
 ```
 
+
+<details markdown="1"><summary>Deprecated Method for Creating a Table</summary>
+
+!!! attention
+    Do not use this method in new projects and, if possible, switch the old projects to the method described above.
+
+
+```
+Kafka(kafka_broker_list, kafka_topic_list, kafka_group_name, kafka_format
+      [, kafka_row_delimiter, kafka_schema, kafka_num_consumers, kafka_skip_broken_messages])
+```
+
+</details>
+
+## Description
+
+
 The delivered messages are tracked automatically, so each message in a group is only counted once. If you want to get the data twice, then create a copy of the table with another group name.
 
 Groups are flexible and synced on the cluster. For instance, if you have 10 topics and 5 copies of a table in a cluster, then each copy gets 2 topics. If the number of copies changes, the topics are redistributed across the copies automatically. Read more about this at [http://kafka.apache.org/intro](http://kafka.apache.org/intro).

From 339047fc40bdd24272ca78b330b3f71ff2b87145 Mon Sep 17 00:00:00 2001
From: chertus <chertus@gmail.com>
Date: Mon, 4 Mar 2019 22:40:58 +0300
Subject: [PATCH 23/63] fix multiple joins asterisks qualification

---
 .../DatabaseAndTableWithAlias.cpp             |  4 +-
 .../Interpreters/DatabaseAndTableWithAlias.h  |  2 +-
 dbms/src/Interpreters/SyntaxAnalyzer.cpp      |  3 +-
 .../TranslateQualifiedNamesVisitor.cpp        | 34 +++++--------
 dbms/src/Parsers/ASTIdentifier.cpp            |  4 ++
 dbms/src/Parsers/ASTIdentifier.h              |  1 +
 .../00820_multiple_joins.reference            |  4 --
 .../0_stateless/00820_multiple_joins.sql      | 10 ++--
 .../00847_multiple_join_same_column.reference | 37 ++++++++++++++
 .../00847_multiple_join_same_column.sql       | 48 +++++++++++++++++++
 10 files changed, 111 insertions(+), 36 deletions(-)
 create mode 100644 dbms/tests/queries/0_stateless/00847_multiple_join_same_column.reference
 create mode 100644 dbms/tests/queries/0_stateless/00847_multiple_join_same_column.sql

diff --git a/dbms/src/Interpreters/DatabaseAndTableWithAlias.cpp b/dbms/src/Interpreters/DatabaseAndTableWithAlias.cpp
index c6fbfaad088..52b05fc5933 100644
--- a/dbms/src/Interpreters/DatabaseAndTableWithAlias.cpp
+++ b/dbms/src/Interpreters/DatabaseAndTableWithAlias.cpp
@@ -62,11 +62,11 @@ bool DatabaseAndTableWithAlias::satisfies(const DatabaseAndTableWithAlias & db_t
     return database == db_table.database && table == db_table.table;
 }
 
-String DatabaseAndTableWithAlias::getQualifiedNamePrefix() const
+String DatabaseAndTableWithAlias::getQualifiedNamePrefix(bool with_dot) const
 {
     if (alias.empty() && table.empty())
         return "";
-    return (!alias.empty() ? alias : table) + '.';
+    return (!alias.empty() ? alias : table) + (with_dot ? "." : "");
 }
 
 std::vector<const ASTTableExpression *> getSelectTablesExpression(const ASTSelectQuery & select_query)
diff --git a/dbms/src/Interpreters/DatabaseAndTableWithAlias.h b/dbms/src/Interpreters/DatabaseAndTableWithAlias.h
index e9d8ee409a6..0f1cbe8bbc7 100644
--- a/dbms/src/Interpreters/DatabaseAndTableWithAlias.h
+++ b/dbms/src/Interpreters/DatabaseAndTableWithAlias.h
@@ -32,7 +32,7 @@ struct DatabaseAndTableWithAlias
     DatabaseAndTableWithAlias(const ASTTableExpression & table_expression, const String & current_database = "");
 
     /// "alias." or "table." if alias is empty
-    String getQualifiedNamePrefix() const;
+    String getQualifiedNamePrefix(bool with_dot = true) const;
 
     /// Check if it satisfies another db_table name. @note opterion is not symmetric.
     bool satisfies(const DatabaseAndTableWithAlias & table, bool table_may_be_an_alias);
diff --git a/dbms/src/Interpreters/SyntaxAnalyzer.cpp b/dbms/src/Interpreters/SyntaxAnalyzer.cpp
index d3b42c57926..6d274e326b4 100644
--- a/dbms/src/Interpreters/SyntaxAnalyzer.cpp
+++ b/dbms/src/Interpreters/SyntaxAnalyzer.cpp
@@ -652,7 +652,8 @@ SyntaxAnalyzerResultPtr SyntaxAnalyzer::analyze(
     {
         if (const ASTTablesInSelectQueryElement * node = select_query->join())
         {
-            replaceJoinedTable(node);
+            if (settings.enable_optimize_predicate_expression)
+                replaceJoinedTable(node);
 
             const auto & joined_expression = static_cast<const ASTTableExpression &>(*node->table_expression);
             DatabaseAndTableWithAlias table(joined_expression, context.getCurrentDatabase());
diff --git a/dbms/src/Interpreters/TranslateQualifiedNamesVisitor.cpp b/dbms/src/Interpreters/TranslateQualifiedNamesVisitor.cpp
index 07a823e3452..a0b5aed0af3 100644
--- a/dbms/src/Interpreters/TranslateQualifiedNamesVisitor.cpp
+++ b/dbms/src/Interpreters/TranslateQualifiedNamesVisitor.cpp
@@ -143,21 +143,14 @@ void TranslateQualifiedNamesMatcher::visit(ASTSelectQuery & select, const ASTPtr
         Visitor(data).visit(*add_node);
 }
 
-/// qualifed names for duplicates
-static std::shared_ptr<ASTIdentifier> makeIdentifier(const String & short_name, const String & long_name, bool need_long_name)
+static void addIdentifier(ASTs & nodes, const String & table_name, const String & column_name, AsteriskSemantic::RevertedAliasesPtr aliases)
 {
-    if (need_long_name)
-        return std::make_shared<ASTIdentifier>(long_name);
-    return std::make_shared<ASTIdentifier>(short_name);
-}
+    auto identifier = std::make_shared<ASTIdentifier>(std::vector<String>{table_name, column_name});
 
-static void addIdentifier(ASTs & nodes, std::shared_ptr<ASTIdentifier> identifier, const String & long_name,
-                          AsteriskSemantic::RevertedAliasesPtr aliases)
-{
     bool added = false;
-    if (aliases && aliases->count(long_name))
+    if (aliases && aliases->count(identifier->name))
     {
-        for (const String & alias : (*aliases)[long_name])
+        for (const String & alias : (*aliases)[identifier->name])
         {
             nodes.push_back(identifier->clone());
             nodes.back()->setAlias(alias);
@@ -173,7 +166,6 @@ static void addIdentifier(ASTs & nodes, std::shared_ptr<ASTIdentifier> identifie
 void TranslateQualifiedNamesMatcher::visit(ASTExpressionList & node, const ASTPtr &, Data & data)
 {
     const auto & tables_with_columns = data.tables;
-    const auto & source_columns = data.source_columns;
 
     ASTs old_children;
     if (data.processAsterisks())
@@ -208,16 +200,14 @@ void TranslateQualifiedNamesMatcher::visit(ASTExpressionList & node, const ASTPt
         if (const auto * asterisk = typeid_cast<const ASTAsterisk *>(child.get()))
         {
             bool first_table = true;
-            for (const auto & [table_name, table_columns] : tables_with_columns)
+            for (const auto & [table, table_columns] : tables_with_columns)
             {
                 for (const auto & column_name : table_columns)
                 {
                     if (first_table || !data.join_using_columns.count(column_name))
                     {
-                        bool need_prefix = !first_table && source_columns.count(column_name);
-                        String long_name = table_name.getQualifiedNamePrefix() + column_name;
-                        auto identifier = makeIdentifier(column_name, long_name, need_prefix);
-                        addIdentifier(node.children, identifier, long_name, AsteriskSemantic::getAliases(*asterisk));
+                        String table_name = table.getQualifiedNamePrefix(false);
+                        addIdentifier(node.children, table_name, column_name, AsteriskSemantic::getAliases(*asterisk));
                     }
                 }
 
@@ -229,16 +219,14 @@ void TranslateQualifiedNamesMatcher::visit(ASTExpressionList & node, const ASTPt
             DatabaseAndTableWithAlias ident_db_and_name(qualified_asterisk->children[0]);
 
             bool first_table = true;
-            for (const auto & [table_name, table_columns] : tables_with_columns)
+            for (const auto & [table, table_columns] : tables_with_columns)
             {
-                if (ident_db_and_name.satisfies(table_name, true))
+                if (ident_db_and_name.satisfies(table, true))
                 {
                     for (const auto & column_name : table_columns)
                     {
-                        bool need_prefix = !first_table && source_columns.count(column_name);
-                        String long_name = table_name.getQualifiedNamePrefix() + column_name;
-                        auto identifier = makeIdentifier(column_name, long_name, need_prefix);
-                        addIdentifier(node.children, identifier, long_name, AsteriskSemantic::getAliases(*qualified_asterisk));
+                        String table_name = table.getQualifiedNamePrefix(false);
+                        addIdentifier(node.children, table_name, column_name, AsteriskSemantic::getAliases(*qualified_asterisk));
                     }
                     break;
                 }
diff --git a/dbms/src/Parsers/ASTIdentifier.cpp b/dbms/src/Parsers/ASTIdentifier.cpp
index 406a405b02c..c8b3d719b3b 100644
--- a/dbms/src/Parsers/ASTIdentifier.cpp
+++ b/dbms/src/Parsers/ASTIdentifier.cpp
@@ -29,6 +29,10 @@ ASTIdentifier::ASTIdentifier(const String & name_, std::vector<String> && name_p
 {
 }
 
+ASTIdentifier::ASTIdentifier(std::vector<String> && name_parts_)
+    : ASTIdentifier(name_parts_.at(0) + '.' + name_parts_.at(1), std::move(name_parts_))
+{}
+
 void ASTIdentifier::setShortName(const String & new_name)
 {
     name = new_name;
diff --git a/dbms/src/Parsers/ASTIdentifier.h b/dbms/src/Parsers/ASTIdentifier.h
index 995b725185c..1439ab2dcbd 100644
--- a/dbms/src/Parsers/ASTIdentifier.h
+++ b/dbms/src/Parsers/ASTIdentifier.h
@@ -22,6 +22,7 @@ public:
     String name;
 
     ASTIdentifier(const String & name_, std::vector<String> && name_parts_ = {});
+    ASTIdentifier(std::vector<String> && name_parts_);
 
     /** Get the text that identifies this element. */
     String getID(char delim) const override { return "Identifier" + (delim + name); }
diff --git a/dbms/tests/queries/0_stateless/00820_multiple_joins.reference b/dbms/tests/queries/0_stateless/00820_multiple_joins.reference
index 2e7d8660562..93744e2c46d 100644
--- a/dbms/tests/queries/0_stateless/00820_multiple_joins.reference
+++ b/dbms/tests/queries/0_stateless/00820_multiple_joins.reference
@@ -32,7 +32,3 @@
 6	6	60	60
 12	12	120	120
 18	18	180	180
-0	0	0	0	0	0	0
-6	6	60	60	66	66	120
-12	12	120	120	132	132	240
-18	18	180	180	198	198	360
diff --git a/dbms/tests/queries/0_stateless/00820_multiple_joins.sql b/dbms/tests/queries/0_stateless/00820_multiple_joins.sql
index c19f4467934..b61777419d9 100644
--- a/dbms/tests/queries/0_stateless/00820_multiple_joins.sql
+++ b/dbms/tests/queries/0_stateless/00820_multiple_joins.sql
@@ -69,11 +69,11 @@ from table1 as t1
 join table2 as t2 on t1.a = t2.a
 join table3 as t3 on t2.b = t3.b; -- { serverError 48 }
 
-select t1.a as t1_a, t2.a as t2_a, t2.b as t2_b, t3.b as t3_b,
-    (t1.a + table2.b) as t1_t2_x, (table1.a + table3.b) as t1_t3_x, (t2.b + t3.b) as t2_t3_x
-from table1 as t1
-join table2 as t2 on t1_a = t2_a
-join table3 as t3 on t2_b = t3_b;
+--select t1.a as t1_a, t2.a as t2_a, t2.b as t2_b, t3.b as t3_b,
+--    (t1.a + table2.b) as t1_t2_x, (table1.a + table3.b) as t1_t3_x, (t2.b + t3.b) as t2_t3_x
+--from table1 as t1
+--join table2 as t2 on t1_a = t2_a
+--join table3 as t3 on t2_b = t3_b;
 
 --select (t1.a + table2.b) as t1_t2_x, (table1.a + table3.b) as t1_t3_x, (t2.b + t3.b) as t2_t3_x
 --from table1 as t1
diff --git a/dbms/tests/queries/0_stateless/00847_multiple_join_same_column.reference b/dbms/tests/queries/0_stateless/00847_multiple_join_same_column.reference
new file mode 100644
index 00000000000..d4d045a7796
--- /dev/null
+++ b/dbms/tests/queries/0_stateless/00847_multiple_join_same_column.reference
@@ -0,0 +1,37 @@
+Row 1:
+──────
+t.a: 1
+s.b: 1
+s.a: 1
+s.b: 1
+y.a: 1
+y.b: 1
+
+Row 2:
+──────
+t.a: 2
+s.b: 0
+s.a: 0
+s.b: 0
+y.a: 0
+y.b: 0
+┌─t.a─┬─s.b─┬─s.a─┬─s.b─┬─y.a─┬─y.b─┐
+│   1 │   1 │   1 │   1 │   1 │   1 │
+│   2 │   0 │   0 │   0 │   0 │   0 │
+└─────┴─────┴─────┴─────┴─────┴─────┘
+┌─t_a─┐
+│   1 │
+│   2 │
+└─────┘
+┌─t.a─┬─s_a─┐
+│   1 │   1 │
+│   2 │   0 │
+└─────┴─────┘
+┌─t.a─┬─t.a─┬─t_b─┐
+│   1 │   1 │   1 │
+│   2 │   2 │   2 │
+└─────┴─────┴─────┘
+┌─s.a─┬─s.a─┐
+│   1 │   1 │
+│   0 │   0 │
+└─────┴─────┘
diff --git a/dbms/tests/queries/0_stateless/00847_multiple_join_same_column.sql b/dbms/tests/queries/0_stateless/00847_multiple_join_same_column.sql
new file mode 100644
index 00000000000..08aca31f99e
--- /dev/null
+++ b/dbms/tests/queries/0_stateless/00847_multiple_join_same_column.sql
@@ -0,0 +1,48 @@
+use test;
+
+drop table if exists t;
+drop table if exists s;
+drop table if exists y;
+
+create table t(a Int64, b Int64) engine = TinyLog;
+create table s(a Int64, b Int64) engine = TinyLog;
+create table y(a Int64, b Int64) engine = TinyLog;
+
+insert into t values (1,1), (2,2);
+insert into s values (1,1);
+insert into y values (1,1);
+
+select t.a, s.b, s.a, s.b, y.a, y.b from t
+left join s on (t.a = s.a and t.b = s.b)
+left join y on (y.a = s.a and y.b = s.b) format Vertical;
+
+select t.a, s.b, s.a, s.b, y.a, y.b from t
+left join s on (t.a = s.a and s.b = t.b)
+left join y on (y.a = s.a and y.b = s.b) format PrettyCompactNoEscapes;
+
+select t.a as t_a from t
+left join s on s.a = t_a format PrettyCompactNoEscapes;
+
+select t.a, s.a as s_a from t
+left join s on s.a = t.a
+left join y on y.b = s.b format PrettyCompactNoEscapes;
+
+select t.a, t.a, t.b as t_b from t
+left join s on s.a = t.a
+left join y on y.b = s.b format PrettyCompactNoEscapes;
+
+select s.a, s.a from t
+left join s on s.a = t.a
+left join y on y.b = s.b format PrettyCompactNoEscapes;
+
+--select t.a, t.a, t.b as t_b, t.b from t
+--left join s on s.a = t.a
+--left join y on y.b = s.b format PrettyCompactNoEscapes;
+
+--select t.a, t.a, s.b as s_b, s.b from t
+--left join s on s.a = t.a
+--left join y on y.b = s.b format PrettyCompactNoEscapes;
+
+drop table t;
+drop table s;
+drop table y;

From 16c967002e528644963a8600cd8a97458c34005a Mon Sep 17 00:00:00 2001
From: BayoNet <da-daos@yandex.ru>
Date: Tue, 5 Mar 2019 13:16:45 +0300
Subject: [PATCH 24/63] DOCAPI-5203: Fix in terms of direct I/O.

---
 docs/en/operations/settings/settings.md       | 2 +-
 docs/en/operations/table_engines/mergetree.md | 2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/docs/en/operations/settings/settings.md b/docs/en/operations/settings/settings.md
index 8f3e0d525ef..fff660999e2 100644
--- a/docs/en/operations/settings/settings.md
+++ b/docs/en/operations/settings/settings.md
@@ -177,7 +177,7 @@ Any positive integer.
 
 ## min_bytes_to_use_direct_io {#settings-min_bytes_to_use_direct_io}
 
-The minimum data volume to be read from storage required for using of the direct I/O interface of the storage disk.
+The minimum data volume to be read from storage that is required for using direct I/O access to the storage disk.
 
 ClickHouse uses this setting when selecting the data from tables. If summary storage volume of all the data to be read exceeds `min_bytes_to_use_direct_io` bytes, then ClickHouse reads the data from the storage disk with `O_DIRECT` option.
 
diff --git a/docs/en/operations/table_engines/mergetree.md b/docs/en/operations/table_engines/mergetree.md
index 3658392c70c..53bb909b16d 100644
--- a/docs/en/operations/table_engines/mergetree.md
+++ b/docs/en/operations/table_engines/mergetree.md
@@ -70,7 +70,7 @@ For a description of request parameters, see [request description](../../query_l
 
 - `SETTINGS` — Additional parameters that control the behavior of the `MergeTree`:
     - `index_granularity` — The granularity of an index. The number of data rows between the "marks" of an index. By default, 8192. The list of all available parameters you can see in [MergeTreeSettings.h](https://github.com/yandex/ClickHouse/blob/master/dbms/src/Storages/MergeTree/MergeTreeSettings.h).
-    - `min_merge_bytes_to_use_direct_io` — The minimum data volume for merge operation required for using of the direct I/O interface of the storage disk. During the merging of the data parts, ClickHouse calculates summary storage volume of all the data to be merged. If the volume exceeds `min_merge_bytes_to_use_direct_io` bytes, thеn ClickHouse reads and writes the data using direct I/O interface (`O_DIRECT` option) to the storage disk. If `min_merge_bytes_to_use_direct_io = 0`, then the direct I/O is disabled. Default value: `10 * 1024 * 1024 * 1024` bytes.
+    - `min_merge_bytes_to_use_direct_io` — The minimum data volume for a merge operation that is required for using direct I/O access to the storage disk. When merging data parts, ClickHouse calculates the total storage volume of all the data to be merged. If the volume exceeds `min_merge_bytes_to_use_direct_io` bytes, then ClickHouse reads and writes the data to the storage disk using the direct I/O interface (`O_DIRECT` option). If `min_merge_bytes_to_use_direct_io = 0`, then direct I/O is disabled. Default value: `10 * 1024 * 1024 * 1024` bytes.
 
 
 **Example of sections setting**

From a8106360bd00297b18bd8a238afa0905d807150b Mon Sep 17 00:00:00 2001
From: chertus <chertus@gmail.com>
Date: Tue, 5 Mar 2019 13:57:05 +0300
Subject: [PATCH 25/63] fix ASTIdentifier print (compound could be short)

---
 dbms/src/Parsers/ASTIdentifier.cpp | 5 ++---
 1 file changed, 2 insertions(+), 3 deletions(-)

diff --git a/dbms/src/Parsers/ASTIdentifier.cpp b/dbms/src/Parsers/ASTIdentifier.cpp
index c8b3d719b3b..1a9db37391a 100644
--- a/dbms/src/Parsers/ASTIdentifier.cpp
+++ b/dbms/src/Parsers/ASTIdentifier.cpp
@@ -52,9 +52,8 @@ void ASTIdentifier::formatImplWithoutAlias(const FormatSettings & settings, Form
         settings.ostr << (settings.hilite ? hilite_none : "");
     };
 
-    /// A simple or compound identifier?
-
-    if (name_parts.size() > 1)
+    /// It could be compound but short
+    if (!isShort())
     {
         for (size_t i = 0, size = name_parts.size(); i < size; ++i)
         {

From 52c9d4e1ad001de14f25e81e589fc9124b51c12d Mon Sep 17 00:00:00 2001
From: Nikolai Kochetov <nik-kochetov@yandex-team.ru>
Date: Tue, 5 Mar 2019 13:55:26 +0300
Subject: [PATCH 26/63] (De)Serialize set index with multiple bulks. #4486

---
 .../src/Storages/MergeTree/MergeTreeIndices.h |  1 +
 .../MergeTree/MergeTreeSetSkippingIndex.cpp   | 23 +++++++++++++++++--
 2 files changed, 22 insertions(+), 2 deletions(-)

diff --git a/dbms/src/Storages/MergeTree/MergeTreeIndices.h b/dbms/src/Storages/MergeTree/MergeTreeIndices.h
index 6738d667b44..1d62e9e9e9c 100644
--- a/dbms/src/Storages/MergeTree/MergeTreeIndices.h
+++ b/dbms/src/Storages/MergeTree/MergeTreeIndices.h
@@ -11,6 +11,7 @@
 #include <Storages/MergeTree/MarkRange.h>
 #include <Interpreters/ExpressionActions.h>
 #include <Parsers/ASTIndexDeclaration.h>
+#include <DataTypes/DataTypeLowCardinality.h>
 
 constexpr auto INDEX_FILE_PREFIX = "skp_idx_";
 
diff --git a/dbms/src/Storages/MergeTree/MergeTreeSetSkippingIndex.cpp b/dbms/src/Storages/MergeTree/MergeTreeSetSkippingIndex.cpp
index 69323fe8bb4..686d36b2c5b 100644
--- a/dbms/src/Storages/MergeTree/MergeTreeSetSkippingIndex.cpp
+++ b/dbms/src/Storages/MergeTree/MergeTreeSetSkippingIndex.cpp
@@ -47,7 +47,16 @@ void MergeTreeSetIndexGranule::serializeBinary(WriteBuffer & ostr) const
     for (size_t i = 0; i < index.columns.size(); ++i)
     {
         const auto & type = index.data_types[i];
-        type->serializeBinaryBulk(*columns[i], ostr, 0, size());
+
+        IDataType::SerializeBinaryBulkSettings settings;
+        settings.getter = [&ostr](IDataType::SubstreamPath) -> WriteBuffer * { return &ostr; };
+        settings.position_independent_encoding = false;
+        settings.low_cardinality_max_dictionary_size = 0;
+
+        IDataType::SerializeBinaryBulkStatePtr state;
+        type->serializeBinaryBulkStatePrefix(settings, state);
+        type->serializeBinaryBulkWithMultipleStreams(*columns[i], 0, size(), settings, state);
+        type->serializeBinaryBulkStateSuffix(settings, state);
     }
 }
 
@@ -66,11 +75,21 @@ void MergeTreeSetIndexGranule::deserializeBinary(ReadBuffer & istr)
     size_type->deserializeBinary(field_rows, istr);
     size_t rows_to_read = field_rows.get<size_t>();
 
+    if (rows_to_read == 0)
+        return;
+
     for (size_t i = 0; i < index.columns.size(); ++i)
     {
         const auto & type = index.data_types[i];
         auto new_column = type->createColumn();
-        type->deserializeBinaryBulk(*new_column, istr, rows_to_read, 0);
+
+        IDataType::DeserializeBinaryBulkSettings settings;
+        settings.getter = [&](IDataType::SubstreamPath) -> ReadBuffer * { return &istr; };
+        settings.position_independent_encoding = false;
+
+        IDataType::DeserializeBinaryBulkStatePtr state;
+        type->deserializeBinaryBulkStatePrefix(settings, state);
+        type->deserializeBinaryBulkWithMultipleStreams(*new_column, rows_to_read, settings, state);
 
         block.insert(ColumnWithTypeAndName(new_column->getPtr(), type, index.columns[i]));
     }

From 4b18b7dcdc23cf7f9c64d824974bd6de95600c09 Mon Sep 17 00:00:00 2001
From: Nikolai Kochetov <nik-kochetov@yandex-team.ru>
Date: Tue, 5 Mar 2019 14:47:40 +0300
Subject: [PATCH 27/63] Support Nullable columns for Set index. #4486

---
 .../MergeTree/MergeTreeSetSkippingIndex.cpp    | 18 ++++++++++++++++--
 1 file changed, 16 insertions(+), 2 deletions(-)

diff --git a/dbms/src/Storages/MergeTree/MergeTreeSetSkippingIndex.cpp b/dbms/src/Storages/MergeTree/MergeTreeSetSkippingIndex.cpp
index 686d36b2c5b..8c889fbdea7 100644
--- a/dbms/src/Storages/MergeTree/MergeTreeSetSkippingIndex.cpp
+++ b/dbms/src/Storages/MergeTree/MergeTreeSetSkippingIndex.cpp
@@ -196,10 +196,24 @@ bool SetIndexCondition::mayBeTrueOnGranule(MergeTreeIndexGranulePtr idx_granule)
     Block result = granule->getElementsBlock();
     actions->execute(result);
 
-    const auto & column = result.getByName(expression_ast->getColumnName()).column;
+    auto column = result.getByName(expression_ast->getColumnName()).column->convertToFullColumnIfLowCardinality();
+    auto * col_uint8 = typeid_cast<const ColumnUInt8 *>(column.get());
+
+    const NullMap * null_map = nullptr;
+
+    if (auto * col_nullable = typeid_cast<const ColumnNullable *>(column.get()))
+    {
+        col_uint8 = typeid_cast<const ColumnUInt8 *>(&col_nullable->getNestedColumn());
+        null_map = &col_nullable->getNullMapData();
+    }
+
+    if (!col_uint8)
+        throw Exception("ColumnUInt8 expected as Set index condition result.", ErrorCodes::LOGICAL_ERROR);
+
+    auto & condition = col_uint8->getData();
 
     for (size_t i = 0; i < column->size(); ++i)
-        if (column->getInt(i) & 1)
+        if ((!null_map || (*null_map)[i] == 0) && condition[i] & 1)
             return true;
 
     return false;

From 04bfc4743b398ea6556804fa46acd5a0c7769e9a Mon Sep 17 00:00:00 2001
From: Nikolai Kochetov <nik-kochetov@yandex-team.ru>
Date: Tue, 5 Mar 2019 15:13:49 +0300
Subject: [PATCH 28/63] Added tests for Set index with Nullable and
 LowCardinality types. #4486

---
 ...ith_nullable_and_low_cardinality.reference | 30 ++++++++
 ...ndex_with_nullable_and_low_cardinality.sql | 69 +++++++++++++++++++
 ...nullable_and_low_cardinality_bug.reference |  1 +
 ..._with_nullable_and_low_cardinality_bug.sql | 20 ++++++
 4 files changed, 120 insertions(+)
 create mode 100644 dbms/tests/queries/0_stateless/00907_set_index_with_nullable_and_low_cardinality.reference
 create mode 100644 dbms/tests/queries/0_stateless/00907_set_index_with_nullable_and_low_cardinality.sql
 create mode 100644 dbms/tests/queries/0_stateless/00907_set_index_with_nullable_and_low_cardinality_bug.reference
 create mode 100644 dbms/tests/queries/0_stateless/00907_set_index_with_nullable_and_low_cardinality_bug.sql

diff --git a/dbms/tests/queries/0_stateless/00907_set_index_with_nullable_and_low_cardinality.reference b/dbms/tests/queries/0_stateless/00907_set_index_with_nullable_and_low_cardinality.reference
new file mode 100644
index 00000000000..f3918a338c4
--- /dev/null
+++ b/dbms/tests/queries/0_stateless/00907_set_index_with_nullable_and_low_cardinality.reference
@@ -0,0 +1,30 @@
+1	a
+-
+2	b
+-
+--
+1	a
+-
+2	b
+-
+--
+1	a
+-
+2	b
+-
+----
+1	a
+-
+2	b
+-
+--
+1	a
+-
+2	b
+-
+--
+1	a
+-
+2	b
+-
+----
diff --git a/dbms/tests/queries/0_stateless/00907_set_index_with_nullable_and_low_cardinality.sql b/dbms/tests/queries/0_stateless/00907_set_index_with_nullable_and_low_cardinality.sql
new file mode 100644
index 00000000000..363e0e9c0b5
--- /dev/null
+++ b/dbms/tests/queries/0_stateless/00907_set_index_with_nullable_and_low_cardinality.sql
@@ -0,0 +1,69 @@
+SET allow_experimental_data_skipping_indices=1;
+
+drop table if exists test.nullable_set_index;
+create table test.nullable_set_index (a UInt64, b Nullable(String), INDEX b_index b TYPE set(0) GRANULARITY 8192) engine = MergeTree order by a;
+insert into test.nullable_set_index values (1, 'a');
+insert into test.nullable_set_index values (2, 'b');
+select * from test.nullable_set_index where b = 'a';
+select '-';
+select * from test.nullable_set_index where b = 'b';
+select '-';
+select * from test.nullable_set_index where b = 'c';
+select '--';
+
+drop table if exists test.nullable_set_index;
+create table test.nullable_set_index (a UInt64, b Nullable(String), INDEX b_index b TYPE set(1) GRANULARITY 8192) engine = MergeTree order by a;
+insert into test.nullable_set_index values (1, 'a');
+insert into test.nullable_set_index values (2, 'b');
+select * from test.nullable_set_index where b = 'a';
+select '-';
+select * from test.nullable_set_index where b = 'b';
+select '-';
+select * from test.nullable_set_index where b = 'c';
+select '--';
+
+drop table if exists test.nullable_set_index;
+create table test.nullable_set_index (a UInt64, b Nullable(String), INDEX b_index b TYPE set(0) GRANULARITY 8192) engine = MergeTree order by a;
+insert into test.nullable_set_index values (1, 'a'), (2, 'b');
+select * from test.nullable_set_index where b = 'a';
+select '-';
+select * from test.nullable_set_index where b = 'b';
+select '-';
+select * from test.nullable_set_index where b = 'c';
+select '----';
+
+
+drop table if exists test.nullable_set_index;
+create table test.nullable_set_index (a UInt64, b LowCardinality(Nullable(String)), INDEX b_index b TYPE set(0) GRANULARITY 8192) engine = MergeTree order by a;
+insert into test.nullable_set_index values (1, 'a');
+insert into test.nullable_set_index values (2, 'b');
+select * from test.nullable_set_index where b = 'a';
+select '-';
+select * from test.nullable_set_index where b = 'b';
+select '-';
+select * from test.nullable_set_index where b = 'c';
+select '--';
+
+drop table if exists test.nullable_set_index;
+create table test.nullable_set_index (a UInt64, b LowCardinality(Nullable(String)), INDEX b_index b TYPE set(1) GRANULARITY 8192) engine = MergeTree order by a;
+insert into test.nullable_set_index values (1, 'a');
+insert into test.nullable_set_index values (2, 'b');
+select * from test.nullable_set_index where b = 'a';
+select '-';
+select * from test.nullable_set_index where b = 'b';
+select '-';
+select * from test.nullable_set_index where b = 'c';
+select '--';
+
+drop table if exists test.nullable_set_index;
+create table test.nullable_set_index (a UInt64, b LowCardinality(Nullable(String)), INDEX b_index b TYPE set(0) GRANULARITY 8192) engine = MergeTree order by a;
+insert into test.nullable_set_index values (1, 'a'), (2, 'b');
+select * from test.nullable_set_index where b = 'a';
+select '-';
+select * from test.nullable_set_index where b = 'b';
+select '-';
+select * from test.nullable_set_index where b = 'c';
+select '----';
+
+drop table if exists test.nullable_set_index;
+
diff --git a/dbms/tests/queries/0_stateless/00907_set_index_with_nullable_and_low_cardinality_bug.reference b/dbms/tests/queries/0_stateless/00907_set_index_with_nullable_and_low_cardinality_bug.reference
new file mode 100644
index 00000000000..051c3fcdbcf
--- /dev/null
+++ b/dbms/tests/queries/0_stateless/00907_set_index_with_nullable_and_low_cardinality_bug.reference
@@ -0,0 +1 @@
+subscribe	alice
diff --git a/dbms/tests/queries/0_stateless/00907_set_index_with_nullable_and_low_cardinality_bug.sql b/dbms/tests/queries/0_stateless/00907_set_index_with_nullable_and_low_cardinality_bug.sql
new file mode 100644
index 00000000000..5bec1210a1e
--- /dev/null
+++ b/dbms/tests/queries/0_stateless/00907_set_index_with_nullable_and_low_cardinality_bug.sql
@@ -0,0 +1,20 @@
+SET allow_experimental_data_skipping_indices=1;
+
+drop table if exists test.null_lc_set_index;
+
+CREATE TABLE test.null_lc_set_index (
+  timestamp         DateTime,
+  action            LowCardinality(Nullable(String)),
+  user              LowCardinality(Nullable(String)),
+  INDEX test_user_idx (user) TYPE set(0) GRANULARITY 8192
+) ENGINE=MergeTree
+  PARTITION BY toYYYYMMDD(timestamp)
+  ORDER BY (timestamp, action, cityHash64(user))
+  SAMPLE BY cityHash64(user);
+INSERT INTO test.null_lc_set_index VALUES (1550883010, 'subscribe', 'alice');
+INSERT INTO test.null_lc_set_index VALUES (1550883020, 'follow', 'bob');
+
+SELECT action, user FROM test.null_lc_set_index WHERE user = 'alice';
+
+drop table if exists test.null_lc_set_index;
+

From ea4d3ec66178dbd4beeab556ce86d28f90909ebe Mon Sep 17 00:00:00 2001
From: chertus <chertus@gmail.com>
Date: Tue, 5 Mar 2019 15:34:48 +0300
Subject: [PATCH 29/63] some multiple join fixes

---
 .../JoinToSubqueryTransformVisitor.cpp        | 25 +++++++++++++------
 .../00820_multiple_joins.reference            |  4 +++
 .../0_stateless/00820_multiple_joins.sql      | 10 ++++----
 .../00847_multiple_join_same_column.reference | 16 +++++++++---
 .../00847_multiple_join_same_column.sql       | 20 +++++++--------
 5 files changed, 48 insertions(+), 27 deletions(-)

diff --git a/dbms/src/Interpreters/JoinToSubqueryTransformVisitor.cpp b/dbms/src/Interpreters/JoinToSubqueryTransformVisitor.cpp
index 55a036f7d74..5a1f7260a4f 100644
--- a/dbms/src/Interpreters/JoinToSubqueryTransformVisitor.cpp
+++ b/dbms/src/Interpreters/JoinToSubqueryTransformVisitor.cpp
@@ -36,9 +36,10 @@ struct ColumnAliasesMatcher
     {
         const std::vector<DatabaseAndTableWithAlias> tables;
         bool public_names;
-        AsteriskSemantic::RevertedAliases rev_aliases;
-        std::unordered_map<String, String> aliases;
+        AsteriskSemantic::RevertedAliases rev_aliases;  /// long_name -> aliases
+        std::unordered_map<String, String> aliases;     /// alias -> long_name
         std::vector<std::pair<ASTIdentifier *, bool>> compound_identifiers;
+        std::set<String> allowed_long_names;            /// original names allowed as aliases '--t.x as t.x' (select expressions only).
 
         Data(std::vector<DatabaseAndTableWithAlias> && tables_)
             : tables(tables_)
@@ -51,29 +52,37 @@ struct ColumnAliasesMatcher
 
             for (auto & [identifier, is_public] : compound_identifiers)
             {
-                auto it = rev_aliases.find(identifier->name);
+                String long_name = identifier->name;
+
+                auto it = rev_aliases.find(long_name);
                 if (it == rev_aliases.end())
                 {
                     bool last_table = IdentifierSemantic::canReferColumnToTable(*identifier, tables.back());
                     if (!last_table)
                     {
-                        String long_name = identifier->name;
                         String alias = hide_prefix + long_name;
                         aliases[alias] = long_name;
                         rev_aliases[long_name].push_back(alias);
 
                         identifier->setShortName(alias);
                         if (is_public)
+                        {
                             identifier->setAlias(long_name);
+                            allowed_long_names.insert(long_name);
+                        }
                     }
                     else if (is_public)
-                        identifier->setAlias(identifier->name); /// prevent crop long to short name
+                        identifier->setAlias(long_name); /// prevent crop long to short name
                 }
                 else
                 {
                     if (it->second.empty())
-                        throw Exception("No alias for '" + identifier->name + "'", ErrorCodes::LOGICAL_ERROR);
-                    identifier->setShortName(it->second[0]);
+                        throw Exception("No alias for '" + long_name + "'", ErrorCodes::LOGICAL_ERROR);
+
+                    if (is_public && allowed_long_names.count(long_name))
+                        ; /// leave original name unchanged for correct output
+                    else
+                        identifier->setShortName(it->second[0]);
                 }
             }
         }
@@ -131,7 +140,7 @@ struct ColumnAliasesMatcher
                 node.setAlias("");
             }
         }
-        else
+        else if (node.compound())
             data.compound_identifiers.emplace_back(&node, data.public_names);
     }
 };
diff --git a/dbms/tests/queries/0_stateless/00820_multiple_joins.reference b/dbms/tests/queries/0_stateless/00820_multiple_joins.reference
index 93744e2c46d..2e7d8660562 100644
--- a/dbms/tests/queries/0_stateless/00820_multiple_joins.reference
+++ b/dbms/tests/queries/0_stateless/00820_multiple_joins.reference
@@ -32,3 +32,7 @@
 6	6	60	60
 12	12	120	120
 18	18	180	180
+0	0	0	0	0	0	0
+6	6	60	60	66	66	120
+12	12	120	120	132	132	240
+18	18	180	180	198	198	360
diff --git a/dbms/tests/queries/0_stateless/00820_multiple_joins.sql b/dbms/tests/queries/0_stateless/00820_multiple_joins.sql
index b61777419d9..c19f4467934 100644
--- a/dbms/tests/queries/0_stateless/00820_multiple_joins.sql
+++ b/dbms/tests/queries/0_stateless/00820_multiple_joins.sql
@@ -69,11 +69,11 @@ from table1 as t1
 join table2 as t2 on t1.a = t2.a
 join table3 as t3 on t2.b = t3.b; -- { serverError 48 }
 
---select t1.a as t1_a, t2.a as t2_a, t2.b as t2_b, t3.b as t3_b,
---    (t1.a + table2.b) as t1_t2_x, (table1.a + table3.b) as t1_t3_x, (t2.b + t3.b) as t2_t3_x
---from table1 as t1
---join table2 as t2 on t1_a = t2_a
---join table3 as t3 on t2_b = t3_b;
+select t1.a as t1_a, t2.a as t2_a, t2.b as t2_b, t3.b as t3_b,
+    (t1.a + table2.b) as t1_t2_x, (table1.a + table3.b) as t1_t3_x, (t2.b + t3.b) as t2_t3_x
+from table1 as t1
+join table2 as t2 on t1_a = t2_a
+join table3 as t3 on t2_b = t3_b;
 
 --select (t1.a + table2.b) as t1_t2_x, (table1.a + table3.b) as t1_t3_x, (t2.b + t3.b) as t2_t3_x
 --from table1 as t1
diff --git a/dbms/tests/queries/0_stateless/00847_multiple_join_same_column.reference b/dbms/tests/queries/0_stateless/00847_multiple_join_same_column.reference
index d4d045a7796..1685a298042 100644
--- a/dbms/tests/queries/0_stateless/00847_multiple_join_same_column.reference
+++ b/dbms/tests/queries/0_stateless/00847_multiple_join_same_column.reference
@@ -31,7 +31,15 @@ y.b: 0
 │   1 │   1 │   1 │
 │   2 │   2 │   2 │
 └─────┴─────┴─────┘
-┌─s.a─┬─s.a─┐
-│   1 │   1 │
-│   0 │   0 │
-└─────┴─────┘
+┌─s.a─┬─s.a─┬─s_b─┬─s_b─┐
+│   1 │   1 │   1 │   1 │
+│   0 │   0 │   0 │   0 │
+└─────┴─────┴─────┴─────┘
+┌─y.a─┬─y.a─┬─y_b─┬─y_b─┐
+│   1 │   1 │   1 │   1 │
+│   0 │   0 │   0 │   0 │
+└─────┴─────┴─────┴─────┘
+┌─t_a─┬─t_a─┬─s_a─┬─s_a─┬─y_a─┬─y_a─┐
+│   1 │   1 │   1 │   1 │   1 │   1 │
+│   2 │   2 │   0 │   0 │   0 │   0 │
+└─────┴─────┴─────┴─────┴─────┴─────┘
diff --git a/dbms/tests/queries/0_stateless/00847_multiple_join_same_column.sql b/dbms/tests/queries/0_stateless/00847_multiple_join_same_column.sql
index 08aca31f99e..b4ce61e3ee7 100644
--- a/dbms/tests/queries/0_stateless/00847_multiple_join_same_column.sql
+++ b/dbms/tests/queries/0_stateless/00847_multiple_join_same_column.sql
@@ -28,21 +28,21 @@ left join s on s.a = t.a
 left join y on y.b = s.b format PrettyCompactNoEscapes;
 
 select t.a, t.a, t.b as t_b from t
+left join s on t.a = s.a
+left join y on y.b = s.b format PrettyCompactNoEscapes;
+
+select s.a, s.a, s.b as s_b, s.b from t
+left join s on s.a = t.a
+left join y on s.b = y.b format PrettyCompactNoEscapes;
+
+select y.a, y.a, y.b as y_b, y.b from t
 left join s on s.a = t.a
 left join y on y.b = s.b format PrettyCompactNoEscapes;
 
-select s.a, s.a from t
-left join s on s.a = t.a
+select t.a, t.a as t_a, s.a, s.a as s_a, y.a, y.a as y_a from t
+left join s on t.a = s.a
 left join y on y.b = s.b format PrettyCompactNoEscapes;
 
---select t.a, t.a, t.b as t_b, t.b from t
---left join s on s.a = t.a
---left join y on y.b = s.b format PrettyCompactNoEscapes;
-
---select t.a, t.a, s.b as s_b, s.b from t
---left join s on s.a = t.a
---left join y on y.b = s.b format PrettyCompactNoEscapes;
-
 drop table t;
 drop table s;
 drop table y;

From 0c0d9343d46d20db0e403d2364de460a666020d0 Mon Sep 17 00:00:00 2001
From: chertus <chertus@gmail.com>
Date: Tue, 5 Mar 2019 15:49:00 +0300
Subject: [PATCH 30/63] update ASTIdentifier prints for push down predicate
 test reference (long vs short names)

---
 .../0_stateless/00597_push_down_predicate.reference    | 10 +++++-----
 1 file changed, 5 insertions(+), 5 deletions(-)

diff --git a/dbms/tests/queries/0_stateless/00597_push_down_predicate.reference b/dbms/tests/queries/0_stateless/00597_push_down_predicate.reference
index ff97111f6b7..94adaffd52f 100644
--- a/dbms/tests/queries/0_stateless/00597_push_down_predicate.reference
+++ b/dbms/tests/queries/0_stateless/00597_push_down_predicate.reference
@@ -20,7 +20,7 @@ SELECT \n    a, \n    b\nFROM \n(\n    SELECT \n        toUInt64(sum(id) AS b) A
 3	3
 SELECT \n    date, \n    id, \n    name, \n    value\nFROM \n(\n    SELECT \n        date, \n        name, \n        value, \n        min(id) AS id\n    FROM test.test \n    GROUP BY \n        date, \n        name, \n        value\n    HAVING id = 1\n) \nWHERE id = 1
 2000-01-01	1	test string 1	1
-SELECT \n    a, \n    b\nFROM \n(\n    SELECT \n        toUInt64(sum(id) AS b) AS a, \n        b\n    FROM test.test AS table_alias \n    HAVING b = 3\n) AS outer_table_alias \nWHERE outer_table_alias.b = 3
+SELECT \n    a, \n    b\nFROM \n(\n    SELECT \n        toUInt64(sum(id) AS b) AS a, \n        b\n    FROM test.test AS table_alias \n    HAVING b = 3\n) AS outer_table_alias \nWHERE b = 3
 3	3
 SELECT \n    date, \n    id, \n    name, \n    value\nFROM \n(\n    SELECT \n        date, \n        id, \n        name, \n        value\n    FROM test.test \n    WHERE id = 1\n) \nWHERE id = 1
 2000-01-01	1	test string 1	1
@@ -32,9 +32,9 @@ SELECT \n    date, \n    id, \n    name, \n    value\nFROM \n(\n    SELECT \n
 2000-01-01	1	test string 1	1
 SELECT \n    date, \n    id, \n    name, \n    value\nFROM \n(\n    SELECT \n        date, \n        id, \n        name, \n        value\n    FROM \n    (\n        SELECT \n            date, \n            id, \n            name, \n            value\n        FROM test.test \n        WHERE id = 1\n    ) \n    WHERE id = 1\n) \nWHERE id = 1
 2000-01-01	1	test string 1	1
-SELECT \n    date, \n    id, \n    name, \n    value\nFROM \n(\n    SELECT \n        date, \n        id, \n        name, \n        value\n    FROM test.test \n    WHERE id = 1\n) AS b \nWHERE b.id = 1
+SELECT \n    date, \n    id, \n    name, \n    value\nFROM \n(\n    SELECT \n        date, \n        id, \n        name, \n        value\n    FROM test.test \n    WHERE id = 1\n) AS b \nWHERE id = 1
 2000-01-01	1	test string 1	1
-SELECT \n    date, \n    id, \n    name, \n    value\nFROM \n(\n    SELECT \n        date, \n        id, \n        name, \n        value\n    FROM \n    (\n        SELECT \n            date, \n            id, \n            name, \n            value\n        FROM test.test \n        WHERE id = 1\n    ) AS a \n    WHERE id = 1\n) AS b \nWHERE b.id = 1
+SELECT \n    date, \n    id, \n    name, \n    value\nFROM \n(\n    SELECT \n        date, \n        id, \n        name, \n        value\n    FROM \n    (\n        SELECT \n            date, \n            id, \n            name, \n            value\n        FROM test.test \n        WHERE id = 1\n    ) AS a \n    WHERE id = 1\n) AS b \nWHERE id = 1
 2000-01-01	1	test string 1	1
 SELECT \n    id, \n    date, \n    value\nFROM \n(\n    SELECT \n        id, \n        date, \n        min(value) AS value\n    FROM test.test \n    WHERE id = 1\n    GROUP BY \n        id, \n        date\n) \nWHERE id = 1
 1	2000-01-01	1
@@ -45,11 +45,11 @@ SELECT \n    date, \n    id, \n    name, \n    value, \n    date, \n    name, \n
 2000-01-01	1	test string 1	1	2000-01-01	test string 1	1
 SELECT \n    id, \n    date, \n    name, \n    value\nFROM \n(\n    SELECT toInt8(1) AS id\n) \nANY LEFT JOIN test.test USING (id)\nWHERE value = 1
 1	2000-01-01	test string 1	1
-SELECT b.value\nFROM \n(\n    SELECT toInt8(1) AS id\n) \nANY LEFT JOIN test.test AS b USING (id)\nWHERE value = 1
+SELECT value\nFROM \n(\n    SELECT toInt8(1) AS id\n) \nANY LEFT JOIN test.test AS b USING (id)\nWHERE value = 1
 1
 SELECT \n    date, \n    id, \n    name, \n    value\nFROM \n(\n    SELECT \n        date, \n        id, \n        name, \n        value, \n        date, \n        name, \n        value\n    FROM \n    (\n        SELECT \n            date, \n            id, \n            name, \n            value\n        FROM test.test \n        WHERE id = 1\n    ) \n    ANY LEFT JOIN \n    (\n        SELECT *\n        FROM test.test \n        WHERE id = 1\n    ) USING (id)\n    WHERE id = 1\n) \nWHERE id = 1
 2000-01-01	1	test string 1	1
-SELECT \n    date, \n    id, \n    name, \n    value, \n    `b.date`, \n    `b.name`, \n    `b.value`\nFROM \n(\n    SELECT \n        date, \n        id, \n        name, \n        value\n    FROM test.test \n) \nANY LEFT JOIN \n(\n    SELECT *\n    FROM test.test \n    WHERE id = 1\n) AS b USING (id)\nWHERE b.id = 1
+SELECT \n    date, \n    id, \n    name, \n    value, \n    b.date, \n    b.name, \n    b.value\nFROM \n(\n    SELECT \n        date, \n        id, \n        name, \n        value\n    FROM test.test \n) \nANY LEFT JOIN \n(\n    SELECT *\n    FROM test.test \n    WHERE id = 1\n) AS b USING (id)\nWHERE b.id = 1
 2000-01-01	1	test string 1	1	2000-01-01	test string 1	1
 SELECT \n    id, \n    date, \n    name, \n    value\nFROM \n(\n    SELECT \n        toInt8(1) AS id, \n        toDate(\'2000-01-01\') AS date\n    FROM system.numbers \n    LIMIT 1\n) \nANY LEFT JOIN \n(\n    SELECT *\n    FROM test.test \n    WHERE date = toDate(\'2000-01-01\')\n) AS b USING (date, id)\nWHERE b.date = toDate(\'2000-01-01\')
 1	2000-01-01	test string 1	1

From 72fe0115d1aabebf891719a44afd634121d17461 Mon Sep 17 00:00:00 2001
From: chertus <chertus@gmail.com>
Date: Tue, 5 Mar 2019 16:53:39 +0300
Subject: [PATCH 31/63] move join conversions to InterpreterSelectQuery

---
 .../Interpreters/InterpreterSelectQuery.cpp    | 14 ++++++++++++++
 dbms/src/Interpreters/executeQuery.cpp         | 18 ------------------
 2 files changed, 14 insertions(+), 18 deletions(-)

diff --git a/dbms/src/Interpreters/InterpreterSelectQuery.cpp b/dbms/src/Interpreters/InterpreterSelectQuery.cpp
index f2a76a20d0a..ebbfcf6d133 100644
--- a/dbms/src/Interpreters/InterpreterSelectQuery.cpp
+++ b/dbms/src/Interpreters/InterpreterSelectQuery.cpp
@@ -38,6 +38,8 @@
 #include <Interpreters/convertFieldToType.h>
 #include <Interpreters/ExpressionAnalyzer.h>
 #include <Interpreters/DatabaseAndTableWithAlias.h>
+#include <Interpreters/JoinToSubqueryTransformVisitor.h>
+#include <Interpreters/CrossToInnerJoinVisitor.h>
 
 #include <Storages/MergeTree/MergeTreeWhereOptimizer.h>
 #include <Storages/IStorage.h>
@@ -155,6 +157,18 @@ InterpreterSelectQuery::InterpreterSelectQuery(
         throw Exception("Too deep subqueries. Maximum: " + settings.max_subquery_depth.toString(),
             ErrorCodes::TOO_DEEP_SUBQUERIES);
 
+    if (settings.allow_experimental_multiple_joins_emulation)
+    {
+        JoinToSubqueryTransformVisitor::Data join_to_subs_data;
+        JoinToSubqueryTransformVisitor(join_to_subs_data).visit(query_ptr);
+    }
+
+    if (settings.allow_experimental_cross_to_join_conversion)
+    {
+        CrossToInnerJoinVisitor::Data cross_to_inner;
+        CrossToInnerJoinVisitor(cross_to_inner).visit(query_ptr);
+    }
+
     max_streams = settings.max_threads;
 
     ASTPtr table_expression = extractTableExpression(query, 0);
diff --git a/dbms/src/Interpreters/executeQuery.cpp b/dbms/src/Interpreters/executeQuery.cpp
index a5856fb6173..d8b4ff4ebe0 100644
--- a/dbms/src/Interpreters/executeQuery.cpp
+++ b/dbms/src/Interpreters/executeQuery.cpp
@@ -21,8 +21,6 @@
 #include <Parsers/parseQuery.h>
 #include <Parsers/queryToString.h>
 
-#include <Interpreters/JoinToSubqueryTransformVisitor.h>
-#include <Interpreters/CrossToInnerJoinVisitor.h>
 #include <Interpreters/Quota.h>
 #include <Interpreters/InterpreterFactory.h>
 #include <Interpreters/ProcessList.h>
@@ -196,22 +194,6 @@ static std::tuple<ASTPtr, BlockIO> executeQueryImpl(
         if (!internal)
             logQuery(query.substr(0, settings.log_queries_cut_to_length), context);
 
-        if (!internal && settings.allow_experimental_multiple_joins_emulation)
-        {
-            JoinToSubqueryTransformVisitor::Data join_to_subs_data;
-            JoinToSubqueryTransformVisitor(join_to_subs_data).visit(ast);
-            if (join_to_subs_data.done)
-                logQuery(queryToString(*ast), context);
-        }
-
-        if (!internal && settings.allow_experimental_cross_to_join_conversion)
-        {
-            CrossToInnerJoinVisitor::Data cross_to_inner;
-            CrossToInnerJoinVisitor(cross_to_inner).visit(ast);
-            if (cross_to_inner.done)
-                logQuery(queryToString(*ast), context);
-        }
-
         /// Check the limits.
         checkASTSizeLimits(*ast, settings);
 

From 22f699c8a0a278623142c13d23ba88293d4a4d52 Mon Sep 17 00:00:00 2001
From: chertus <chertus@gmail.com>
Date: Tue, 5 Mar 2019 18:16:59 +0300
Subject: [PATCH 32/63] fix CrossToInnerJoin (empty where crash & where for one
 table wrong result)

---
 dbms/src/Interpreters/CrossToInnerJoinVisitor.cpp        | 9 ++++++---
 .../0_stateless/00826_cross_to_inner_join.reference      | 4 +++-
 .../queries/0_stateless/00826_cross_to_inner_join.sql    | 5 +++++
 3 files changed, 14 insertions(+), 4 deletions(-)

diff --git a/dbms/src/Interpreters/CrossToInnerJoinVisitor.cpp b/dbms/src/Interpreters/CrossToInnerJoinVisitor.cpp
index 43f29046e9b..8c74ddf699a 100644
--- a/dbms/src/Interpreters/CrossToInnerJoinVisitor.cpp
+++ b/dbms/src/Interpreters/CrossToInnerJoinVisitor.cpp
@@ -192,6 +192,9 @@ void CrossToInnerJoinMatcher::visit(ASTSelectQuery & select, ASTPtr & ast, Data
     using CheckExpressionMatcher = OneTypeMatcher<CheckExpressionVisitorData, false>;
     using CheckExpressionVisitor = InDepthNodeVisitor<CheckExpressionMatcher, true>;
 
+    if (!select.where_expression)
+        return;
+
     std::vector<DatabaseAndTableWithAlias> table_names;
     ASTPtr ast_join = getCrossJoin(select, table_names);
     if (!ast_join)
@@ -215,10 +218,10 @@ void CrossToInnerJoinMatcher::visit(ASTSelectQuery & select, ASTPtr & ast, Data
             select.where_expression.reset();
 
         join.children.push_back(join.on_expression);
+
+        ast = ast->clone(); /// rewrite AST in right manner
+        data.done = true;
     }
-
-    ast = ast->clone(); /// rewrite AST in right manner
-    data.done = true;
 }
 
 }
diff --git a/dbms/tests/queries/0_stateless/00826_cross_to_inner_join.reference b/dbms/tests/queries/0_stateless/00826_cross_to_inner_join.reference
index 73c8a9f9ce4..93cdf438a0f 100644
--- a/dbms/tests/queries/0_stateless/00826_cross_to_inner_join.reference
+++ b/dbms/tests/queries/0_stateless/00826_cross_to_inner_join.reference
@@ -1,3 +1,5 @@
+0	0
+0	0
 cross
 1	1	1	1
 1	1	1	2
@@ -67,7 +69,7 @@ Explain ParsedAST (children 1)\n SelectWithUnionQuery (children 1)\n  Expression
 Explain ParsedAST (children 1)\n SelectWithUnionQuery (children 1)\n  ExpressionList (children 1)\n   SelectQuery (children 2)\n    ExpressionList (children 1)\n     Asterisk\n    TablesInSelectQuery (children 2)\n     TablesInSelectQueryElement (children 1)\n      TableExpression (children 1)\n       Identifier t1 (alias x)\n     TablesInSelectQueryElement (children 2)\n      TableJoin (children 1)\n       Function and (children 1)\n        ExpressionList (children 2)\n         Function equals (children 1)\n          ExpressionList (children 2)\n           Identifier x.a\n           Identifier y.a\n         Function equals (children 1)\n          ExpressionList (children 2)\n           Identifier x.b\n           Identifier y.b\n      TableExpression (children 1)\n       Identifier t1 (alias y)\n
 cross one table expr
 Explain ParsedAST (children 1)\n SelectWithUnionQuery (children 1)\n  ExpressionList (children 1)\n   SelectQuery (children 3)\n    ExpressionList (children 1)\n     Asterisk\n    TablesInSelectQuery (children 2)\n     TablesInSelectQueryElement (children 1)\n      TableExpression (children 1)\n       Identifier t1\n     TablesInSelectQueryElement (children 2)\n      TableExpression (children 1)\n       Identifier t2\n      TableJoin\n    Function equals (children 1)\n     ExpressionList (children 2)\n      Identifier t1.a\n      Identifier t1.b\n
-Explain ParsedAST (children 1)\n SelectWithUnionQuery (children 1)\n  ExpressionList (children 1)\n   SelectQuery (children 3)\n    ExpressionList (children 1)\n     Asterisk\n    TablesInSelectQuery (children 2)\n     TablesInSelectQueryElement (children 1)\n      TableExpression (children 1)\n       Identifier t1\n     TablesInSelectQueryElement (children 2)\n      TableJoin\n      TableExpression (children 1)\n       Identifier t2\n    Function equals (children 1)\n     ExpressionList (children 2)\n      Identifier t1.a\n      Identifier t1.b\n
+Explain ParsedAST (children 1)\n SelectWithUnionQuery (children 1)\n  ExpressionList (children 1)\n   SelectQuery (children 3)\n    ExpressionList (children 1)\n     Asterisk\n    TablesInSelectQuery (children 2)\n     TablesInSelectQueryElement (children 1)\n      TableExpression (children 1)\n       Identifier t1\n     TablesInSelectQueryElement (children 2)\n      TableExpression (children 1)\n       Identifier t2\n      TableJoin\n    Function equals (children 1)\n     ExpressionList (children 2)\n      Identifier t1.a\n      Identifier t1.b\n
 cross multiple ands
 Explain ParsedAST (children 1)\n SelectWithUnionQuery (children 1)\n  ExpressionList (children 1)\n   SelectQuery (children 3)\n    ExpressionList (children 1)\n     Asterisk\n    TablesInSelectQuery (children 2)\n     TablesInSelectQueryElement (children 1)\n      TableExpression (children 1)\n       Identifier t1\n     TablesInSelectQueryElement (children 2)\n      TableExpression (children 1)\n       Identifier t2\n      TableJoin\n    Function and (children 1)\n     ExpressionList (children 2)\n      Function equals (children 1)\n       ExpressionList (children 2)\n        Identifier t1.a\n        Identifier t2.a\n      Function equals (children 1)\n       ExpressionList (children 2)\n        Identifier t1.b\n        Identifier t2.b\n
 Explain ParsedAST (children 1)\n SelectWithUnionQuery (children 1)\n  ExpressionList (children 1)\n   SelectQuery (children 2)\n    ExpressionList (children 1)\n     Asterisk\n    TablesInSelectQuery (children 2)\n     TablesInSelectQueryElement (children 1)\n      TableExpression (children 1)\n       Identifier t1\n     TablesInSelectQueryElement (children 2)\n      TableJoin (children 1)\n       Function and (children 1)\n        ExpressionList (children 2)\n         Function equals (children 1)\n          ExpressionList (children 2)\n           Identifier t1.a\n           Identifier t2.a\n         Function equals (children 1)\n          ExpressionList (children 2)\n           Identifier t1.b\n           Identifier t2.b\n      TableExpression (children 1)\n       Identifier t2\n
diff --git a/dbms/tests/queries/0_stateless/00826_cross_to_inner_join.sql b/dbms/tests/queries/0_stateless/00826_cross_to_inner_join.sql
index 26d8d5abd57..218ea1f1e45 100644
--- a/dbms/tests/queries/0_stateless/00826_cross_to_inner_join.sql
+++ b/dbms/tests/queries/0_stateless/00826_cross_to_inner_join.sql
@@ -1,6 +1,11 @@
 SET enable_debug_queries = 1;
 USE test;
 
+set allow_experimental_cross_to_join_conversion = 0;
+select * from system.one cross join system.one;
+set allow_experimental_cross_to_join_conversion = 1;
+select * from system.one cross join system.one;
+
 DROP TABLE IF EXISTS t1;
 DROP TABLE IF EXISTS t2;
 

From 049d49333dc12c5004f9e8a6618f2d850c0f869f Mon Sep 17 00:00:00 2001
From: chertus <chertus@gmail.com>
Date: Tue, 5 Mar 2019 18:21:52 +0300
Subject: [PATCH 33/63] undo last change

---
 .../Interpreters/InterpreterSelectQuery.cpp    | 14 --------------
 dbms/src/Interpreters/executeQuery.cpp         | 18 ++++++++++++++++++
 2 files changed, 18 insertions(+), 14 deletions(-)

diff --git a/dbms/src/Interpreters/InterpreterSelectQuery.cpp b/dbms/src/Interpreters/InterpreterSelectQuery.cpp
index ebbfcf6d133..f2a76a20d0a 100644
--- a/dbms/src/Interpreters/InterpreterSelectQuery.cpp
+++ b/dbms/src/Interpreters/InterpreterSelectQuery.cpp
@@ -38,8 +38,6 @@
 #include <Interpreters/convertFieldToType.h>
 #include <Interpreters/ExpressionAnalyzer.h>
 #include <Interpreters/DatabaseAndTableWithAlias.h>
-#include <Interpreters/JoinToSubqueryTransformVisitor.h>
-#include <Interpreters/CrossToInnerJoinVisitor.h>
 
 #include <Storages/MergeTree/MergeTreeWhereOptimizer.h>
 #include <Storages/IStorage.h>
@@ -157,18 +155,6 @@ InterpreterSelectQuery::InterpreterSelectQuery(
         throw Exception("Too deep subqueries. Maximum: " + settings.max_subquery_depth.toString(),
             ErrorCodes::TOO_DEEP_SUBQUERIES);
 
-    if (settings.allow_experimental_multiple_joins_emulation)
-    {
-        JoinToSubqueryTransformVisitor::Data join_to_subs_data;
-        JoinToSubqueryTransformVisitor(join_to_subs_data).visit(query_ptr);
-    }
-
-    if (settings.allow_experimental_cross_to_join_conversion)
-    {
-        CrossToInnerJoinVisitor::Data cross_to_inner;
-        CrossToInnerJoinVisitor(cross_to_inner).visit(query_ptr);
-    }
-
     max_streams = settings.max_threads;
 
     ASTPtr table_expression = extractTableExpression(query, 0);
diff --git a/dbms/src/Interpreters/executeQuery.cpp b/dbms/src/Interpreters/executeQuery.cpp
index d8b4ff4ebe0..a5856fb6173 100644
--- a/dbms/src/Interpreters/executeQuery.cpp
+++ b/dbms/src/Interpreters/executeQuery.cpp
@@ -21,6 +21,8 @@
 #include <Parsers/parseQuery.h>
 #include <Parsers/queryToString.h>
 
+#include <Interpreters/JoinToSubqueryTransformVisitor.h>
+#include <Interpreters/CrossToInnerJoinVisitor.h>
 #include <Interpreters/Quota.h>
 #include <Interpreters/InterpreterFactory.h>
 #include <Interpreters/ProcessList.h>
@@ -194,6 +196,22 @@ static std::tuple<ASTPtr, BlockIO> executeQueryImpl(
         if (!internal)
             logQuery(query.substr(0, settings.log_queries_cut_to_length), context);
 
+        if (!internal && settings.allow_experimental_multiple_joins_emulation)
+        {
+            JoinToSubqueryTransformVisitor::Data join_to_subs_data;
+            JoinToSubqueryTransformVisitor(join_to_subs_data).visit(ast);
+            if (join_to_subs_data.done)
+                logQuery(queryToString(*ast), context);
+        }
+
+        if (!internal && settings.allow_experimental_cross_to_join_conversion)
+        {
+            CrossToInnerJoinVisitor::Data cross_to_inner;
+            CrossToInnerJoinVisitor(cross_to_inner).visit(ast);
+            if (cross_to_inner.done)
+                logQuery(queryToString(*ast), context);
+        }
+
         /// Check the limits.
         checkASTSizeLimits(*ast, settings);
 

From 4f80afb158575480c196af057d49e80ba1f05108 Mon Sep 17 00:00:00 2001
From: chertus <chertus@gmail.com>
Date: Tue, 5 Mar 2019 19:34:10 +0300
Subject: [PATCH 34/63] fix gcc build

---
 dbms/src/Interpreters/TranslateQualifiedNamesVisitor.cpp | 3 ---
 1 file changed, 3 deletions(-)

diff --git a/dbms/src/Interpreters/TranslateQualifiedNamesVisitor.cpp b/dbms/src/Interpreters/TranslateQualifiedNamesVisitor.cpp
index a0b5aed0af3..3d8a67ae766 100644
--- a/dbms/src/Interpreters/TranslateQualifiedNamesVisitor.cpp
+++ b/dbms/src/Interpreters/TranslateQualifiedNamesVisitor.cpp
@@ -218,7 +218,6 @@ void TranslateQualifiedNamesMatcher::visit(ASTExpressionList & node, const ASTPt
         {
             DatabaseAndTableWithAlias ident_db_and_name(qualified_asterisk->children[0]);
 
-            bool first_table = true;
             for (const auto & [table, table_columns] : tables_with_columns)
             {
                 if (ident_db_and_name.satisfies(table, true))
@@ -230,8 +229,6 @@ void TranslateQualifiedNamesMatcher::visit(ASTExpressionList & node, const ASTPt
                     }
                     break;
                 }
-
-                first_table = false;
             }
         }
         else

From 3bcab129661120869df892851394a1a1af135be2 Mon Sep 17 00:00:00 2001
From: Nikolai Kochetov <nik-kochetov@yandex-team.ru>
Date: Tue, 5 Mar 2019 19:52:29 +0300
Subject: [PATCH 35/63] Fix test.

---
 dbms/src/Storages/MergeTree/MergeTreeSetSkippingIndex.cpp | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/dbms/src/Storages/MergeTree/MergeTreeSetSkippingIndex.cpp b/dbms/src/Storages/MergeTree/MergeTreeSetSkippingIndex.cpp
index 8c889fbdea7..227c6bfd7f7 100644
--- a/dbms/src/Storages/MergeTree/MergeTreeSetSkippingIndex.cpp
+++ b/dbms/src/Storages/MergeTree/MergeTreeSetSkippingIndex.cpp
@@ -18,7 +18,7 @@ namespace ErrorCodes
 }
 
 /// 0b11 -- can be true and false at the same time
-const Field UNKNOWN_FIELD(3);
+const Field UNKNOWN_FIELD(3u);
 
 
 MergeTreeSetIndexGranule::MergeTreeSetIndexGranule(const MergeTreeSetSkippingIndex & index)

From fae0b054f91bd1c69479fa4afb621cbf9242b7f7 Mon Sep 17 00:00:00 2001
From: proller <proller@github.com>
Date: Tue, 5 Mar 2019 20:51:04 +0300
Subject: [PATCH 36/63] Arcadia fix

---
 dbms/src/DataTypes/IDataType.h | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/dbms/src/DataTypes/IDataType.h b/dbms/src/DataTypes/IDataType.h
index c1c621eb19e..aa253fbdc08 100644
--- a/dbms/src/DataTypes/IDataType.h
+++ b/dbms/src/DataTypes/IDataType.h
@@ -262,8 +262,10 @@ protected:
 
     /** Text serialization with escaping but without quoting.
       */
+public: // used somewhere in arcadia
     virtual void serializeTextEscaped(const IColumn & column, size_t row_num, WriteBuffer & ostr, const FormatSettings &) const = 0;
 
+protected:
     virtual void deserializeTextEscaped(IColumn & column, ReadBuffer & istr, const FormatSettings &) const = 0;
 
     /** Text serialization as a literal that may be inserted into a query.

From ddbada664602c21cfe17b1e0cfb9d98b3b42303c Mon Sep 17 00:00:00 2001
From: Alexey Milovidov <milovidov@yandex-team.ru>
Date: Tue, 5 Mar 2019 23:34:37 +0300
Subject: [PATCH 37/63] Fixed build #4583

---
 dbms/src/Dictionaries/readInvalidateQuery.h | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/dbms/src/Dictionaries/readInvalidateQuery.h b/dbms/src/Dictionaries/readInvalidateQuery.h
index a906c8f887f..48fbfa03629 100644
--- a/dbms/src/Dictionaries/readInvalidateQuery.h
+++ b/dbms/src/Dictionaries/readInvalidateQuery.h
@@ -1,11 +1,11 @@
 #pragma once
 #include <string>
 
-class IBlockInputStream;
-
 namespace DB
 {
 
+class IBlockInputStream;
+
 /// Using in MySQLDictionarySource and XDBCDictionarySource after processing invalidate_query.
 std::string readInvalidateQuery(IBlockInputStream & block_input_stream);
 

From 899b2548c77ba527df51c79306d6d81918a6efe0 Mon Sep 17 00:00:00 2001
From: Alexey Milovidov <milovidov@yandex-team.ru>
Date: Tue, 5 Mar 2019 23:49:21 +0300
Subject: [PATCH 38/63] Added comment #4572

---
 dbms/src/Common/ThreadPool.cpp | 1 +
 1 file changed, 1 insertion(+)

diff --git a/dbms/src/Common/ThreadPool.cpp b/dbms/src/Common/ThreadPool.cpp
index a985e0486be..6ed350240c6 100644
--- a/dbms/src/Common/ThreadPool.cpp
+++ b/dbms/src/Common/ThreadPool.cpp
@@ -157,6 +157,7 @@ void ThreadPoolImpl<Thread>::worker(typename std::list<Thread>::iterator thread_
             }
             else
             {
+                /// shutdown is true, simply finish the thread.
                 return;
             }
         }

From 224839a58a1df77a937e3e234e3ecae344e6aef5 Mon Sep 17 00:00:00 2001
From: Alexey Milovidov <milovidov@yandex-team.ru>
Date: Wed, 6 Mar 2019 00:53:16 +0300
Subject: [PATCH 39/63] Attempt to read the code #4475

---
 dbms/src/DataTypes/DataTypeArray.cpp          |  9 ++
 dbms/src/DataTypes/DataTypeArray.h            |  3 +
 .../Functions/arrayEnumerateDenseRanked.cpp   |  1 +
 dbms/src/Functions/arrayEnumerateRanked.cpp   | 88 ++++++++-----------
 dbms/src/Functions/arrayEnumerateRanked.h     |  6 +-
 5 files changed, 53 insertions(+), 54 deletions(-)

diff --git a/dbms/src/DataTypes/DataTypeArray.cpp b/dbms/src/DataTypes/DataTypeArray.cpp
index c1b19d506fe..82de731f4ad 100644
--- a/dbms/src/DataTypes/DataTypeArray.cpp
+++ b/dbms/src/DataTypes/DataTypeArray.cpp
@@ -498,6 +498,15 @@ bool DataTypeArray::equals(const IDataType & rhs) const
 }
 
 
+size_t DataTypeArray::getNumberOfDimensions() const
+{
+    const DataTypeArray * nested_array = typeid_cast<const DataTypeArray *>(nested.get());
+    if (!nested_array)
+        return 1;
+    return 1 + nested_array->getNumberOfDimensions();   /// Every modern C++ compiler optimizes tail recursion.
+}
+
+
 static DataTypePtr create(const ASTPtr & arguments)
 {
     if (!arguments || arguments->children.size() != 1)
diff --git a/dbms/src/DataTypes/DataTypeArray.h b/dbms/src/DataTypes/DataTypeArray.h
index 58ea41236f9..1451f27dfbe 100644
--- a/dbms/src/DataTypes/DataTypeArray.h
+++ b/dbms/src/DataTypes/DataTypeArray.h
@@ -112,6 +112,9 @@ public:
     }
 
     const DataTypePtr & getNestedType() const { return nested; }
+
+    /// 1 for plain array, 2 for array of arrays and so on.
+    size_t getNumberOfDimensions() const;
 };
 
 }
diff --git a/dbms/src/Functions/arrayEnumerateDenseRanked.cpp b/dbms/src/Functions/arrayEnumerateDenseRanked.cpp
index 05e597e3e73..cc81e35cbe7 100644
--- a/dbms/src/Functions/arrayEnumerateDenseRanked.cpp
+++ b/dbms/src/Functions/arrayEnumerateDenseRanked.cpp
@@ -4,6 +4,7 @@
 
 namespace DB
 {
+
 class FunctionArrayEnumerateDenseRanked : public FunctionArrayEnumerateRankedExtended<FunctionArrayEnumerateDenseRanked>
 {
     using Base = FunctionArrayEnumerateRankedExtended<FunctionArrayEnumerateDenseRanked>;
diff --git a/dbms/src/Functions/arrayEnumerateRanked.cpp b/dbms/src/Functions/arrayEnumerateRanked.cpp
index ff95344dd57..8341bae97bc 100644
--- a/dbms/src/Functions/arrayEnumerateRanked.cpp
+++ b/dbms/src/Functions/arrayEnumerateRanked.cpp
@@ -1,61 +1,53 @@
+#include <algorithm>
+#include <Columns/ColumnConst.h>
 #include "arrayEnumerateRanked.h"
 
+
 namespace DB
 {
+
 ArraysDepths getArraysDepths(const ColumnsWithTypeAndName & arguments)
 {
     const size_t num_arguments = arguments.size();
+
     DepthType clear_depth = 1;
-    DepthType max_array_depth = 0;
     DepthTypes depths;
 
+    /// function signature is the following:
+    /// f(c0, arr1, c1, arr2, c2, ...)
+    ///
+    /// c0 is something called "clear_depth" here.
+    /// cN... - how deep to look into the corresponding arrN, (called "depths" here)
+    ///   may be omitted - then it means "look at the full depth".
+
     size_t array_num = 0;
-    DepthType last_array_depth = 0;
+    DepthType prev_array_depth = 0;
     for (size_t i = 0; i < num_arguments; ++i)
     {
-        const auto type = arguments[i].type;
+        const DataTypePtr & type = arguments[i].type;
+        const DataTypeArray * type_array = typeid_cast<const DataTypeArray *>(type.get());
 
-        if (isArray(type))
+        if (type_array)
         {
-            if (depths.size() < array_num && last_array_depth)
+            if (depths.size() < array_num && prev_array_depth)
             {
-                depths.emplace_back(last_array_depth);
-                last_array_depth = 0;
+                depths.emplace_back(prev_array_depth);
+                prev_array_depth = 0;
             }
 
-            DepthType depth = 0;
-            auto sub_type = type;
-            do
-            {
-                auto sub_type_array = typeid_cast<const DataTypeArray *>(sub_type.get());
-                if (!sub_type_array)
-                    break;
-                sub_type = sub_type_array->getNestedType();
-                ++depth;
-            } while (isArray(sub_type));
-            last_array_depth = depth;
+            prev_array_depth = type_array->getNumberOfDimensions();
             ++array_num;
         }
-
-        if (!arguments[i].column)
-            continue;
-
-        const IColumn * non_const = nullptr;
-        if (auto const_array_column = typeid_cast<const ColumnConst *>(arguments[i].column.get()))
-            non_const = const_array_column->getDataColumnPtr().get();
-        const auto array = typeid_cast<const ColumnArray *>(non_const ? non_const : arguments[i].column.get());
-
-        if (!array)
+        else
         {
             const auto & depth_column = arguments[i].column;
 
             if (depth_column && depth_column->isColumnConst())
             {
-                auto value = depth_column->getUInt(0);
+                UInt64 value = static_cast<const ColumnConst &>(*depth_column).getValue<UInt64>();
                 if (!value)
-                    throw Exception(
-                        "Arguments for function arrayEnumerateUniqRanked/arrayEnumerateDenseRanked incorrect: depth ("
-                            + std::to_string(value) + ") cant be 0.",
+                    throw Exception("Incorrect arguments for function arrayEnumerateUniqRanked or arrayEnumerateDenseRanked: depth ("
+                        + std::to_string(value) + ") cannot be 0.",
                         ErrorCodes::BAD_ARGUMENTS);
 
                 if (i == 0)
@@ -65,38 +57,30 @@ ArraysDepths getArraysDepths(const ColumnsWithTypeAndName & arguments)
                 else
                 {
                     if (depths.size() >= array_num)
-                    {
-                        throw Exception(
-                            "Arguments for function arrayEnumerateUniqRanked/arrayEnumerateDenseRanked incorrect: depth ("
-                                + std::to_string(value) + ") for missing array.",
+                        throw Exception("Incorrect arguments for function arrayEnumerateUniqRanked or arrayEnumerateDenseRanked: depth ("
+                            + std::to_string(value) + ") for missing array.",
                             ErrorCodes::BAD_ARGUMENTS);
-                    }
+
                     depths.emplace_back(value);
                 }
             }
         }
     }
+
     if (depths.size() < array_num)
-    {
-        depths.emplace_back(last_array_depth);
-    }
-
-
-    for (auto & depth : depths)
-    {
-        if (max_array_depth < depth)
-            max_array_depth = depth;
-    }
+        depths.emplace_back(prev_array_depth);
 
     if (depths.empty())
-        throw Exception(
-            "Arguments for function arrayEnumerateUniqRanked/arrayEnumerateDenseRanked incorrect: At least one array should be passed.",
+        throw Exception("Incorrect arguments for function arrayEnumerateUniqRanked or arrayEnumerateDenseRanked: at least one array should be passed.",
             ErrorCodes::BAD_ARGUMENTS);
 
+    DepthType max_array_depth = 0;
+    for (auto depth : depths)
+        max_array_depth = std::max(depth, max_array_depth);
+
     if (clear_depth > max_array_depth)
-        throw Exception(
-            "Arguments for function arrayEnumerateUniqRanked/arrayEnumerateDenseRanked incorrect: clear_depth ("
-                + std::to_string(clear_depth) + ") cant be larger than max_array_depth (" + std::to_string(max_array_depth) + ").",
+        throw Exception("Incorrect arguments for function arrayEnumerateUniqRanked or arrayEnumerateDenseRanked: clear_depth ("
+            + std::to_string(clear_depth) + ") cant be larger than max_array_depth (" + std::to_string(max_array_depth) + ").",
             ErrorCodes::BAD_ARGUMENTS);
 
     return {clear_depth, depths, max_array_depth};
diff --git a/dbms/src/Functions/arrayEnumerateRanked.h b/dbms/src/Functions/arrayEnumerateRanked.h
index 8e87d38f025..1fd6906a8db 100644
--- a/dbms/src/Functions/arrayEnumerateRanked.h
+++ b/dbms/src/Functions/arrayEnumerateRanked.h
@@ -33,6 +33,7 @@ struct ArraysDepths
     DepthTypes depths;
     DepthType max_array_depth;
 };
+
 /// Return depth info about passed arrays
 ArraysDepths getArraysDepths(const ColumnsWithTypeAndName & arguments);
 
@@ -55,7 +56,7 @@ public:
                     + ", should be at least 1.",
                 ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH);
 
-        const auto & arrays_depths = getArraysDepths(arguments);
+        const ArraysDepths arrays_depths = getArraysDepths(arguments);
 
         DataTypePtr type = std::make_shared<DataTypeUInt32>();
         for (DepthType i = 0; i < arrays_depths.max_array_depth; ++i)
@@ -113,7 +114,8 @@ void FunctionArrayEnumerateRankedExtended<Derived>::executeImpl(
 
     const auto & arrays_depths = getArraysDepths(args);
 
-    auto get_array_column = [&](const auto & column) -> const DB::ColumnArray * {
+    auto get_array_column = [&](const auto & column) -> const DB::ColumnArray *
+    {
         const ColumnArray * array = checkAndGetColumn<ColumnArray>(column);
         if (!array)
         {

From b5b3f52f0f6cf865e3c91f0ac02f75f4d3f30589 Mon Sep 17 00:00:00 2001
From: Alexey Milovidov <milovidov@yandex-team.ru>
Date: Wed, 6 Mar 2019 01:43:18 +0300
Subject: [PATCH 40/63] Added documentation

---
 dbms/src/Functions/arrayEnumerateRanked.h | 53 ++++++++++++++++++++++-
 1 file changed, 52 insertions(+), 1 deletion(-)

diff --git a/dbms/src/Functions/arrayEnumerateRanked.h b/dbms/src/Functions/arrayEnumerateRanked.h
index 1fd6906a8db..6e825901260 100644
--- a/dbms/src/Functions/arrayEnumerateRanked.h
+++ b/dbms/src/Functions/arrayEnumerateRanked.h
@@ -12,6 +12,47 @@
 #include <Common/HashTable/ClearableHashMap.h>
 
 
+/** The function will enumerate distinct values of the passed multidimensional arrays looking inside at the specified depths.
+  * This is a very unusual function made as a special order for Yandex.Metrica.
+  *
+  * arrayEnumerateUniqRanked(['hello', 'world', 'hello']) = [1, 1, 2]
+  * - it returns a similarly structured array containing, for each element, the ordinal number of its occurrence.
+  *
+  * arrayEnumerateUniqRanked([['hello', 'world'], ['hello'], ['hello']], 1) = [1, 1, 2]
+  * - look at the depth 1, as specified explicitly. Elements are ['hello', 'world'], ['hello'], ['hello'].
+  *
+  * arrayEnumerateUniqRanked([['hello', 'world'], ['hello'], ['hello']]) = [[1,1],[2],[3]]
+  * - look at the maximum depth (2) by default. Return a similarly structured array.
+  * arrayEnumerateUniqRanked([['hello', 'world'], ['hello'], ['hello']], 2) = [[1,1],[2],[3]]
+  * - the same result with the depth 2 specified explicitly.
+  *
+  * We may pass multiple array arguments. Their elements will be processed as zipped to tuple.
+  *
+  * arrayEnumerateUniqRanked(['hello', 'hello', 'world', 'world'], ['a', 'b', 'b', 'b']) = [1, 1, 1, 2]
+  *
+  * We may provide arrays of different depths to look at different arguments.
+  *
+  * arrayEnumerateUniqRanked([['hello', 'world'], ['hello'], ['world'], ['world']], ['a', 'b', 'b', 'b']) = [[1,1],[1],[1],[2]]
+  * arrayEnumerateUniqRanked([['hello', 'world'], ['hello'], ['world'], ['world']], 1, ['a', 'b', 'b', 'b'], 1) = [1, 1, 1, 2]
+  *
+  * When depths are different, we process less deep arrays as promoted to deeper arrays of similar structure by duplicating elements.
+  *
+  * arrayEnumerateUniqRanked(
+  *     [['hello', 'world'], ['hello'], ['world'], ['world']],
+  *     ['a', 'b', 'b', 'b'])
+  * = arrayEnumerateUniqRanked(
+  *     [['hello', 'world'], ['hello'], ['world'], ['world']],
+  *     [['a', 'a'], ['b'], ['b'], ['b']])
+  *
+  * Finally, we can provide extra first argument named "clear_depth" (it can be considered as 1 by default).
+  * Array elements at the clear_depth will be enumerated as separate elements (enumeration counter is reset for each new element).
+  *
+  * SELECT arrayEnumerateUniqRanked(1, [['hello', 'world'], ['hello'], ['world'], ['world']]) = [[1,1],[2],[2],[3]]
+  * SELECT arrayEnumerateUniqRanked(2, [['hello', 'world'], ['hello'], ['world'], ['world']]) = [[1,1],[1],[1],[1]]
+  * SELECT arrayEnumerateUniqRanked(1, [['hello', 'world', 'hello'], ['hello'], ['world'], ['world']]) = [[1,1,2],[3],[2],[3]]
+  * SELECT arrayEnumerateUniqRanked(2, [['hello', 'world', 'hello'], ['hello'], ['world'], ['world']]) = [[1,1,2],[1],[1],[1]]
+  */
+
 namespace DB
 {
 namespace ErrorCodes
@@ -27,10 +68,18 @@ class FunctionArrayEnumerateDenseRanked;
 
 using DepthType = uint32_t;
 using DepthTypes = std::vector<DepthType>;
+
 struct ArraysDepths
 {
+    /// Enumerate elements at the specified level separately.
     DepthType clear_depth;
+
+    /// Effective depth is the array depth by default or lower value, specified as a constant argument following the array.
+    /// f([[1, 2], [3]]) - effective depth is 2.
+    /// f([[1, 2], [3]], 1) - effective depth is 1.
     DepthTypes depths;
+
+    /// Maximum effective depth.
     DepthType max_array_depth;
 };
 
@@ -58,6 +107,8 @@ public:
 
         const ArraysDepths arrays_depths = getArraysDepths(arguments);
 
+        /// The return type is an array of UInt32 nested to the maximum effective depth of the arguments.
+
         DataTypePtr type = std::make_shared<DataTypeUInt32>();
         for (DepthType i = 0; i < arrays_depths.max_array_depth; ++i)
             type = std::make_shared<DataTypeArray>(type);
@@ -112,7 +163,7 @@ void FunctionArrayEnumerateRankedExtended<Derived>::executeImpl(
     for (size_t i = 0; i < arguments.size(); ++i)
         args.emplace_back(block.getByPosition(arguments[i]));
 
-    const auto & arrays_depths = getArraysDepths(args);
+    const ArraysDepths arrays_depths = getArraysDepths(args);
 
     auto get_array_column = [&](const auto & column) -> const DB::ColumnArray *
     {

From 5a644f0052c5568aa8bb99a30335d202fef15558 Mon Sep 17 00:00:00 2001
From: Alexey Milovidov <milovidov@yandex-team.ru>
Date: Wed, 6 Mar 2019 02:05:47 +0300
Subject: [PATCH 41/63] Miscellaneous

---
 dbms/src/Functions/arrayEnumerateRanked.h | 31 +++++++++++++----------
 1 file changed, 18 insertions(+), 13 deletions(-)

diff --git a/dbms/src/Functions/arrayEnumerateRanked.h b/dbms/src/Functions/arrayEnumerateRanked.h
index 6e825901260..9056a5cff98 100644
--- a/dbms/src/Functions/arrayEnumerateRanked.h
+++ b/dbms/src/Functions/arrayEnumerateRanked.h
@@ -131,15 +131,15 @@ private:
 
 
 /// Hash a set of keys into a UInt128 value.
-static inline UInt128 ALWAYS_INLINE hash128depths(const std::vector<size_t> & indexes, const ColumnRawPtrs & key_columns)
+static inline UInt128 ALWAYS_INLINE hash128depths(const std::vector<size_t> & indices, const ColumnRawPtrs & key_columns)
 {
     UInt128 key;
     SipHash hash;
 
     for (size_t j = 0, keys_size = key_columns.size(); j < keys_size; ++j)
     {
-        // Debug: const auto & field = (*key_columns[j])[indexes[j]]; DUMP(j, indexes[j], field);
-        key_columns[j]->updateHashWithValue(indexes[j], hash);
+        // Debug: const auto & field = (*key_columns[j])[indices[j]]; DUMP(j, indices[j], field);
+        key_columns[j]->updateHashWithValue(indices[j], hash);
     }
 
     hash.get128(key.low, key.high);
@@ -165,6 +165,7 @@ void FunctionArrayEnumerateRankedExtended<Derived>::executeImpl(
 
     const ArraysDepths arrays_depths = getArraysDepths(args);
 
+    /// If the column is Array - return it. If the const Array - materialize it, keep ownership and return.
     auto get_array_column = [&](const auto & column) -> const DB::ColumnArray *
     {
         const ColumnArray * array = checkAndGetColumn<ColumnArray>(column);
@@ -199,7 +200,7 @@ void FunctionArrayEnumerateRankedExtended<Derived>::executeImpl(
             if (*offsets_by_depth[0] != array->getOffsets())
             {
                 throw Exception(
-                    "Lengths and depths of all arrays passed to " + getName() + " must be equal.",
+                    "Lengths and effective depths of all arrays passed to " + getName() + " must be equal.",
                     ErrorCodes::SIZES_OF_ARRAYS_DOESNT_MATCH);
             }
         }
@@ -223,7 +224,7 @@ void FunctionArrayEnumerateRankedExtended<Derived>::executeImpl(
                 if (*offsets_by_depth[col_depth] != array->getOffsets())
                 {
                     throw Exception(
-                        "Lengths and depths of all arrays passed to " + getName() + " must be equal.",
+                        "Lengths and effective depths of all arrays passed to " + getName() + " must be equal.",
                         ErrorCodes::SIZES_OF_ARRAYS_DOESNT_MATCH);
                 }
             }
@@ -233,7 +234,7 @@ void FunctionArrayEnumerateRankedExtended<Derived>::executeImpl(
         {
             throw Exception(
                 getName() + ": Passed array number " + std::to_string(array_num) + " depth ("
-                    + std::to_string(arrays_depths.depths[array_num]) + ") more than actual array depth (" + std::to_string(col_depth)
+                    + std::to_string(arrays_depths.depths[array_num]) + ") is more than the actual array depth (" + std::to_string(col_depth)
                     + ").",
                 ErrorCodes::SIZES_OF_ARRAYS_DOESNT_MATCH);
         }
@@ -304,6 +305,7 @@ void FunctionArrayEnumerateRankedExtended<Derived>::executeMethodImpl(
     const ArraysDepths & arrays_depths,
     ColumnUInt32::Container & res_values)
 {
+    /// Offsets at the depth we want to look.
     const size_t current_offset_depth = arrays_depths.max_array_depth;
     const auto & offsets = *offsets_by_depth[current_offset_depth - 1];
 
@@ -317,22 +319,24 @@ void FunctionArrayEnumerateRankedExtended<Derived>::executeMethodImpl(
         HashTableAllocatorWithStackMemory<(1ULL << INITIAL_SIZE_DEGREE) * sizeof(UInt128)>>;
     Map indices;
 
-    std::vector<size_t> indexes_by_depth(arrays_depths.max_array_depth);
+    std::vector<size_t> indices_by_depth(arrays_depths.max_array_depth);
     std::vector<size_t> current_offset_n_by_depth(arrays_depths.max_array_depth);
 
     UInt32 rank = 0;
 
-    std::vector<size_t> columns_indexes(columns.size());
+    std::vector<size_t> columns_indices(columns.size());
+
     for (size_t off : offsets)
     {
         bool want_clear = false;
 
+        /// For each element at the depth we want to look.
         for (size_t j = prev_off; j < off; ++j)
         {
             for (size_t col_n = 0; col_n < columns.size(); ++col_n)
-                columns_indexes[col_n] = indexes_by_depth[arrays_depths.depths[col_n] - 1];
+                columns_indices[col_n] = indices_by_depth[arrays_depths.depths[col_n] - 1];
 
-            auto hash = hash128depths(columns_indexes, columns);
+            auto hash = hash128depths(columns_indices, columns);
 
             if constexpr (std::is_same_v<Derived, FunctionArrayEnumerateUniqRanked>)
             {
@@ -350,13 +354,13 @@ void FunctionArrayEnumerateRankedExtended<Derived>::executeMethodImpl(
                 res_values[j] = idx;
             }
 
-            // Debug: DUMP(off, prev_off, j, columns_indexes, res_values[j], columns);
+            // Debug: DUMP(off, prev_off, j, columns_indices, res_values[j], columns);
 
             for (int depth = current_offset_depth - 1; depth >= 0; --depth)
             {
-                ++indexes_by_depth[depth];
+                ++indices_by_depth[depth];
 
-                if (indexes_by_depth[depth] == (*offsets_by_depth[depth])[current_offset_n_by_depth[depth]])
+                if (indices_by_depth[depth] == (*offsets_by_depth[depth])[current_offset_n_by_depth[depth]])
                 {
                     if (static_cast<int>(arrays_depths.clear_depth) == depth + 1)
                         want_clear = true;
@@ -368,6 +372,7 @@ void FunctionArrayEnumerateRankedExtended<Derived>::executeMethodImpl(
                 }
             }
         }
+
         if (want_clear)
         {
             want_clear = false;

From dd40956d8b0b233c2c0de7c7be543fc86116a5bc Mon Sep 17 00:00:00 2001
From: Alexey Milovidov <milovidov@yandex-team.ru>
Date: Wed, 6 Mar 2019 02:31:34 +0300
Subject: [PATCH 42/63] Fixed test

---
 dbms/tests/queries/0_stateless/00909_arrayEnumerateUniq.sql | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/dbms/tests/queries/0_stateless/00909_arrayEnumerateUniq.sql b/dbms/tests/queries/0_stateless/00909_arrayEnumerateUniq.sql
index 0682da084c1..0557f4adf85 100644
--- a/dbms/tests/queries/0_stateless/00909_arrayEnumerateUniq.sql
+++ b/dbms/tests/queries/0_stateless/00909_arrayEnumerateUniq.sql
@@ -170,5 +170,5 @@ SELECT arrayEnumerateUniqRanked([1,2], 1, 2); -- { serverError 36 }
 SELECT arrayEnumerateUniqRanked([1,2], 1, 3, 4, 5); -- { serverError 36 }
 SELECT arrayEnumerateUniqRanked([1,2], 1, 3, [4], 5); -- { serverError 36 }
 SELECT arrayEnumerateDenseRanked([[[[[[[[[[42]]]]]]]]]]);
-SELECT arrayEnumerateUniqRanked('wat', [1,2]); -- { serverError 48 }
-SELECT arrayEnumerateUniqRanked(1, [1,2], 'boom'); -- { serverError 48 }
+SELECT arrayEnumerateUniqRanked('wat', [1,2]); -- { serverError 170 }
+SELECT arrayEnumerateUniqRanked(1, [1,2], 'boom'); -- { serverError 170 }

From ffc9fbf769492c4f10e43722326060d401ba0981 Mon Sep 17 00:00:00 2001
From: proller <proller@users.noreply.github.com>
Date: Wed, 6 Mar 2019 02:53:35 +0300
Subject: [PATCH 43/63]  Build fixes (#4600)

* Add Y_IGNORE

* Build fixes
---
 dbms/src/Formats/ProtobufWriter.h | 46 +++++++++++++++----------------
 1 file changed, 23 insertions(+), 23 deletions(-)

diff --git a/dbms/src/Formats/ProtobufWriter.h b/dbms/src/Formats/ProtobufWriter.h
index aaa9b9a2f9b..aba3a2b2dc6 100644
--- a/dbms/src/Formats/ProtobufWriter.h
+++ b/dbms/src/Formats/ProtobufWriter.h
@@ -238,29 +238,29 @@ using ConstAggregateDataPtr = const char *;
 class ProtobufWriter
 {
 public:
-    bool writeNumber(Int8 value) { return false; }
-    bool writeNumber(UInt8 value) { return false; }
-    bool writeNumber(Int16 value) { return false; }
-    bool writeNumber(UInt16 value) { return false; }
-    bool writeNumber(Int32 value) { return false; }
-    bool writeNumber(UInt32 value) { return false; }
-    bool writeNumber(Int64 value) { return false; }
-    bool writeNumber(UInt64 value) { return false; }
-    bool writeNumber(UInt128 value) { return false; }
-    bool writeNumber(Float32 value) { return false; }
-    bool writeNumber(Float64 value) { return false; }
-    bool writeString(const StringRef & value) { return false; }
-    void prepareEnumMapping(const std::vector<std::pair<std::string, Int8>> & name_value_pairs) {}
-    void prepareEnumMapping(const std::vector<std::pair<std::string, Int16>> & name_value_pairs) {}
-    bool writeEnum(Int8 value) { return false; }
-    bool writeEnum(Int16 value) { return false; }
-    bool writeUUID(const UUID & value) { return false; }
-    bool writeDate(DayNum date) { return false; }
-    bool writeDateTime(time_t tm) { return false; }
-    bool writeDecimal(Decimal32 decimal, UInt32 scale) { return false; }
-    bool writeDecimal(Decimal64 decimal, UInt32 scale) { return false; }
-    bool writeDecimal(const Decimal128 & decimal, UInt32 scale) { return false; }
-    bool writeAggregateFunction(const AggregateFunctionPtr & function, ConstAggregateDataPtr place) { return false; }
+    bool writeNumber(Int8 /* value */) { return false; }
+    bool writeNumber(UInt8 /* value */) { return false; }
+    bool writeNumber(Int16 /* value */) { return false; }
+    bool writeNumber(UInt16 /* value */) { return false; }
+    bool writeNumber(Int32 /* value */) { return false; }
+    bool writeNumber(UInt32 /* value */) { return false; }
+    bool writeNumber(Int64 /* value */) { return false; }
+    bool writeNumber(UInt64 /* value */) { return false; }
+    bool writeNumber(UInt128 /* value */) { return false; }
+    bool writeNumber(Float32 /* value */) { return false; }
+    bool writeNumber(Float64 /* value */) { return false; }
+    bool writeString(const StringRef & /* value */) { return false; }
+    void prepareEnumMapping(const std::vector<std::pair<std::string, Int8>> & /* name_value_pairs */) {}
+    void prepareEnumMapping(const std::vector<std::pair<std::string, Int16>> & /* name_value_pairs */) {}
+    bool writeEnum(Int8 /* value */) { return false; }
+    bool writeEnum(Int16 /* value */) { return false; }
+    bool writeUUID(const UUID & /* value */) { return false; }
+    bool writeDate(DayNum /* date */) { return false; }
+    bool writeDateTime(time_t /* tm */) { return false; }
+    bool writeDecimal(Decimal32 /* decimal */, UInt32 /* scale */) { return false; }
+    bool writeDecimal(Decimal64 /* decimal */, UInt32 /* scale */) { return false; }
+    bool writeDecimal(const Decimal128 & /* decimal */, UInt32 /* scale */) { return false; }
+    bool writeAggregateFunction(const AggregateFunctionPtr & /* function */, ConstAggregateDataPtr /* place */) { return false; }
 };
 
 }

From 2e6dde45b4ca812118ab1f8a6f3e50a64ddecae9 Mon Sep 17 00:00:00 2001
From: alexey-milovidov <milovidov@yandex-team.ru>
Date: Wed, 6 Mar 2019 03:09:49 +0300
Subject: [PATCH 44/63] Update GraphiteRollupSortedBlockInputStream.cpp

---
 .../GraphiteRollupSortedBlockInputStream.cpp  | 75 +++++++++----------
 1 file changed, 37 insertions(+), 38 deletions(-)

diff --git a/dbms/src/DataStreams/GraphiteRollupSortedBlockInputStream.cpp b/dbms/src/DataStreams/GraphiteRollupSortedBlockInputStream.cpp
index 6c1983568bb..fb24d8c37a4 100644
--- a/dbms/src/DataStreams/GraphiteRollupSortedBlockInputStream.cpp
+++ b/dbms/src/DataStreams/GraphiteRollupSortedBlockInputStream.cpp
@@ -49,54 +49,53 @@ Graphite::RollupRule GraphiteRollupSortedBlockInputStream::selectPatternForPath(
     const Graphite::Pattern * first_match = &undef_pattern;
 
     for (const auto & pattern : params.patterns)
-        if (!pattern.regexp || pattern.regexp->match(path.data, path.size))
+    {
+        if (!pattern.regexp)
         {
-            if (!pattern.regexp)
+            /// Default pattern
+            if (first_match->type == first_match->TypeUndef && pattern.type == pattern.TypeAll)
             {
-                /// Default pattern
-                if (first_match->type == first_match->TypeUndef && pattern.type == pattern.TypeAll)
-                {
-                    /// There is only default pattern for both retention and aggregation
-                    return std::pair(&pattern, &pattern);
-                }
-                if (pattern.type != first_match->type)
-                {
-                    if (first_match->type == first_match->TypeRetention)
-                    {
-                        return std::pair(first_match, &pattern);
-                    }
-                    if (first_match->type == first_match->TypeAggregation)
-                    {
-                        return std::pair(&pattern, first_match);
-                    }
-                }
+                /// There is only default pattern for both retention and aggregation
+                return std::pair(&pattern, &pattern);
             }
-            else
+            if (pattern.type != first_match->type)
             {
-                /// General pattern with matched path
-                if (pattern.type == pattern.TypeAll)
+                if (first_match->type == first_match->TypeRetention)
                 {
-                   /// Only for not default patterns with both function and retention parameters
-                   return std::pair(&pattern, &pattern);
+                    return std::pair(first_match, &pattern);
                 }
-                if (first_match->type == first_match->TypeUndef)
+                if (first_match->type == first_match->TypeAggregation)
                 {
-                    first_match = &pattern;
-                    continue;
-                }
-                if (pattern.type != first_match->type)
-                {
-                    if (first_match->type == first_match->TypeRetention)
-                    {
-                        return std::pair(first_match, &pattern);
-                    }
-                    if (first_match->type == first_match->TypeAggregation)
-                    {
-                        return std::pair(&pattern, first_match);
-                    }
+                    return std::pair(&pattern, first_match);
                 }
             }
         }
+        else if (pattern.regexp->match(path.data, path.size))
+        {
+            /// General pattern with matched path
+            if (pattern.type == pattern.TypeAll)
+            {
+               /// Only for not default patterns with both function and retention parameters
+               return std::pair(&pattern, &pattern);
+            }
+            if (first_match->type == first_match->TypeUndef)
+            {
+                first_match = &pattern;
+                continue;
+            }
+            if (pattern.type != first_match->type)
+            {
+                if (first_match->type == first_match->TypeRetention)
+                {
+                    return std::pair(first_match, &pattern);
+                }
+                if (first_match->type == first_match->TypeAggregation)
+                {
+                    return std::pair(&pattern, first_match);
+                }
+            }
+        }
+    }
 
     return {nullptr, nullptr};
 }

From 01f7efe61534388f9d6cf693a11c2b2136176531 Mon Sep 17 00:00:00 2001
From: Alexey Milovidov <milovidov@yandex-team.ru>
Date: Wed, 6 Mar 2019 03:44:25 +0300
Subject: [PATCH 45/63] Added support for clang-9

---
 dbms/CMakeLists.txt | 10 +++++++++-
 1 file changed, 9 insertions(+), 1 deletion(-)

diff --git a/dbms/CMakeLists.txt b/dbms/CMakeLists.txt
index 76d4ebd7dbf..8de06ff6ac0 100644
--- a/dbms/CMakeLists.txt
+++ b/dbms/CMakeLists.txt
@@ -59,6 +59,14 @@ if (CMAKE_CXX_COMPILER_ID STREQUAL "Clang")
     if (NOT CMAKE_CXX_COMPILER_VERSION VERSION_LESS 8)
         set (CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -Wextra-semi-stmt -Wshadow-field -Wstring-plus-int")
     endif ()
+
+    if (NOT CMAKE_CXX_COMPILER_VERSION VERSION_LESS 9)
+        set (CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -Wextra-semi-stmt -Wshadow-field -Wstring-plus-int")
+
+        if (WEVERYTHING)
+            set (CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -Wno-ctad-maybe-unsupported")
+        endif ()
+    endif ()
 endif ()
 
 if (USE_DEBUG_HELPERS)
@@ -200,7 +208,7 @@ target_link_libraries (clickhouse_common_io
         PRIVATE
     ${CMAKE_DL_LIBS}
         PUBLIC
-    roaring	
+    roaring
 )
 
 

From 98fe1a6e8bbd0a781d3cb90198cd545ef4f261ae Mon Sep 17 00:00:00 2001
From: alexey-milovidov <milovidov@yandex-team.ru>
Date: Wed, 6 Mar 2019 04:01:53 +0300
Subject: [PATCH 46/63] Update CMakeLists.txt

---
 dbms/CMakeLists.txt | 2 --
 1 file changed, 2 deletions(-)

diff --git a/dbms/CMakeLists.txt b/dbms/CMakeLists.txt
index 8de06ff6ac0..900b1e0a650 100644
--- a/dbms/CMakeLists.txt
+++ b/dbms/CMakeLists.txt
@@ -61,8 +61,6 @@ if (CMAKE_CXX_COMPILER_ID STREQUAL "Clang")
     endif ()
 
     if (NOT CMAKE_CXX_COMPILER_VERSION VERSION_LESS 9)
-        set (CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -Wextra-semi-stmt -Wshadow-field -Wstring-plus-int")
-
         if (WEVERYTHING)
             set (CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -Wno-ctad-maybe-unsupported")
         endif ()

From bc30ed92d445a49272b22821cf36d54b3b452f68 Mon Sep 17 00:00:00 2001
From: Alexey Zatelepin <ztlpn@yandex-team.ru>
Date: Wed, 6 Mar 2019 15:25:59 +0300
Subject: [PATCH 47/63] fix order of destruction of table locks and child
 streams

Incorrect order could lead to a very rare `mutex lock failed: Invalid argument`
error when a MergeTree table was dropped and its parts were deleted before the destruction
of streams that were reading from those parts.
---
 dbms/src/DataStreams/IBlockInputStream.h | 6 ++++--
 1 file changed, 4 insertions(+), 2 deletions(-)

diff --git a/dbms/src/DataStreams/IBlockInputStream.h b/dbms/src/DataStreams/IBlockInputStream.h
index 05b5e059454..759f3df3e51 100644
--- a/dbms/src/DataStreams/IBlockInputStream.h
+++ b/dbms/src/DataStreams/IBlockInputStream.h
@@ -242,6 +242,10 @@ public:
     void enableExtremes() { enabled_extremes = true; }
 
 protected:
+    /// Order is important: `table_locks` must be destroyed after `children` so that tables from
+    /// which child streams read are protected by the locks during the lifetime of the child streams.
+    TableStructureReadLocks table_locks;
+
     BlockInputStreams children;
     std::shared_mutex children_mutex;
 
@@ -268,8 +272,6 @@ protected:
     }
 
 private:
-    TableStructureReadLocks table_locks;
-
     bool enabled_extremes = false;
 
     /// The limit on the number of rows/bytes has been exceeded, and you need to stop execution on the next `read` call, as if the thread has run out.

From aff14bc899bdf9788b4748481595c6518595df46 Mon Sep 17 00:00:00 2001
From: Alexey Zatelepin <ztlpn@yandex-team.ru>
Date: Wed, 6 Mar 2019 16:48:59 +0300
Subject: [PATCH 48/63] clarify comment

---
 dbms/src/DataStreams/IBlockInputStream.h | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/dbms/src/DataStreams/IBlockInputStream.h b/dbms/src/DataStreams/IBlockInputStream.h
index 759f3df3e51..8a2b1e9b148 100644
--- a/dbms/src/DataStreams/IBlockInputStream.h
+++ b/dbms/src/DataStreams/IBlockInputStream.h
@@ -116,7 +116,7 @@ public:
       */
     size_t checkDepth(size_t max_depth) const { return checkDepthImpl(max_depth, max_depth); }
 
-    /// Do not allow to change the table while the blocks stream is alive.
+    /// Do not allow to change the table while the blocks stream and its children are alive.
     void addTableLock(const TableStructureReadLockPtr & lock) { table_locks.push_back(lock); }
 
     /// Get information about execution speed.

From 142258f76fef7474ed93f8c620324a44db9121df Mon Sep 17 00:00:00 2001
From: proller <proller@github.com>
Date: Wed, 6 Mar 2019 19:00:07 +0300
Subject: [PATCH 49/63] Remove debian epoch from changelog

---
 debian/changelog.in | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/debian/changelog.in b/debian/changelog.in
index 4a74214c022..ce2ee757999 100644
--- a/debian/changelog.in
+++ b/debian/changelog.in
@@ -1,4 +1,4 @@
-clickhouse (2:@VERSION_STRING@) unstable; urgency=low
+clickhouse (@VERSION_STRING@) unstable; urgency=low
 
   * Modified source code
 

From 7d0be1e1f6e424cdbfc259cad03d0814b115f0d2 Mon Sep 17 00:00:00 2001
From: Vasily Vasilkov <vasily.vasilkov@gmail.com>
Date: Wed, 6 Mar 2019 20:32:19 +0400
Subject: [PATCH 50/63] Add one more Java/Kotlin library for ClickHouse

---
 docs/en/interfaces/third-party/client_libraries.md | 1 +
 1 file changed, 1 insertion(+)

diff --git a/docs/en/interfaces/third-party/client_libraries.md b/docs/en/interfaces/third-party/client_libraries.md
index 5878d6e0200..a5b9991a418 100644
--- a/docs/en/interfaces/third-party/client_libraries.md
+++ b/docs/en/interfaces/third-party/client_libraries.md
@@ -32,6 +32,7 @@
     - [RClickhouse](https://github.com/IMSMWU/RClickhouse)
 - Java
     - [clickhouse-client-java](https://github.com/VirtusAI/clickhouse-client-java)
+    - [clickhouse-client](https://github.com/Ecwid/clickhouse-client)    
 - Scala
     - [clickhouse-scala-client](https://github.com/crobox/clickhouse-scala-client)
 - Kotlin

From 89917ced9e43d4cd3b253e079e22c97bf39f784d Mon Sep 17 00:00:00 2001
From: Alexey Milovidov <milovidov@yandex-team.ru>
Date: Wed, 6 Mar 2019 19:46:05 +0300
Subject: [PATCH 51/63] Fixed undefined behaviour in ThreadPool #4572

---
 dbms/src/Common/ThreadPool.h | 51 +++++++++++++++++++++++++++---------
 1 file changed, 38 insertions(+), 13 deletions(-)

diff --git a/dbms/src/Common/ThreadPool.h b/dbms/src/Common/ThreadPool.h
index d828de3fea2..35c3395cc64 100644
--- a/dbms/src/Common/ThreadPool.h
+++ b/dbms/src/Common/ThreadPool.h
@@ -133,18 +133,17 @@ public:
 
     template <typename Function, typename... Args>
     explicit ThreadFromGlobalPool(Function && func, Args &&... args)
+        : state(std::make_shared<SharedState>(true))
     {
-        mutex = std::make_shared<std::mutex>();
-
-        /// The function object must be copyable, so we wrap lock_guard in shared_ptr.
+        /// NOTE: If this will throw an exception, the descructor won't be called.
         GlobalThreadPool::instance().scheduleOrThrow([
-            mutex = mutex,
-            lock = std::make_shared<std::lock_guard<std::mutex>>(*mutex),
+            state = state,
             func = std::forward<Function>(func),
             args = std::make_tuple(std::forward<Args>(args)...)]
         {
             DB::ThreadStatus thread_status;
             std::apply(func, args);
+            state->finish();
         });
     }
 
@@ -157,7 +156,7 @@ public:
     {
         if (joinable())
             std::terminate();
-        mutex = std::move(rhs.mutex);
+        state = std::move(rhs.state);
         return *this;
     }
 
@@ -171,26 +170,52 @@ public:
     {
         if (!joinable())
             std::terminate();
-        {
-            std::lock_guard lock(*mutex);
-        }
-        mutex.reset();
+
+        state->wait();
+        state.reset();
     }
 
     void detach()
     {
         if (!joinable())
             std::terminate();
-        mutex.reset();
+        state.reset();
     }
 
     bool joinable() const
     {
-        return static_cast<bool>(mutex);
+        return state != nullptr;
     }
 
 private:
-    std::shared_ptr<std::mutex> mutex;  /// Object must be moveable.
+    /// The state used in this object and inside the thread job.
+    class SharedState
+    {
+    private:
+        bool active;
+        std::mutex mutex;
+        std::condition_variable done_event;
+
+    public:
+        SharedState(bool active) : active(active) {}
+
+        void finish()
+        {
+            {
+                std::lock_guard lock(mutex);
+                active = false;
+            }
+            done_event.notify_one();
+        }
+
+        void wait()
+        {
+            std::unique_lock lock(mutex);
+            done_event.wait(lock, [this]{ return !active; });
+        }
+    };
+
+    std::shared_ptr<SharedState> state;
 };
 
 

From 9a56294fdf56f3a52fa1427204da7481ba79ef0f Mon Sep 17 00:00:00 2001
From: Maxim Akhmedov <max42@yandex-team.ru>
Date: Wed, 6 Mar 2019 19:41:35 +0300
Subject: [PATCH 52/63] CHYT-67: introduce host context for using CH as a
 library.

---
 dbms/programs/server/HTTPHandler.cpp |  2 ++
 dbms/programs/server/HTTPHandler.h   |  3 +++
 dbms/programs/server/TCPHandler.cpp  | 10 ++++++++--
 dbms/programs/server/TCPHandler.h    |  3 +++
 dbms/programs/server/config.xml      |  4 ++--
 dbms/src/Interpreters/Context.cpp    | 13 +++++++++++++
 dbms/src/Interpreters/Context.h      | 18 ++++++++++++++++++
 7 files changed, 49 insertions(+), 4 deletions(-)

diff --git a/dbms/programs/server/HTTPHandler.cpp b/dbms/programs/server/HTTPHandler.cpp
index 6e94d59be07..763a30c1928 100644
--- a/dbms/programs/server/HTTPHandler.cpp
+++ b/dbms/programs/server/HTTPHandler.cpp
@@ -602,6 +602,8 @@ void HTTPHandler::processQuery(
         });
     }
 
+    customizeContext(context);
+
     executeQuery(*in, *used_output.out_maybe_delayed_and_compressed, /* allow_into_outfile = */ false, context,
         [&response] (const String & content_type) { response.setContentType(content_type); },
         [&response] (const String & current_query_id) { response.add("Query-Id", current_query_id); });
diff --git a/dbms/programs/server/HTTPHandler.h b/dbms/programs/server/HTTPHandler.h
index 58cb6bb67f1..fb6c9fb532c 100644
--- a/dbms/programs/server/HTTPHandler.h
+++ b/dbms/programs/server/HTTPHandler.h
@@ -28,6 +28,9 @@ public:
 
     void handleRequest(Poco::Net::HTTPServerRequest & request, Poco::Net::HTTPServerResponse & response) override;
 
+    /// This method is called right before the query execution.
+    virtual void customizeContext(DB::Context& /* context */) {}
+
 private:
     struct Output
     {
diff --git a/dbms/programs/server/TCPHandler.cpp b/dbms/programs/server/TCPHandler.cpp
index 013f047ae67..1935ea87025 100644
--- a/dbms/programs/server/TCPHandler.cpp
+++ b/dbms/programs/server/TCPHandler.cpp
@@ -120,10 +120,11 @@ void TCPHandler::runImpl()
 
     connection_context.setProgressCallback([this] (const Progress & value) { return this->updateProgress(value); });
 
+    /// Restore context of request.
+    query_context = connection_context;
+
     while (1)
     {
-        /// Restore context of request.
-        query_context = connection_context;
 
         /// We are waiting for a packet from the client. Thus, every `POLL_INTERVAL` seconds check whether we need to shut down.
         while (!static_cast<ReadBufferFromPocoSocket &>(*in).poll(global_settings.poll_interval * 1000000) && !server.isCancelled())
@@ -185,6 +186,8 @@ void TCPHandler::runImpl()
                 state.maybe_compressed_in.reset(); /// For more accurate accounting by MemoryTracker.
             });
 
+            customizeContext(query_context);
+
             bool may_have_embedded_data = client_revision >= DBMS_MIN_REVISION_WITH_CLIENT_SUPPORT_EMBEDDED_DATA;
             /// Processing Query
             state.io = executeQuery(state.query, query_context, false, state.stage, may_have_embedded_data);
@@ -207,6 +210,9 @@ void TCPHandler::runImpl()
             sendLogs();
             sendEndOfStream();
 
+            /// Restore context of request.
+            query_context = connection_context;
+
             query_scope.reset();
             state.reset();
         }
diff --git a/dbms/programs/server/TCPHandler.h b/dbms/programs/server/TCPHandler.h
index 19641e88d25..bd375dc5296 100644
--- a/dbms/programs/server/TCPHandler.h
+++ b/dbms/programs/server/TCPHandler.h
@@ -95,6 +95,9 @@ public:
 
     void run();
 
+    /// This method is called right before the query execution.
+    virtual void customizeContext(DB::Context & /*context*/) {}
+
 private:
     IServer & server;
     Poco::Logger * log;
diff --git a/dbms/programs/server/config.xml b/dbms/programs/server/config.xml
index 154ebf6c35e..7a53e7185a0 100644
--- a/dbms/programs/server/config.xml
+++ b/dbms/programs/server/config.xml
@@ -318,10 +318,10 @@
     -->
 
     <!-- Path to file with region hierarchy. -->
-    <!-- <path_to_regions_hierarchy_file>/opt/geo/regions_hierarchy.txt</path_to_regions_hierarchy_file> -->
+    <path_to_regions_hierarchy_file>../../../../geo/regions_hierarchy.txt</path_to_regions_hierarchy_file>
 
     <!-- Path to directory with files containing names of regions -->
-    <!-- <path_to_regions_names_files>/opt/geo/</path_to_regions_names_files> -->
+    <path_to_regions_names_files>../../../../geo/</path_to_regions_names_files>
 
 
     <!-- Configuration of external dictionaries. See:
diff --git a/dbms/src/Interpreters/Context.cpp b/dbms/src/Interpreters/Context.cpp
index 8c2e2b8178c..b7613116f2d 100644
--- a/dbms/src/Interpreters/Context.cpp
+++ b/dbms/src/Interpreters/Context.cpp
@@ -1818,6 +1818,19 @@ void Context::addXDBCBridgeCommand(std::unique_ptr<ShellCommand> cmd)
     shared->bridge_commands.emplace_back(std::move(cmd));
 }
 
+
+IHostContextPtr & Context::getHostContext()
+{
+    return host_context;
+}
+
+
+const IHostContextPtr & Context::getHostContext() const
+{
+    return host_context;
+}
+
+
 std::shared_ptr<ActionLocksManager> Context::getActionLocksManager()
 {
     auto lock = getLock();
diff --git a/dbms/src/Interpreters/Context.h b/dbms/src/Interpreters/Context.h
index df1e23d885b..8b4e66094ff 100644
--- a/dbms/src/Interpreters/Context.h
+++ b/dbms/src/Interpreters/Context.h
@@ -99,6 +99,15 @@ using TableAndCreateASTs = std::map<String, TableAndCreateAST>;
 /// Callback for external tables initializer
 using ExternalTablesInitializer = std::function<void(Context &)>;
 
+/// An empty interface for an arbitrary object that may be attached by a shared pointer
+/// to query context, when using ClickHouse as a library.
+struct IHostContext
+{
+    virtual ~IHostContext() = default;
+};
+
+using IHostContextPtr = std::shared_ptr<IHostContext>;
+
 /** A set of known objects that can be used in the query.
   * Consists of a shared part (always common to all sessions and queries)
   *  and copied part (which can be its own for each session or query).
@@ -139,6 +148,12 @@ private:
     using DatabasePtr = std::shared_ptr<IDatabase>;
     using Databases = std::map<String, std::shared_ptr<IDatabase>>;
 
+    IHostContextPtr host_context;  /// Arbitrary object that may used to attach some host specific information to query context,
+                                   /// when using ClickHouse as a library in some project. For example, it may contain host
+                                   /// logger, some query identification information, profiling guards, etc. This field is
+                                   /// to be customized in HTTP and TCP servers by overloading the customizeContext(DB::Context&)
+                                   /// methods.
+
     /// Use copy constructor or createGlobal() instead
     Context();
 
@@ -452,6 +467,9 @@ public:
     /// Add started bridge command. It will be killed after context destruction
     void addXDBCBridgeCommand(std::unique_ptr<ShellCommand> cmd);
 
+    IHostContextPtr & getHostContext();
+    const IHostContextPtr & getHostContext() const;
+
 private:
     /** Check if the current client has access to the specified database.
       * If access is denied, throw an exception.

From a233b93b6a193cc1c55ceec702d809a9aeb2bb0c Mon Sep 17 00:00:00 2001
From: alesapin <alesapin@gmail.com>
Date: Wed, 6 Mar 2019 20:10:26 +0300
Subject: [PATCH 53/63] Fix kill_not_initialized_query again

---
 ...00909_kill_not_initialized_query.reference |  1 +
 .../00909_kill_not_initialized_query.sh       | 25 ++++++++++++++++---
 2 files changed, 22 insertions(+), 4 deletions(-)

diff --git a/dbms/tests/queries/0_stateless/00909_kill_not_initialized_query.reference b/dbms/tests/queries/0_stateless/00909_kill_not_initialized_query.reference
index 573541ac970..aa47d0d46d4 100644
--- a/dbms/tests/queries/0_stateless/00909_kill_not_initialized_query.reference
+++ b/dbms/tests/queries/0_stateless/00909_kill_not_initialized_query.reference
@@ -1 +1,2 @@
 0
+0
diff --git a/dbms/tests/queries/0_stateless/00909_kill_not_initialized_query.sh b/dbms/tests/queries/0_stateless/00909_kill_not_initialized_query.sh
index 443b2463a33..76d6424e690 100755
--- a/dbms/tests/queries/0_stateless/00909_kill_not_initialized_query.sh
+++ b/dbms/tests/queries/0_stateless/00909_kill_not_initialized_query.sh
@@ -10,20 +10,37 @@ $CLICKHOUSE_CLIENT -q "DROP TABLE IF EXISTS test.cannot_kill_query"
 $CLICKHOUSE_CLIENT -q "CREATE TABLE test.cannot_kill_query (x UInt64) ENGINE = MergeTree ORDER BY x" &> /dev/null
 $CLICKHOUSE_CLIENT -q "INSERT INTO test.cannot_kill_query SELECT * FROM numbers(10000000)" &> /dev/null
 
+# This SELECT query will run for a long time. It's used as bloker for ALTER query. It will be killed with SYNC kill.
 query_for_pending="SELECT count() FROM test.cannot_kill_query WHERE NOT ignore(sleep(1)) SETTINGS max_threads=1, max_block_size=1"
 $CLICKHOUSE_CLIENT -q "$query_for_pending" &>/dev/null &
 
+sleep 1 # queries should be in strict order
+
+# This ALTER query will wait until $query_for_pending finished. Also it will block $query_to_kill.
 $CLICKHOUSE_CLIENT -q "ALTER TABLE test.cannot_kill_query MODIFY COLUMN x UInt64" &>/dev/null &
 
+sleep 1
+
+# This SELECT query will also run for a long time. Also it's blocked by ALTER query. It will be killed with ASYNC kill.
+# This is main idea which we check -- blocked queries can be killed with ASYNC kill.
 query_to_kill="SELECT sum(1) FROM test.cannot_kill_query WHERE NOT ignore(sleep(1)) SETTINGS max_threads=1"
 $CLICKHOUSE_CLIENT -q "$query_to_kill" &>/dev/null &
 
-sleep 3 # just to be sure that 'KILL ...' will be executed after 'SELECT ... WHERE NOT ignore(sleep(1))'
+sleep 1 # just to be sure that kill of $query_to_kill will be executed after $query_to_kill.
 
-timeout 15 $CLICKHOUSE_CLIENT -q "KILL QUERY WHERE query='$query_to_kill' SYNC" &>/dev/null
+# Kill $query_to_kill with ASYNC kill. We will check that information about KILL is not lost.
+$CLICKHOUSE_CLIENT -q "KILL QUERY WHERE query='$query_to_kill' ASYNC" &>/dev/null
 
+sleep 1
+
+# Kill $query_for_pending SYNC. This query is not blocker, so it should be killed fast.
+timeout 5 $CLICKHOUSE_CLIENT -q "KILL QUERY WHERE query='$query_for_pending' SYNC" &>/dev/null
+
+# But let's sleep a little time, just to be sure
+sleep 3
+
+# Both queries have to be killed, doesn't matter with SYNC or ASYNC kill
+$CLICKHOUSE_CLIENT -q "SELECT count() FROM system.processes where query='$query_for_pending'"
 $CLICKHOUSE_CLIENT -q "SELECT count() FROM system.processes where query='$query_to_kill'"
 
-$CLICKHOUSE_CLIENT -q "KILL QUERY WHERE query='$query_for_pending'" &>/dev/null & # kill pending query
-
 $CLICKHOUSE_CLIENT -q "DROP TABLE IF EXISTS test.cannot_kill_query" &>/dev/null

From 9159d602f5a137ec180791170dc26ecbb160baab Mon Sep 17 00:00:00 2001
From: proller <proller@github.com>
Date: Wed, 6 Mar 2019 20:19:26 +0300
Subject: [PATCH 54/63] Fix bug in arrayEnumerateRanked

---
 dbms/src/Functions/arrayEnumerateRanked.cpp                 | 6 +++---
 dbms/tests/queries/0_stateless/00909_arrayEnumerateUniq.sql | 4 ++++
 2 files changed, 7 insertions(+), 3 deletions(-)

diff --git a/dbms/src/Functions/arrayEnumerateRanked.cpp b/dbms/src/Functions/arrayEnumerateRanked.cpp
index ff95344dd57..a85beac4feb 100644
--- a/dbms/src/Functions/arrayEnumerateRanked.cpp
+++ b/dbms/src/Functions/arrayEnumerateRanked.cpp
@@ -51,11 +51,11 @@ ArraysDepths getArraysDepths(const ColumnsWithTypeAndName & arguments)
 
             if (depth_column && depth_column->isColumnConst())
             {
-                auto value = depth_column->getUInt(0);
-                if (!value)
+                auto value = depth_column->getInt(0);
+                if (value <= 0)
                     throw Exception(
                         "Arguments for function arrayEnumerateUniqRanked/arrayEnumerateDenseRanked incorrect: depth ("
-                            + std::to_string(value) + ") cant be 0.",
+                            + std::to_string(value) + ") cant be less or equal 0.",
                         ErrorCodes::BAD_ARGUMENTS);
 
                 if (i == 0)
diff --git a/dbms/tests/queries/0_stateless/00909_arrayEnumerateUniq.sql b/dbms/tests/queries/0_stateless/00909_arrayEnumerateUniq.sql
index 0682da084c1..97201d1a929 100644
--- a/dbms/tests/queries/0_stateless/00909_arrayEnumerateUniq.sql
+++ b/dbms/tests/queries/0_stateless/00909_arrayEnumerateUniq.sql
@@ -172,3 +172,7 @@ SELECT arrayEnumerateUniqRanked([1,2], 1, 3, [4], 5); -- { serverError 36 }
 SELECT arrayEnumerateDenseRanked([[[[[[[[[[42]]]]]]]]]]);
 SELECT arrayEnumerateUniqRanked('wat', [1,2]); -- { serverError 48 }
 SELECT arrayEnumerateUniqRanked(1, [1,2], 'boom'); -- { serverError 48 }
+SELECT arrayEnumerateDenseRanked(['\0'], -8363126); -- { serverError 36 }
+SELECT arrayEnumerateDenseRanked(-10, ['\0'], -8363126); -- { serverError 36 }
+SELECT arrayEnumerateDenseRanked(1, ['\0'], -8363126); -- { serverError 36 }
+SELECT arrayEnumerateDenseRanked(-101, ['\0']); -- { serverError 36 }

From 41469cc874b8a03bdad13cd00822b656f840bb49 Mon Sep 17 00:00:00 2001
From: Alexey Milovidov <milovidov@yandex-team.ru>
Date: Wed, 6 Mar 2019 20:54:20 +0300
Subject: [PATCH 55/63] More simple #4572

---
 dbms/src/Common/ThreadPool.h | 33 ++++-----------------------------
 1 file changed, 4 insertions(+), 29 deletions(-)

diff --git a/dbms/src/Common/ThreadPool.h b/dbms/src/Common/ThreadPool.h
index 35c3395cc64..1cda735cc6f 100644
--- a/dbms/src/Common/ThreadPool.h
+++ b/dbms/src/Common/ThreadPool.h
@@ -10,6 +10,7 @@
 #include <optional>
 #include <ext/singleton.h>
 
+#include <Poco/Event.h>
 #include <Common/ThreadStatus.h>
 
 
@@ -133,7 +134,7 @@ public:
 
     template <typename Function, typename... Args>
     explicit ThreadFromGlobalPool(Function && func, Args &&... args)
-        : state(std::make_shared<SharedState>(true))
+        : state(std::make_shared<Poco::Event>())
     {
         /// NOTE: If this will throw an exception, the descructor won't be called.
         GlobalThreadPool::instance().scheduleOrThrow([
@@ -143,7 +144,7 @@ public:
         {
             DB::ThreadStatus thread_status;
             std::apply(func, args);
-            state->finish();
+            state->set();
         });
     }
 
@@ -189,33 +190,7 @@ public:
 
 private:
     /// The state used in this object and inside the thread job.
-    class SharedState
-    {
-    private:
-        bool active;
-        std::mutex mutex;
-        std::condition_variable done_event;
-
-    public:
-        SharedState(bool active) : active(active) {}
-
-        void finish()
-        {
-            {
-                std::lock_guard lock(mutex);
-                active = false;
-            }
-            done_event.notify_one();
-        }
-
-        void wait()
-        {
-            std::unique_lock lock(mutex);
-            done_event.wait(lock, [this]{ return !active; });
-        }
-    };
-
-    std::shared_ptr<SharedState> state;
+    std::shared_ptr<Poco::Event> state;
 };
 
 

From 47df38f7a05c184a8e5b870ff05ec481d2a5ffc8 Mon Sep 17 00:00:00 2001
From: Alexey Milovidov <milovidov@yandex-team.ru>
Date: Wed, 6 Mar 2019 21:09:25 +0300
Subject: [PATCH 56/63] Adapted test for TSan #4572

---
 dbms/src/Common/tests/thread_pool_3.cpp | 5 +++--
 1 file changed, 3 insertions(+), 2 deletions(-)

diff --git a/dbms/src/Common/tests/thread_pool_3.cpp b/dbms/src/Common/tests/thread_pool_3.cpp
index 687c344288d..924895de308 100644
--- a/dbms/src/Common/tests/thread_pool_3.cpp
+++ b/dbms/src/Common/tests/thread_pool_3.cpp
@@ -1,4 +1,4 @@
-#include <atomic>
+#include <mutex>
 #include <iostream>
 #include <Common/ThreadPool.h>
 
@@ -10,8 +10,9 @@ void test()
 {
     Pool pool(10, 2, 10);
 
+    std::mutex mutex;
     for (size_t i = 0; i < 10; ++i)
-        pool.schedule([]{ std::cerr << '.'; });
+        pool.schedule([&]{ std::lock_guard lock(mutex); std::cerr << '.'; });
     pool.wait();
 }
 

From 482d153dcd7a986dbf0b82498bb84a814471c90a Mon Sep 17 00:00:00 2001
From: proller <proller@users.noreply.github.com>
Date: Wed, 6 Mar 2019 21:37:16 +0300
Subject: [PATCH 57/63] clickhouse-odbc #157 : Remove LowCardinality from type
 (#4381)

* clickhouse-odbc #157 : Remove LowCardinality from type

* Update ODBCDriver2BlockOutputStream.cpp

* fix
---
 dbms/src/Formats/ODBCDriver2BlockOutputStream.cpp | 7 +++++--
 1 file changed, 5 insertions(+), 2 deletions(-)

diff --git a/dbms/src/Formats/ODBCDriver2BlockOutputStream.cpp b/dbms/src/Formats/ODBCDriver2BlockOutputStream.cpp
index 64d2216dd0e..8e9dbfdd5c2 100644
--- a/dbms/src/Formats/ODBCDriver2BlockOutputStream.cpp
+++ b/dbms/src/Formats/ODBCDriver2BlockOutputStream.cpp
@@ -3,6 +3,7 @@
 #include <Formats/ODBCDriver2BlockOutputStream.h>
 #include <IO/WriteBuffer.h>
 #include <IO/WriteHelpers.h>
+#include <DataTypes/DataTypeLowCardinality.h>
 
 namespace DB
 {
@@ -82,8 +83,10 @@ void ODBCDriver2BlockOutputStream::writePrefix()
     writeODBCString(out, "type");
     for (size_t i = 0; i < columns; ++i)
     {
-        const ColumnWithTypeAndName & col = header.getByPosition(i);
-        writeODBCString(out, col.type->getName());
+        auto type = header.getByPosition(i).type;
+        if (type->lowCardinality())
+            type = recursiveRemoveLowCardinality(type);
+        writeODBCString(out, type->getName());
     }
 }
 

From 61e82da684b453a1035bb1bbb6486ad367b44935 Mon Sep 17 00:00:00 2001
From: alexey-milovidov <milovidov@yandex-team.ru>
Date: Wed, 6 Mar 2019 21:38:26 +0300
Subject: [PATCH 58/63] Update TCPHandler.cpp

---
 dbms/programs/server/TCPHandler.cpp | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/dbms/programs/server/TCPHandler.cpp b/dbms/programs/server/TCPHandler.cpp
index 1935ea87025..3693f949358 100644
--- a/dbms/programs/server/TCPHandler.cpp
+++ b/dbms/programs/server/TCPHandler.cpp
@@ -120,7 +120,7 @@ void TCPHandler::runImpl()
 
     connection_context.setProgressCallback([this] (const Progress & value) { return this->updateProgress(value); });
 
-    /// Restore context of request.
+    /// Set context of request.
     query_context = connection_context;
 
     while (1)

From ee15cb237cfd10be9a38c377c1b34a87cea28b2f Mon Sep 17 00:00:00 2001
From: proller <proller@github.com>
Date: Wed, 6 Mar 2019 22:19:21 +0300
Subject: [PATCH 59/63] Better fix

---
 dbms/src/Functions/arrayEnumerateRanked.cpp          |  7 ++++++-
 .../0_stateless/00909_arrayEnumerateUniq.reference   |  2 ++
 .../queries/0_stateless/00909_arrayEnumerateUniq.sql | 12 ++++++++----
 3 files changed, 16 insertions(+), 5 deletions(-)

diff --git a/dbms/src/Functions/arrayEnumerateRanked.cpp b/dbms/src/Functions/arrayEnumerateRanked.cpp
index a85beac4feb..a1a28616437 100644
--- a/dbms/src/Functions/arrayEnumerateRanked.cpp
+++ b/dbms/src/Functions/arrayEnumerateRanked.cpp
@@ -71,17 +71,22 @@ ArraysDepths getArraysDepths(const ColumnsWithTypeAndName & arguments)
                                 + std::to_string(value) + ") for missing array.",
                             ErrorCodes::BAD_ARGUMENTS);
                     }
+                    if (value > last_array_depth)
+                        throw Exception(
+                            "Arguments for function arrayEnumerateUniqRanked/arrayEnumerateDenseRanked incorrect: depth="
+                                + std::to_string(value) + " for array with depth=" + std::to_string(last_array_depth) + ".",
+                            ErrorCodes::BAD_ARGUMENTS);
                     depths.emplace_back(value);
                 }
             }
         }
     }
+
     if (depths.size() < array_num)
     {
         depths.emplace_back(last_array_depth);
     }
 
-
     for (auto & depth : depths)
     {
         if (max_array_depth < depth)
diff --git a/dbms/tests/queries/0_stateless/00909_arrayEnumerateUniq.reference b/dbms/tests/queries/0_stateless/00909_arrayEnumerateUniq.reference
index 1bfd81d796d..38b6b827a05 100644
--- a/dbms/tests/queries/0_stateless/00909_arrayEnumerateUniq.reference
+++ b/dbms/tests/queries/0_stateless/00909_arrayEnumerateUniq.reference
@@ -178,3 +178,5 @@ arrayEnumerateUniq(a1, a2) =
 [1,2]
 [1,1]
 [[[[[[[[[[1]]]]]]]]]]
+[1,2,1,3]
+[1,2,1,3]
diff --git a/dbms/tests/queries/0_stateless/00909_arrayEnumerateUniq.sql b/dbms/tests/queries/0_stateless/00909_arrayEnumerateUniq.sql
index 97201d1a929..077cd5c6631 100644
--- a/dbms/tests/queries/0_stateless/00909_arrayEnumerateUniq.sql
+++ b/dbms/tests/queries/0_stateless/00909_arrayEnumerateUniq.sql
@@ -145,11 +145,11 @@ SELECT arrayEnumerateUniqRanked(); -- { serverError 42 }
 SELECT arrayEnumerateUniqRanked([]);
 SELECT arrayEnumerateUniqRanked(1); -- { serverError 36 }
 SELECT arrayEnumerateUniqRanked(2,[]); -- { serverError 36 }
-SELECT arrayEnumerateUniqRanked(2,[],2); -- { serverError 190 }
+SELECT arrayEnumerateUniqRanked(2,[],2); -- { serverError 36 }
 SELECT arrayEnumerateUniqRanked(2,[],[]); -- { serverError 36 }
-SELECT arrayEnumerateUniqRanked(2,[],[],3); -- { serverError 190 }
-SELECT arrayEnumerateUniqRanked([],2); -- { serverError 190 }
-SELECT arrayEnumerateUniqRanked([],2,[]); -- { serverError 190 }
+SELECT arrayEnumerateUniqRanked(2,[],[],3); -- { serverError 36 }
+SELECT arrayEnumerateUniqRanked([],2); -- { serverError 36 }
+SELECT arrayEnumerateUniqRanked([],2,[]); -- { serverError 36 }
 SELECT arrayEnumerateUniqRanked(0,[],0); -- { serverError 36 }
 SELECT arrayEnumerateUniqRanked(0,0,0); -- { serverError 36 }
 SELECT arrayEnumerateUniqRanked(1,1,1); -- { serverError 36 }
@@ -176,3 +176,7 @@ SELECT arrayEnumerateDenseRanked(['\0'], -8363126); -- { serverError 36 }
 SELECT arrayEnumerateDenseRanked(-10, ['\0'], -8363126); -- { serverError 36 }
 SELECT arrayEnumerateDenseRanked(1, ['\0'], -8363126); -- { serverError 36 }
 SELECT arrayEnumerateDenseRanked(-101, ['\0']); -- { serverError 36 }
+SELECT arrayEnumerateDenseRanked(1.1, [10,20,10,30]);
+SELECT arrayEnumerateDenseRanked([10,20,10,30], 0.4); -- { serverError 36 }
+SELECT arrayEnumerateDenseRanked([10,20,10,30], 1.8);
+SELECT arrayEnumerateUniqRanked(1, [], 1000000000); -- { serverError 36 }

From 28bc3fd7d8410c885d591280393c7e72f66b8527 Mon Sep 17 00:00:00 2001
From: Maxim Akhmedov <max42@yandex-team.ru>
Date: Wed, 6 Mar 2019 22:28:48 +0300
Subject: [PATCH 60/63] Remove accidental modification of unrelated file.

---
 dbms/programs/server/config.xml | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/dbms/programs/server/config.xml b/dbms/programs/server/config.xml
index 7a53e7185a0..154ebf6c35e 100644
--- a/dbms/programs/server/config.xml
+++ b/dbms/programs/server/config.xml
@@ -318,10 +318,10 @@
     -->
 
     <!-- Path to file with region hierarchy. -->
-    <path_to_regions_hierarchy_file>../../../../geo/regions_hierarchy.txt</path_to_regions_hierarchy_file>
+    <!-- <path_to_regions_hierarchy_file>/opt/geo/regions_hierarchy.txt</path_to_regions_hierarchy_file> -->
 
     <!-- Path to directory with files containing names of regions -->
-    <path_to_regions_names_files>../../../../geo/</path_to_regions_names_files>
+    <!-- <path_to_regions_names_files>/opt/geo/</path_to_regions_names_files> -->
 
 
     <!-- Configuration of external dictionaries. See:

From f49562bff3496bd288288c1934fa07ca1ac3c03a Mon Sep 17 00:00:00 2001
From: Alexey Milovidov <milovidov@yandex-team.ru>
Date: Wed, 6 Mar 2019 22:57:54 +0300
Subject: [PATCH 61/63] Flush query metrics before joining thread #4612

---
 dbms/src/Common/ThreadPool.h | 6 ++++--
 1 file changed, 4 insertions(+), 2 deletions(-)

diff --git a/dbms/src/Common/ThreadPool.h b/dbms/src/Common/ThreadPool.h
index 1cda735cc6f..a0dae3f810c 100644
--- a/dbms/src/Common/ThreadPool.h
+++ b/dbms/src/Common/ThreadPool.h
@@ -142,8 +142,10 @@ public:
             func = std::forward<Function>(func),
             args = std::make_tuple(std::forward<Args>(args)...)]
         {
-            DB::ThreadStatus thread_status;
-            std::apply(func, args);
+            {
+                DB::ThreadStatus thread_status;
+                std::apply(func, args);
+            }
             state->set();
         });
     }

From 55cf27da07ea5da200a4e455a5a6feadc743638f Mon Sep 17 00:00:00 2001
From: proller <proller@github.com>
Date: Wed, 6 Mar 2019 23:06:07 +0300
Subject: [PATCH 62/63] Build fix (copier)

---
 dbms/programs/copier/CMakeLists.txt | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/dbms/programs/copier/CMakeLists.txt b/dbms/programs/copier/CMakeLists.txt
index c9f8e44bce8..1be75dff22d 100644
--- a/dbms/programs/copier/CMakeLists.txt
+++ b/dbms/programs/copier/CMakeLists.txt
@@ -1,5 +1,5 @@
 set(CLICKHOUSE_COPIER_SOURCES ${CMAKE_CURRENT_SOURCE_DIR}/ClusterCopier.cpp)
-set(CLICKHOUSE_COPIER_LINK PRIVATE clickhouse_functions clickhouse_aggregate_functions daemon)
+set(CLICKHOUSE_COPIER_LINK PRIVATE clickhouse_functions clickhouse_table_functions clickhouse_aggregate_functions daemon)
 #set(CLICKHOUSE_COPIER_INCLUDE SYSTEM PRIVATE ...)
 
 clickhouse_program_add(copier)

From 15576ca809d5c85232d10a07c988faeb7c11b69b Mon Sep 17 00:00:00 2001
From: Maxim Akhmedov <max42@yandex-team.ru>
Date: Thu, 7 Mar 2019 00:32:26 +0300
Subject: [PATCH 63/63] Better lifetime of query context in TCP handler.

---
 dbms/programs/server/TCPHandler.cpp | 55 ++++++++++++++---------------
 dbms/programs/server/TCPHandler.h   |  2 +-
 2 files changed, 28 insertions(+), 29 deletions(-)

diff --git a/dbms/programs/server/TCPHandler.cpp b/dbms/programs/server/TCPHandler.cpp
index 3693f949358..e3582b9ff01 100644
--- a/dbms/programs/server/TCPHandler.cpp
+++ b/dbms/programs/server/TCPHandler.cpp
@@ -120,11 +120,10 @@ void TCPHandler::runImpl()
 
     connection_context.setProgressCallback([this] (const Progress & value) { return this->updateProgress(value); });
 
-    /// Set context of request.
-    query_context = connection_context;
-
     while (1)
     {
+        /// Reset the query context to a copy of the connection context at the start of every loop iteration.
+        query_context = connection_context;
 
         /// We are waiting for a packet from the client. Thus, every `POLL_INTERVAL` seconds check whether we need to shut down.
         while (!static_cast<ReadBufferFromPocoSocket &>(*in).poll(global_settings.poll_interval * 1000000) && !server.isCancelled())
@@ -159,22 +158,22 @@ void TCPHandler::runImpl()
             if (!receivePacket())
                 continue;
 
-            query_scope.emplace(query_context);
+            query_scope.emplace(*query_context);
 
-            send_exception_with_stack_trace = query_context.getSettingsRef().calculate_text_stack_trace;
+            send_exception_with_stack_trace = query_context->getSettingsRef().calculate_text_stack_trace;
 
             /// Should we send internal logs to client?
             if (client_revision >= DBMS_MIN_REVISION_WITH_SERVER_LOGS
-                && query_context.getSettingsRef().send_logs_level.value != LogsLevel::none)
+                && query_context->getSettingsRef().send_logs_level.value != LogsLevel::none)
             {
                 state.logs_queue = std::make_shared<InternalTextLogsQueue>();
-                state.logs_queue->max_priority = Poco::Logger::parseLevel(query_context.getSettingsRef().send_logs_level.toString());
+                state.logs_queue->max_priority = Poco::Logger::parseLevel(query_context->getSettingsRef().send_logs_level.toString());
                 CurrentThread::attachInternalTextLogsQueue(state.logs_queue);
             }
 
-            query_context.setExternalTablesInitializer([&global_settings, this] (Context & context)
+            query_context->setExternalTablesInitializer([&global_settings, this] (Context & context)
             {
-                if (&context != &query_context)
+                if (&context != &*query_context)
                     throw Exception("Unexpected context in external tables initializer", ErrorCodes::LOGICAL_ERROR);
 
                 /// Get blocks of temporary tables
@@ -186,11 +185,11 @@ void TCPHandler::runImpl()
                 state.maybe_compressed_in.reset(); /// For more accurate accounting by MemoryTracker.
             });
 
-            customizeContext(query_context);
+            customizeContext(*query_context);
 
             bool may_have_embedded_data = client_revision >= DBMS_MIN_REVISION_WITH_CLIENT_SUPPORT_EMBEDDED_DATA;
             /// Processing Query
-            state.io = executeQuery(state.query, query_context, false, state.stage, may_have_embedded_data);
+            state.io = executeQuery(state.query, *query_context, false, state.stage, may_have_embedded_data);
 
             if (state.io.out)
                 state.need_receive_data_for_insert = true;
@@ -210,9 +209,6 @@ void TCPHandler::runImpl()
             sendLogs();
             sendEndOfStream();
 
-            /// Restore context of request.
-            query_context = connection_context;
-
             query_scope.reset();
             state.reset();
         }
@@ -299,6 +295,9 @@ void TCPHandler::runImpl()
         LOG_INFO(log, std::fixed << std::setprecision(3)
             << "Processed in " << watch.elapsedSeconds() << " sec.");
 
+        /// It is important to destroy query context here. We do not want it to live arbitrarily longer than the query.
+        query_context.reset();
+
         if (network_error)
             break;
     }
@@ -307,7 +306,7 @@ void TCPHandler::runImpl()
 
 void TCPHandler::readData(const Settings & global_settings)
 {
-    const auto receive_timeout = query_context.getSettingsRef().receive_timeout.value;
+    const auto receive_timeout = query_context->getSettingsRef().receive_timeout.value;
 
     /// Poll interval should not be greater than receive_timeout
     const size_t default_poll_interval = global_settings.poll_interval.value * 1000000;
@@ -370,8 +369,8 @@ void TCPHandler::processInsertQuery(const Settings & global_settings)
     /// Send ColumnsDescription for insertion table
     if (client_revision >= DBMS_MIN_REVISION_WITH_COLUMN_DEFAULTS_METADATA)
     {
-        const auto & db_and_table = query_context.getInsertionTable();
-        if (auto * columns = ColumnsDescription::loadFromContext(query_context, db_and_table.first, db_and_table.second))
+        const auto & db_and_table = query_context->getInsertionTable();
+        if (auto * columns = ColumnsDescription::loadFromContext(*query_context, db_and_table.first, db_and_table.second))
             sendTableColumns(*columns);
     }
 
@@ -414,7 +413,7 @@ void TCPHandler::processOrdinaryQuery()
                 }
                 else
                 {
-                    if (after_send_progress.elapsed() / 1000 >= query_context.getSettingsRef().interactive_delay)
+                    if (after_send_progress.elapsed() / 1000 >= query_context->getSettingsRef().interactive_delay)
                     {
                         /// Some time passed and there is a progress.
                         after_send_progress.restart();
@@ -423,7 +422,7 @@ void TCPHandler::processOrdinaryQuery()
 
                     sendLogs();
 
-                    if (async_in.poll(query_context.getSettingsRef().interactive_delay / 1000))
+                    if (async_in.poll(query_context->getSettingsRef().interactive_delay / 1000))
                     {
                         /// There is the following result block.
                         block = async_in.read();
@@ -651,11 +650,11 @@ void TCPHandler::receiveQuery()
     state.is_empty = false;
     readStringBinary(state.query_id, *in);
 
-    query_context.setCurrentQueryId(state.query_id);
+    query_context->setCurrentQueryId(state.query_id);
 
     /// Client info
     {
-        ClientInfo & client_info = query_context.getClientInfo();
+        ClientInfo & client_info = query_context->getClientInfo();
         if (client_revision >= DBMS_MIN_REVISION_WITH_CLIENT_INFO)
             client_info.read(*in, client_revision);
 
@@ -683,7 +682,7 @@ void TCPHandler::receiveQuery()
     }
 
     /// Per query settings.
-    Settings & settings = query_context.getSettingsRef();
+    Settings & settings = query_context->getSettingsRef();
     settings.deserialize(*in);
 
     /// Sync timeouts on client and server during current query to avoid dangling queries on server
@@ -721,16 +720,16 @@ bool TCPHandler::receiveData()
         {
             StoragePtr storage;
             /// If such a table does not exist, create it.
-            if (!(storage = query_context.tryGetExternalTable(external_table_name)))
+            if (!(storage = query_context->tryGetExternalTable(external_table_name)))
             {
                 NamesAndTypesList columns = block.getNamesAndTypesList();
                 storage = StorageMemory::create(external_table_name,
                     ColumnsDescription{columns, NamesAndTypesList{}, NamesAndTypesList{}, ColumnDefaults{}, ColumnComments{}, ColumnCodecs{}});
                 storage->startup();
-                query_context.addExternalTable(external_table_name, storage);
+                query_context->addExternalTable(external_table_name, storage);
             }
             /// The data will be written directly to the table.
-            state.io.out = storage->write(ASTPtr(), query_context);
+            state.io.out = storage->write(ASTPtr(), *query_context);
         }
         if (block)
             state.io.out->write(block);
@@ -769,10 +768,10 @@ void TCPHandler::initBlockOutput(const Block & block)
     {
         if (!state.maybe_compressed_out)
         {
-            std::string method = query_context.getSettingsRef().network_compression_method;
+            std::string method = query_context->getSettingsRef().network_compression_method;
             std::optional<int> level;
             if (method == "ZSTD")
-                level = query_context.getSettingsRef().network_zstd_compression_level;
+                level = query_context->getSettingsRef().network_zstd_compression_level;
 
             if (state.compression == Protocol::Compression::Enable)
                 state.maybe_compressed_out = std::make_shared<CompressedWriteBuffer>(
@@ -808,7 +807,7 @@ bool TCPHandler::isQueryCancelled()
     if (state.is_cancelled || state.sent_all_data)
         return true;
 
-    if (after_check_cancelled.elapsed() / 1000 < query_context.getSettingsRef().interactive_delay)
+    if (after_check_cancelled.elapsed() / 1000 < query_context->getSettingsRef().interactive_delay)
         return false;
 
     after_check_cancelled.restart();
diff --git a/dbms/programs/server/TCPHandler.h b/dbms/programs/server/TCPHandler.h
index bd375dc5296..38ab27fd67b 100644
--- a/dbms/programs/server/TCPHandler.h
+++ b/dbms/programs/server/TCPHandler.h
@@ -109,7 +109,7 @@ private:
     UInt64 client_revision = 0;
 
     Context connection_context;
-    Context query_context;
+    std::optional<Context> query_context;
 
     /// Streams for reading/writing from/to client connection socket.
     std::shared_ptr<ReadBuffer> in;