mirror of
https://github.com/ClickHouse/ClickHouse.git
synced 2024-11-23 08:02:02 +00:00
Merge branch 'master' into fix-backup-without-native-copy
This commit is contained in:
commit
ef8faeffc0
20
.clang-tidy
20
.clang-tidy
@ -22,6 +22,7 @@ Checks: [
|
|||||||
'-bugprone-exception-escape',
|
'-bugprone-exception-escape',
|
||||||
'-bugprone-forward-declaration-namespace',
|
'-bugprone-forward-declaration-namespace',
|
||||||
'-bugprone-implicit-widening-of-multiplication-result',
|
'-bugprone-implicit-widening-of-multiplication-result',
|
||||||
|
'-bugprone-multi-level-implicit-pointer-conversion',
|
||||||
'-bugprone-narrowing-conversions',
|
'-bugprone-narrowing-conversions',
|
||||||
'-bugprone-not-null-terminated-result',
|
'-bugprone-not-null-terminated-result',
|
||||||
'-bugprone-reserved-identifier', # useful but too slow, TODO retry when https://reviews.llvm.org/rG1c282052624f9d0bd273bde0b47b30c96699c6c7 is merged
|
'-bugprone-reserved-identifier', # useful but too slow, TODO retry when https://reviews.llvm.org/rG1c282052624f9d0bd273bde0b47b30c96699c6c7 is merged
|
||||||
@ -98,6 +99,7 @@ Checks: [
|
|||||||
'-modernize-use-nodiscard',
|
'-modernize-use-nodiscard',
|
||||||
'-modernize-use-trailing-return-type',
|
'-modernize-use-trailing-return-type',
|
||||||
|
|
||||||
|
'-performance-enum-size',
|
||||||
'-performance-inefficient-string-concatenation',
|
'-performance-inefficient-string-concatenation',
|
||||||
'-performance-no-int-to-ptr',
|
'-performance-no-int-to-ptr',
|
||||||
'-performance-avoid-endl',
|
'-performance-avoid-endl',
|
||||||
@ -105,6 +107,7 @@ Checks: [
|
|||||||
|
|
||||||
'-portability-simd-intrinsics',
|
'-portability-simd-intrinsics',
|
||||||
|
|
||||||
|
'-readability-avoid-nested-conditional-operator',
|
||||||
'-readability-avoid-unconditional-preprocessor-if',
|
'-readability-avoid-unconditional-preprocessor-if',
|
||||||
'-readability-braces-around-statements',
|
'-readability-braces-around-statements',
|
||||||
'-readability-convert-member-functions-to-static',
|
'-readability-convert-member-functions-to-static',
|
||||||
@ -118,6 +121,12 @@ Checks: [
|
|||||||
'-readability-magic-numbers',
|
'-readability-magic-numbers',
|
||||||
'-readability-named-parameter',
|
'-readability-named-parameter',
|
||||||
'-readability-redundant-declaration',
|
'-readability-redundant-declaration',
|
||||||
|
'-readability-redundant-inline-specifier',
|
||||||
|
'-readability-redundant-member-init', # Useful but triggers another problem. Imagine a struct S with multiple String members. Structs are often instantiated via designated
|
||||||
|
# initializer S s{.s1 = [...], .s2 = [...], [...]}. In this case, compiler warning `missing-field-initializers` requires to specify all members which are not in-struct
|
||||||
|
# initialized (example: s1 in struct S { String s1; String s2{};}; is not in-struct initialized, therefore it must be specified at instantiation time). As explicitly
|
||||||
|
# specifying all members is tedious for large structs, `missing-field-initializers` makes programmers initialize as many members as possible in-struct. Clang-tidy
|
||||||
|
# warning `readability-redundant-member-init` does the opposite thing, both are not compatible with each other.
|
||||||
'-readability-simplify-boolean-expr',
|
'-readability-simplify-boolean-expr',
|
||||||
'-readability-suspicious-call-argument',
|
'-readability-suspicious-call-argument',
|
||||||
'-readability-uppercase-literal-suffix',
|
'-readability-uppercase-literal-suffix',
|
||||||
@ -125,17 +134,6 @@ Checks: [
|
|||||||
|
|
||||||
'-zircon-*',
|
'-zircon-*',
|
||||||
|
|
||||||
# These are new in clang-18, and we have to sort them out:
|
|
||||||
'-readability-avoid-nested-conditional-operator',
|
|
||||||
'-modernize-use-designated-initializers',
|
|
||||||
'-performance-enum-size',
|
|
||||||
'-readability-redundant-inline-specifier',
|
|
||||||
'-readability-redundant-member-init',
|
|
||||||
'-bugprone-crtp-constructor-accessibility',
|
|
||||||
'-bugprone-suspicious-stringview-data-usage',
|
|
||||||
'-bugprone-multi-level-implicit-pointer-conversion',
|
|
||||||
'-cert-err33-c',
|
|
||||||
|
|
||||||
# This is a good check, but clang-tidy crashes, see https://github.com/llvm/llvm-project/issues/91872
|
# This is a good check, but clang-tidy crashes, see https://github.com/llvm/llvm-project/issues/91872
|
||||||
'-modernize-use-constraints',
|
'-modernize-use-constraints',
|
||||||
# https://github.com/abseil/abseil-cpp/issues/1667
|
# https://github.com/abseil/abseil-cpp/issues/1667
|
||||||
|
40
.github/workflows/pull_request.yml
vendored
40
.github/workflows/pull_request.yml
vendored
@ -130,15 +130,21 @@ jobs:
|
|||||||
with:
|
with:
|
||||||
stage: Tests_2
|
stage: Tests_2
|
||||||
data: ${{ needs.RunConfig.outputs.data }}
|
data: ${{ needs.RunConfig.outputs.data }}
|
||||||
|
# stage for jobs that do not prohibit merge
|
||||||
|
Tests_3:
|
||||||
|
needs: [RunConfig, Tests_1, Tests_2]
|
||||||
|
if: ${{ !failure() && !cancelled() && contains(fromJson(needs.RunConfig.outputs.data).stages_data.stages_to_do, 'Tests_3') }}
|
||||||
|
uses: ./.github/workflows/reusable_test_stage.yml
|
||||||
|
with:
|
||||||
|
stage: Tests_3
|
||||||
|
data: ${{ needs.RunConfig.outputs.data }}
|
||||||
|
|
||||||
################################# Reports #################################
|
################################# Reports #################################
|
||||||
# Reports should by run even if Builds_1/2 fail, so put them separatly in wf (not in Tests_1/2)
|
# Reports should be run even if Builds_1/2 fail, so put them separately in wf (not in Tests_1/2)
|
||||||
Builds_1_Report:
|
Builds_1_Report:
|
||||||
# run report check for failed builds to indicate the CI error
|
# run report check for failed builds to indicate the CI error
|
||||||
if: ${{ !cancelled() && contains(fromJson(needs.RunConfig.outputs.data).jobs_data.jobs_to_do, 'ClickHouse build check') }}
|
if: ${{ !cancelled() && needs.StyleCheck.result == 'success' && contains(fromJson(needs.RunConfig.outputs.data).jobs_data.jobs_to_do, 'ClickHouse build check') }}
|
||||||
needs:
|
needs: [RunConfig, StyleCheck, Builds_1]
|
||||||
- RunConfig
|
|
||||||
- Builds_1
|
|
||||||
uses: ./.github/workflows/reusable_test.yml
|
uses: ./.github/workflows/reusable_test.yml
|
||||||
with:
|
with:
|
||||||
test_name: ClickHouse build check
|
test_name: ClickHouse build check
|
||||||
@ -146,25 +152,39 @@ jobs:
|
|||||||
data: ${{ needs.RunConfig.outputs.data }}
|
data: ${{ needs.RunConfig.outputs.data }}
|
||||||
Builds_2_Report:
|
Builds_2_Report:
|
||||||
# run report check for failed builds to indicate the CI error
|
# run report check for failed builds to indicate the CI error
|
||||||
if: ${{ !cancelled() && contains(fromJson(needs.RunConfig.outputs.data).jobs_data.jobs_to_do, 'ClickHouse special build check') }}
|
if: ${{ !cancelled() && needs.StyleCheck.result == 'success' && contains(fromJson(needs.RunConfig.outputs.data).jobs_data.jobs_to_do, 'ClickHouse special build check') }}
|
||||||
needs:
|
needs: [RunConfig, StyleCheck, Builds_2]
|
||||||
- RunConfig
|
|
||||||
- Builds_2
|
|
||||||
uses: ./.github/workflows/reusable_test.yml
|
uses: ./.github/workflows/reusable_test.yml
|
||||||
with:
|
with:
|
||||||
test_name: ClickHouse special build check
|
test_name: ClickHouse special build check
|
||||||
runner_type: style-checker-aarch64
|
runner_type: style-checker-aarch64
|
||||||
data: ${{ needs.RunConfig.outputs.data }}
|
data: ${{ needs.RunConfig.outputs.data }}
|
||||||
|
|
||||||
|
CheckReadyForMerge:
|
||||||
|
if: ${{ !cancelled() && needs.StyleCheck.result == 'success' }}
|
||||||
|
needs: [RunConfig, BuildDockers, StyleCheck, FastTest, Builds_1, Builds_2, Builds_1_Report, Builds_2_Report, Tests_1, Tests_2]
|
||||||
|
runs-on: [self-hosted, style-checker-aarch64]
|
||||||
|
steps:
|
||||||
|
- name: Check out repository code
|
||||||
|
uses: ClickHouse/checkout@v1
|
||||||
|
with:
|
||||||
|
filter: tree:0
|
||||||
|
- name: Check and set merge status
|
||||||
|
run: |
|
||||||
|
cd "$GITHUB_WORKSPACE/tests/ci"
|
||||||
|
python3 merge_pr.py --set-ci-status --wf-status ${{ contains(needs.*.result, 'failure') && 'failure' || 'success' }}
|
||||||
|
|
||||||
################################# Stage Final #################################
|
################################# Stage Final #################################
|
||||||
#
|
#
|
||||||
FinishCheck:
|
FinishCheck:
|
||||||
if: ${{ !failure() && !cancelled() }}
|
if: ${{ !failure() && !cancelled() }}
|
||||||
needs: [RunConfig, BuildDockers, StyleCheck, FastTest, Builds_1, Builds_2, Builds_1_Report, Builds_2_Report, Tests_1, Tests_2]
|
needs: [RunConfig, BuildDockers, StyleCheck, FastTest, Builds_1, Builds_2, Builds_1_Report, Builds_2_Report, Tests_1, Tests_2, Tests_3]
|
||||||
runs-on: [self-hosted, style-checker]
|
runs-on: [self-hosted, style-checker]
|
||||||
steps:
|
steps:
|
||||||
- name: Check out repository code
|
- name: Check out repository code
|
||||||
uses: ClickHouse/checkout@v1
|
uses: ClickHouse/checkout@v1
|
||||||
|
with:
|
||||||
|
filter: tree:0
|
||||||
- name: Finish label
|
- name: Finish label
|
||||||
run: |
|
run: |
|
||||||
cd "$GITHUB_WORKSPACE/tests/ci"
|
cd "$GITHUB_WORKSPACE/tests/ci"
|
||||||
|
@ -61,9 +61,11 @@ if (ENABLE_CHECK_HEAVY_BUILDS)
|
|||||||
# set CPU time limit to 1000 seconds
|
# set CPU time limit to 1000 seconds
|
||||||
set (RLIMIT_CPU 1000)
|
set (RLIMIT_CPU 1000)
|
||||||
|
|
||||||
# Sanitizers are too heavy
|
# Sanitizers are too heavy. Some architectures too.
|
||||||
if (SANITIZE OR SANITIZE_COVERAGE OR WITH_COVERAGE)
|
if (SANITIZE OR SANITIZE_COVERAGE OR WITH_COVERAGE OR ARCH_RISCV64 OR ARCH_LOONGARCH64)
|
||||||
set (RLIMIT_DATA 10000000000) # 10G
|
# Twice as large
|
||||||
|
set (RLIMIT_DATA 10000000000)
|
||||||
|
set (RLIMIT_AS 20000000000)
|
||||||
endif()
|
endif()
|
||||||
|
|
||||||
# For some files currently building RISCV64 might be too slow. TODO: Improve compilation times per file
|
# For some files currently building RISCV64 might be too slow. TODO: Improve compilation times per file
|
||||||
|
@ -9,11 +9,18 @@
|
|||||||
bool cgroupsV2Enabled()
|
bool cgroupsV2Enabled()
|
||||||
{
|
{
|
||||||
#if defined(OS_LINUX)
|
#if defined(OS_LINUX)
|
||||||
|
try
|
||||||
|
{
|
||||||
/// This file exists iff the host has cgroups v2 enabled.
|
/// This file exists iff the host has cgroups v2 enabled.
|
||||||
auto controllers_file = default_cgroups_mount / "cgroup.controllers";
|
auto controllers_file = default_cgroups_mount / "cgroup.controllers";
|
||||||
if (!std::filesystem::exists(controllers_file))
|
if (!std::filesystem::exists(controllers_file))
|
||||||
return false;
|
return false;
|
||||||
return true;
|
return true;
|
||||||
|
}
|
||||||
|
catch (const std::filesystem::filesystem_error &) /// all "underlying OS API errors", typically: permission denied
|
||||||
|
{
|
||||||
|
return false; /// not logging the exception as most callers fall back to cgroups v1
|
||||||
|
}
|
||||||
#else
|
#else
|
||||||
return false;
|
return false;
|
||||||
#endif
|
#endif
|
||||||
|
2
contrib/libunwind
vendored
2
contrib/libunwind
vendored
@ -1 +1 @@
|
|||||||
Subproject commit 854538ce337d631b619010528adff22cd58f9dce
|
Subproject commit d6a01c46327e56fd86beb8aaa31591fcd9a6b7df
|
@ -160,10 +160,17 @@ function clone_submodules
|
|||||||
|
|
||||||
git submodule sync
|
git submodule sync
|
||||||
git submodule init
|
git submodule init
|
||||||
|
|
||||||
|
# Network is unreliable
|
||||||
|
for _ in {1..10}
|
||||||
|
do
|
||||||
# --jobs does not work as fast as real parallel running
|
# --jobs does not work as fast as real parallel running
|
||||||
printf '%s\0' "${SUBMODULES_TO_UPDATE[@]}" | \
|
printf '%s\0' "${SUBMODULES_TO_UPDATE[@]}" | \
|
||||||
xargs --max-procs=100 --null --no-run-if-empty --max-args=1 \
|
xargs --max-procs=100 --null --no-run-if-empty --max-args=1 \
|
||||||
git submodule update --depth 1 --single-branch
|
git submodule update --depth 1 --single-branch && break
|
||||||
|
sleep 1
|
||||||
|
done
|
||||||
|
|
||||||
git submodule foreach git reset --hard
|
git submodule foreach git reset --hard
|
||||||
git submodule foreach git checkout @ -f
|
git submodule foreach git checkout @ -f
|
||||||
git submodule foreach git clean -xfd
|
git submodule foreach git clean -xfd
|
||||||
|
@ -58,8 +58,14 @@ echo "ATTACH DATABASE system ENGINE=Ordinary" > /var/lib/clickhouse/metadata/sys
|
|||||||
# Install previous release packages
|
# Install previous release packages
|
||||||
install_packages previous_release_package_folder
|
install_packages previous_release_package_folder
|
||||||
|
|
||||||
# Save old settings from system table for settings changes check
|
# NOTE: we need to run clickhouse-local under `script` to get the settings without any of the adjustments that clickhouse-local applies when stdout is not a tty
|
||||||
clickhouse-local -q "select * from system.settings format Native" > old_settings.native
|
function save_settings_clean()
|
||||||
|
{
|
||||||
|
local out=$1 && shift
|
||||||
|
script -q -c "clickhouse-local -q \"select * from system.settings into outfile '$out'\"" --log-out /dev/null
|
||||||
|
}
|
||||||
|
|
||||||
|
save_settings_clean 'old_settings.native'
|
||||||
|
|
||||||
# Initial run without S3 to create system.*_log on local file system to make it
|
# Initial run without S3 to create system.*_log on local file system to make it
|
||||||
# available for dump via clickhouse-local
|
# available for dump via clickhouse-local
|
||||||
@ -183,7 +189,7 @@ configure
|
|||||||
IS_SANITIZED=$(clickhouse-local --query "SELECT value LIKE '%-fsanitize=%' FROM system.build_options WHERE name = 'CXX_FLAGS'")
|
IS_SANITIZED=$(clickhouse-local --query "SELECT value LIKE '%-fsanitize=%' FROM system.build_options WHERE name = 'CXX_FLAGS'")
|
||||||
if [ "${IS_SANITIZED}" -eq "0" ]
|
if [ "${IS_SANITIZED}" -eq "0" ]
|
||||||
then
|
then
|
||||||
clickhouse-local -q "select * from system.settings format Native" > new_settings.native
|
save_settings_clean 'new_settings.native'
|
||||||
clickhouse-local -nmq "
|
clickhouse-local -nmq "
|
||||||
CREATE TABLE old_settings AS file('old_settings.native');
|
CREATE TABLE old_settings AS file('old_settings.native');
|
||||||
CREATE TABLE new_settings AS file('new_settings.native');
|
CREATE TABLE new_settings AS file('new_settings.native');
|
||||||
|
@ -22,7 +22,7 @@ description: In order to effectively mitigate possible human errors, you should
|
|||||||
TEMPORARY TABLE table_name [AS table_name_in_backup] |
|
TEMPORARY TABLE table_name [AS table_name_in_backup] |
|
||||||
VIEW view_name [AS view_name_in_backup]
|
VIEW view_name [AS view_name_in_backup]
|
||||||
ALL TEMPORARY TABLES [EXCEPT ...] |
|
ALL TEMPORARY TABLES [EXCEPT ...] |
|
||||||
ALL DATABASES [EXCEPT ...] } [,...]
|
ALL [EXCEPT ...] } [,...]
|
||||||
[ON CLUSTER 'cluster_name']
|
[ON CLUSTER 'cluster_name']
|
||||||
TO|FROM File('<path>/<filename>') | Disk('<disk_name>', '<path>/') | S3('<S3 endpoint>/<path>', '<Access key ID>', '<Secret access key>')
|
TO|FROM File('<path>/<filename>') | Disk('<disk_name>', '<path>/') | S3('<S3 endpoint>/<path>', '<Access key ID>', '<Secret access key>')
|
||||||
[SETTINGS base_backup = File('<path>/<filename>') | Disk(...) | S3('<S3 endpoint>/<path>', '<Access key ID>', '<Secret access key>')]
|
[SETTINGS base_backup = File('<path>/<filename>') | Disk(...) | S3('<S3 endpoint>/<path>', '<Access key ID>', '<Secret access key>')]
|
||||||
|
@ -7,27 +7,27 @@ title: "External Disks for Storing Data"
|
|||||||
|
|
||||||
Data processed in ClickHouse is usually stored in the local file system — on the same machine as the ClickHouse server. That requires large-capacity disks, which can be quite expensive. To avoid that, you can store the data remotely. Various storages are supported:
|
Data processed in ClickHouse is usually stored in the local file system — on the same machine as the ClickHouse server. That requires large-capacity disks, which can be quite expensive. To avoid that, you can store the data remotely. Various storages are supported:
|
||||||
1. [Amazon S3](https://aws.amazon.com/s3/) object storage.
|
1. [Amazon S3](https://aws.amazon.com/s3/) object storage.
|
||||||
2. The Hadoop Distributed File System ([HDFS](https://hadoop.apache.org/docs/current/hadoop-project-dist/hadoop-hdfs/HdfsDesign.html))
|
2. [Azure Blob Storage](https://azure.microsoft.com/en-us/products/storage/blobs).
|
||||||
3. [Azure Blob Storage](https://azure.microsoft.com/en-us/products/storage/blobs).
|
3. Unsupported: The Hadoop Distributed File System ([HDFS](https://hadoop.apache.org/docs/current/hadoop-project-dist/hadoop-hdfs/HdfsDesign.html))
|
||||||
|
|
||||||
:::note ClickHouse also has support for external table engines, which are different from the external storage options described on this page, as they allow reading data stored in some general file format (like Parquet), whereas this page describes storage configuration for ClickHouse `MergeTree` family or `Log` family tables.
|
:::note ClickHouse also has support for external table engines, which are different from the external storage options described on this page, as they allow reading data stored in some general file format (like Parquet), whereas this page describes storage configuration for ClickHouse `MergeTree` family or `Log` family tables.
|
||||||
1. to work with data stored on `Amazon S3` disks, use [S3](/docs/en/engines/table-engines/integrations/s3.md) table engine.
|
1. to work with data stored on `Amazon S3` disks, use [S3](/docs/en/engines/table-engines/integrations/s3.md) table engine.
|
||||||
2. to work with data in the Hadoop Distributed File System — [HDFS](/docs/en/engines/table-engines/integrations/hdfs.md) table engine.
|
2. to work with data stored in Azure Blob Storage use [AzureBlobStorage](/docs/en/engines/table-engines/integrations/azureBlobStorage.md) table engine.
|
||||||
3. to work with data stored in Azure Blob Storage use [AzureBlobStorage](/docs/en/engines/table-engines/integrations/azureBlobStorage.md) table engine.
|
3. Unsupported: to work with data in the Hadoop Distributed File System — [HDFS](/docs/en/engines/table-engines/integrations/hdfs.md) table engine.
|
||||||
:::
|
:::
|
||||||
|
|
||||||
## Configuring external storage {#configuring-external-storage}
|
## Configuring external storage {#configuring-external-storage}
|
||||||
|
|
||||||
[MergeTree](/docs/en/engines/table-engines/mergetree-family/mergetree.md) and [Log](/docs/en/engines/table-engines/log-family/log.md) family table engines can store data to `S3`, `AzureBlobStorage`, `HDFS` using a disk with types `s3`, `azure_blob_storage`, `hdfs` accordingly.
|
[MergeTree](/docs/en/engines/table-engines/mergetree-family/mergetree.md) and [Log](/docs/en/engines/table-engines/log-family/log.md) family table engines can store data to `S3`, `AzureBlobStorage`, `HDFS` (unsupported) using a disk with types `s3`, `azure_blob_storage`, `hdfs` (unsupported) accordingly.
|
||||||
|
|
||||||
Disk configuration requires:
|
Disk configuration requires:
|
||||||
1. `type` section, equal to one of `s3`, `azure_blob_storage`, `hdfs`, `local_blob_storage`, `web`.
|
1. `type` section, equal to one of `s3`, `azure_blob_storage`, `hdfs` (unsupported), `local_blob_storage`, `web`.
|
||||||
2. Configuration of a specific external storage type.
|
2. Configuration of a specific external storage type.
|
||||||
|
|
||||||
Starting from ClickHouse version 24.1, it is possible to use a new configuration option.
|
Starting from ClickHouse version 24.1, it is possible to use a new configuration option.
|
||||||
It requires specifying:
|
It requires specifying:
|
||||||
1. `type` equal to `object_storage`
|
1. `type` equal to `object_storage`
|
||||||
2. `object_storage_type`, equal to one of `s3`, `azure_blob_storage` (or just `azure` from `24.3`), `hdfs`, `local_blob_storage` (or just `local` from `24.3`), `web`.
|
2. `object_storage_type`, equal to one of `s3`, `azure_blob_storage` (or just `azure` from `24.3`), `hdfs` (unsupported), `local_blob_storage` (or just `local` from `24.3`), `web`.
|
||||||
Optionally, `metadata_type` can be specified (it is equal to `local` by default), but it can also be set to `plain`, `web` and, starting from `24.4`, `plain_rewritable`.
|
Optionally, `metadata_type` can be specified (it is equal to `local` by default), but it can also be set to `plain`, `web` and, starting from `24.4`, `plain_rewritable`.
|
||||||
Usage of `plain` metadata type is described in [plain storage section](/docs/en/operations/storing-data.md/#storing-data-on-webserver), `web` metadata type can be used only with `web` object storage type, `local` metadata type stores metadata files locally (each metadata file contains a mapping to files in object storage and some additional meta information about them).
|
Usage of `plain` metadata type is described in [plain storage section](/docs/en/operations/storing-data.md/#storing-data-on-webserver), `web` metadata type can be used only with `web` object storage type, `local` metadata type stores metadata files locally (each metadata file contains a mapping to files in object storage and some additional meta information about them).
|
||||||
|
|
||||||
@ -328,7 +328,7 @@ Configuration:
|
|||||||
</s3_plain>
|
</s3_plain>
|
||||||
```
|
```
|
||||||
|
|
||||||
Starting from `24.1` it is possible configure any object storage disk (`s3`, `azure`, `hdfs`, `local`) using `plain` metadata type.
|
Starting from `24.1` it is possible to configure any object storage disk (`s3`, `azure`, `hdfs` (unsupported), `local`) using `plain` metadata type.
|
||||||
|
|
||||||
Configuration:
|
Configuration:
|
||||||
``` xml
|
``` xml
|
||||||
@ -428,12 +428,14 @@ Examples of working configurations can be found in integration tests directory (
|
|||||||
Zero-copy replication is disabled by default in ClickHouse version 22.8 and higher. This feature is not recommended for production use.
|
Zero-copy replication is disabled by default in ClickHouse version 22.8 and higher. This feature is not recommended for production use.
|
||||||
:::
|
:::
|
||||||
|
|
||||||
## Using HDFS storage {#hdfs-storage}
|
## Using HDFS storage (Unsupported)
|
||||||
|
|
||||||
In this sample configuration:
|
In this sample configuration:
|
||||||
- the disk is of type `hdfs`
|
- the disk is of type `hdfs` (unsupported)
|
||||||
- the data is hosted at `hdfs://hdfs1:9000/clickhouse/`
|
- the data is hosted at `hdfs://hdfs1:9000/clickhouse/`
|
||||||
|
|
||||||
|
Note that HDFS is unsupported, so you may encounter issues when using it. Feel free to submit a pull request with a fix if any issue arises.
|
||||||
|
|
||||||
```xml
|
```xml
|
||||||
<clickhouse>
|
<clickhouse>
|
||||||
<storage_configuration>
|
<storage_configuration>
|
||||||
@ -464,9 +466,11 @@ In this sample configuration:
|
|||||||
</clickhouse>
|
</clickhouse>
|
||||||
```
|
```
|
||||||
|
|
||||||
|
Keep in mind that HDFS may not work in corner cases.
|
||||||
|
|
||||||
### Using Data Encryption {#encrypted-virtual-file-system}
|
### Using Data Encryption {#encrypted-virtual-file-system}
|
||||||
|
|
||||||
You can encrypt the data stored on [S3](/docs/en/engines/table-engines/mergetree-family/mergetree.md/#table_engine-mergetree-s3), or [HDFS](#configuring-hdfs) external disks, or on a local disk. To turn on the encryption mode, in the configuration file you must define a disk with the type `encrypted` and choose a disk on which the data will be saved. An `encrypted` disk ciphers all written files on the fly, and when you read files from an `encrypted` disk it deciphers them automatically. So you can work with an `encrypted` disk like with a normal one.
|
You can encrypt the data stored on [S3](/docs/en/engines/table-engines/mergetree-family/mergetree.md/#table_engine-mergetree-s3), or [HDFS](#configuring-hdfs) (unsupported) external disks, or on a local disk. To turn on the encryption mode, in the configuration file you must define a disk with the type `encrypted` and choose a disk on which the data will be saved. An `encrypted` disk ciphers all written files on the fly, and when you read files from an `encrypted` disk it deciphers them automatically. So you can work with an `encrypted` disk like with a normal one.
|
||||||
|
|
||||||
Example of disk configuration:
|
Example of disk configuration:
|
||||||
|
|
||||||
@ -529,7 +533,7 @@ Example of disk configuration:
|
|||||||
|
|
||||||
It is possible to configure local cache over disks in storage configuration starting from version 22.3.
|
It is possible to configure local cache over disks in storage configuration starting from version 22.3.
|
||||||
For versions 22.3 - 22.7 cache is supported only for `s3` disk type. For versions >= 22.8 cache is supported for any disk type: S3, Azure, Local, Encrypted, etc.
|
For versions 22.3 - 22.7 cache is supported only for `s3` disk type. For versions >= 22.8 cache is supported for any disk type: S3, Azure, Local, Encrypted, etc.
|
||||||
For versions >= 23.5 cache is supported only for remote disk types: S3, Azure, HDFS.
|
For versions >= 23.5 cache is supported only for remote disk types: S3, Azure, HDFS (unsupported).
|
||||||
Cache uses `LRU` cache policy.
|
Cache uses `LRU` cache policy.
|
||||||
|
|
||||||
|
|
||||||
@ -971,7 +975,7 @@ Use [http_max_single_read_retries](/docs/en/operations/settings/settings.md/#htt
|
|||||||
|
|
||||||
### Zero-copy Replication (not ready for production) {#zero-copy}
|
### Zero-copy Replication (not ready for production) {#zero-copy}
|
||||||
|
|
||||||
Zero-copy replication is possible, but not recommended, with `S3` and `HDFS` disks. Zero-copy replication means that if the data is stored remotely on several machines and needs to be synchronized, then only the metadata is replicated (paths to the data parts), but not the data itself.
|
Zero-copy replication is possible, but not recommended, with `S3` and `HDFS` (unsupported) disks. Zero-copy replication means that if the data is stored remotely on several machines and needs to be synchronized, then only the metadata is replicated (paths to the data parts), but not the data itself.
|
||||||
|
|
||||||
:::note Zero-copy replication is not ready for production
|
:::note Zero-copy replication is not ready for production
|
||||||
Zero-copy replication is disabled by default in ClickHouse version 22.8 and higher. This feature is not recommended for production use.
|
Zero-copy replication is disabled by default in ClickHouse version 22.8 and higher. This feature is not recommended for production use.
|
||||||
|
@ -108,7 +108,7 @@ Columns:
|
|||||||
- `used_aggregate_function_combinators` ([Array(String)](../../sql-reference/data-types/array.md)) — Canonical names of `aggregate functions combinators`, which were used during query execution.
|
- `used_aggregate_function_combinators` ([Array(String)](../../sql-reference/data-types/array.md)) — Canonical names of `aggregate functions combinators`, which were used during query execution.
|
||||||
- `used_database_engines` ([Array(String)](../../sql-reference/data-types/array.md)) — Canonical names of `database engines`, which were used during query execution.
|
- `used_database_engines` ([Array(String)](../../sql-reference/data-types/array.md)) — Canonical names of `database engines`, which were used during query execution.
|
||||||
- `used_data_type_families` ([Array(String)](../../sql-reference/data-types/array.md)) — Canonical names of `data type families`, which were used during query execution.
|
- `used_data_type_families` ([Array(String)](../../sql-reference/data-types/array.md)) — Canonical names of `data type families`, which were used during query execution.
|
||||||
- `used_dictionaries` ([Array(String)](../../sql-reference/data-types/array.md)) — Canonical names of `dictionaries`, which were used during query execution.
|
- `used_dictionaries` ([Array(String)](../../sql-reference/data-types/array.md)) — Canonical names of `dictionaries`, which were used during query execution. For dictionaries configured using an XML file this is the name of the dictionary, and for dictionaries created by an SQL statement, the canonical name is the fully qualified object name.
|
||||||
- `used_formats` ([Array(String)](../../sql-reference/data-types/array.md)) — Canonical names of `formats`, which were used during query execution.
|
- `used_formats` ([Array(String)](../../sql-reference/data-types/array.md)) — Canonical names of `formats`, which were used during query execution.
|
||||||
- `used_functions` ([Array(String)](../../sql-reference/data-types/array.md)) — Canonical names of `functions`, which were used during query execution.
|
- `used_functions` ([Array(String)](../../sql-reference/data-types/array.md)) — Canonical names of `functions`, which were used during query execution.
|
||||||
- `used_storages` ([Array(String)](../../sql-reference/data-types/array.md)) — Canonical names of `storages`, which were used during query execution.
|
- `used_storages` ([Array(String)](../../sql-reference/data-types/array.md)) — Canonical names of `storages`, which were used during query execution.
|
||||||
|
@ -0,0 +1,45 @@
|
|||||||
|
---
|
||||||
|
slug: /en/sql-reference/aggregate-functions/reference/analysis_of_variance
|
||||||
|
sidebar_position: 6
|
||||||
|
---
|
||||||
|
|
||||||
|
# analysisOfVariance
|
||||||
|
|
||||||
|
Provides a statistical test for one-way analysis of variance (ANOVA test). It is a test over several groups of normally distributed observations to find out whether all groups have the same mean or not.
|
||||||
|
|
||||||
|
**Syntax**
|
||||||
|
|
||||||
|
```sql
|
||||||
|
analysisOfVariance(val, group_no)
|
||||||
|
```
|
||||||
|
|
||||||
|
Aliases: `anova`
|
||||||
|
|
||||||
|
**Parameters**
|
||||||
|
- `val`: value.
|
||||||
|
- `group_no`: group number that `val` belongs to.
|
||||||
|
|
||||||
|
:::note
|
||||||
|
Groups are enumerated starting from 0 and there should be at least two groups to perform a test.
|
||||||
|
There should be at least one group with the number of observations greater than one.
|
||||||
|
:::
|
||||||
|
|
||||||
|
**Returned value**
|
||||||
|
|
||||||
|
- `(f_statistic, p_value)`. [Tuple](../../data-types/tuple.md)([Float64](../../data-types/float.md), [Float64](../../data-types/float.md)).
|
||||||
|
|
||||||
|
**Example**
|
||||||
|
|
||||||
|
Query:
|
||||||
|
|
||||||
|
```sql
|
||||||
|
SELECT analysisOfVariance(number, number % 2) FROM numbers(1048575);
|
||||||
|
```
|
||||||
|
|
||||||
|
Result:
|
||||||
|
|
||||||
|
```response
|
||||||
|
┌─analysisOfVariance(number, modulo(number, 2))─┐
|
||||||
|
│ (0,1) │
|
||||||
|
└───────────────────────────────────────────────┘
|
||||||
|
```
|
@ -37,6 +37,7 @@ Standard aggregate functions:
|
|||||||
|
|
||||||
ClickHouse-specific aggregate functions:
|
ClickHouse-specific aggregate functions:
|
||||||
|
|
||||||
|
- [analysisOfVariance](/docs/en/sql-reference/aggregate-functions/reference/analysis_of_variance.md)
|
||||||
- [any](/docs/en/sql-reference/aggregate-functions/reference/any_respect_nulls.md)
|
- [any](/docs/en/sql-reference/aggregate-functions/reference/any_respect_nulls.md)
|
||||||
- [anyHeavy](/docs/en/sql-reference/aggregate-functions/reference/anyheavy.md)
|
- [anyHeavy](/docs/en/sql-reference/aggregate-functions/reference/anyheavy.md)
|
||||||
- [anyLast](/docs/en/sql-reference/aggregate-functions/reference/anylast.md)
|
- [anyLast](/docs/en/sql-reference/aggregate-functions/reference/anylast.md)
|
||||||
|
@ -998,17 +998,170 @@ SELECT version()
|
|||||||
Returns the build ID generated by a compiler for the running ClickHouse server binary.
|
Returns the build ID generated by a compiler for the running ClickHouse server binary.
|
||||||
If executed in the context of a distributed table, this function generates a normal column with values relevant to each shard. Otherwise it produces a constant value.
|
If executed in the context of a distributed table, this function generates a normal column with values relevant to each shard. Otherwise it produces a constant value.
|
||||||
|
|
||||||
## blockNumber()
|
## blockNumber
|
||||||
|
|
||||||
Returns the sequence number of the data block where the row is located.
|
Returns a monotonically increasing sequence number of the [block](../../development/architecture.md#block) containing the row.
|
||||||
|
The returned block number is updated on a best-effort basis, i.e. it may not be fully accurate.
|
||||||
|
|
||||||
## rowNumberInBlock() {#rowNumberInBlock}
|
**Syntax**
|
||||||
|
|
||||||
|
```sql
|
||||||
|
blockNumber()
|
||||||
|
```
|
||||||
|
|
||||||
|
**Returned value**
|
||||||
|
|
||||||
|
- Sequence number of the data block where the row is located. [UInt64](../data-types/int-uint.md).
|
||||||
|
|
||||||
|
**Example**
|
||||||
|
|
||||||
|
Query:
|
||||||
|
|
||||||
|
```sql
|
||||||
|
SELECT blockNumber()
|
||||||
|
FROM
|
||||||
|
(
|
||||||
|
SELECT *
|
||||||
|
FROM system.numbers
|
||||||
|
LIMIT 10
|
||||||
|
) SETTINGS max_block_size = 2
|
||||||
|
```
|
||||||
|
|
||||||
|
Result:
|
||||||
|
|
||||||
|
```response
|
||||||
|
┌─blockNumber()─┐
|
||||||
|
│ 7 │
|
||||||
|
│ 7 │
|
||||||
|
└───────────────┘
|
||||||
|
┌─blockNumber()─┐
|
||||||
|
│ 8 │
|
||||||
|
│ 8 │
|
||||||
|
└───────────────┘
|
||||||
|
┌─blockNumber()─┐
|
||||||
|
│ 9 │
|
||||||
|
│ 9 │
|
||||||
|
└───────────────┘
|
||||||
|
┌─blockNumber()─┐
|
||||||
|
│ 10 │
|
||||||
|
│ 10 │
|
||||||
|
└───────────────┘
|
||||||
|
┌─blockNumber()─┐
|
||||||
|
│ 11 │
|
||||||
|
│ 11 │
|
||||||
|
└───────────────┘
|
||||||
|
```
|
||||||
|
|
||||||
|
## rowNumberInBlock {#rowNumberInBlock}
|
||||||
|
|
||||||
|
For each [block](../../development/architecture.md#block) processed by `rowNumberInBlock`, returns the number of the current row.
|
||||||
|
The returned number starts at 0 for each block.
|
||||||
|
|
||||||
|
**Syntax**
|
||||||
|
|
||||||
|
```sql
|
||||||
|
rowNumberInBlock()
|
||||||
|
```
|
||||||
|
|
||||||
|
**Returned value**
|
||||||
|
|
||||||
|
- Ordinal number of the row in the data block starting from 0. [UInt64](../data-types/int-uint.md).
|
||||||
|
|
||||||
|
**Example**
|
||||||
|
|
||||||
|
Query:
|
||||||
|
|
||||||
|
```sql
|
||||||
|
SELECT rowNumberInBlock()
|
||||||
|
FROM
|
||||||
|
(
|
||||||
|
SELECT *
|
||||||
|
FROM system.numbers_mt
|
||||||
|
LIMIT 10
|
||||||
|
) SETTINGS max_block_size = 2
|
||||||
|
```
|
||||||
|
|
||||||
|
Result:
|
||||||
|
|
||||||
|
```response
|
||||||
|
┌─rowNumberInBlock()─┐
|
||||||
|
│ 0 │
|
||||||
|
│ 1 │
|
||||||
|
└────────────────────┘
|
||||||
|
┌─rowNumberInBlock()─┐
|
||||||
|
│ 0 │
|
||||||
|
│ 1 │
|
||||||
|
└────────────────────┘
|
||||||
|
┌─rowNumberInBlock()─┐
|
||||||
|
│ 0 │
|
||||||
|
│ 1 │
|
||||||
|
└────────────────────┘
|
||||||
|
┌─rowNumberInBlock()─┐
|
||||||
|
│ 0 │
|
||||||
|
│ 1 │
|
||||||
|
└────────────────────┘
|
||||||
|
┌─rowNumberInBlock()─┐
|
||||||
|
│ 0 │
|
||||||
|
│ 1 │
|
||||||
|
└────────────────────┘
|
||||||
|
```
|
||||||
|
|
||||||
|
## rowNumberInAllBlocks
|
||||||
|
|
||||||
|
Returns a unique row number for each row processed by `rowNumberInAllBlocks`. The returned numbers start at 0.
|
||||||
|
|
||||||
|
**Syntax**
|
||||||
|
|
||||||
|
```sql
|
||||||
|
rowNumberInAllBlocks()
|
||||||
|
```
|
||||||
|
|
||||||
|
**Returned value**
|
||||||
|
|
||||||
|
- Ordinal number of the row across all processed data blocks, starting from 0. [UInt64](../data-types/int-uint.md).
|
||||||
|
|
||||||
|
**Example**
|
||||||
|
|
||||||
|
Query:
|
||||||
|
|
||||||
|
```sql
|
||||||
|
SELECT rowNumberInAllBlocks()
|
||||||
|
FROM
|
||||||
|
(
|
||||||
|
SELECT *
|
||||||
|
FROM system.numbers_mt
|
||||||
|
LIMIT 10
|
||||||
|
)
|
||||||
|
SETTINGS max_block_size = 2
|
||||||
|
```
|
||||||
|
|
||||||
|
Result:
|
||||||
|
|
||||||
|
```response
|
||||||
|
┌─rowNumberInAllBlocks()─┐
|
||||||
|
│ 0 │
|
||||||
|
│ 1 │
|
||||||
|
└────────────────────────┘
|
||||||
|
┌─rowNumberInAllBlocks()─┐
|
||||||
|
│ 4 │
|
||||||
|
│ 5 │
|
||||||
|
└────────────────────────┘
|
||||||
|
┌─rowNumberInAllBlocks()─┐
|
||||||
|
│ 2 │
|
||||||
|
│ 3 │
|
||||||
|
└────────────────────────┘
|
||||||
|
┌─rowNumberInAllBlocks()─┐
|
||||||
|
│ 6 │
|
||||||
|
│ 7 │
|
||||||
|
└────────────────────────┘
|
||||||
|
┌─rowNumberInAllBlocks()─┐
|
||||||
|
│ 8 │
|
||||||
|
│ 9 │
|
||||||
|
└────────────────────────┘
|
||||||
|
```
|
||||||
|
|
||||||
Returns the ordinal number of the row in the data block. Different data blocks are always recalculated.
|
|
||||||
|
|
||||||
## rowNumberInAllBlocks()
|
|
||||||
|
|
||||||
Returns the ordinal number of the row in the data block. This function only considers the affected data blocks.
|
|
||||||
|
|
||||||
## neighbor
|
## neighbor
|
||||||
|
|
||||||
|
@ -162,7 +162,7 @@ if (ARCH_AMD64 AND OS_LINUX AND NOT OS_ANDROID)
|
|||||||
set (HARMFUL_LIB harmful)
|
set (HARMFUL_LIB harmful)
|
||||||
endif ()
|
endif ()
|
||||||
|
|
||||||
target_link_libraries (clickhouse PRIVATE clickhouse_common_io string_utils ${HARMFUL_LIB})
|
target_link_libraries (clickhouse PRIVATE clickhouse_common_io ${HARMFUL_LIB})
|
||||||
target_include_directories (clickhouse PRIVATE ${CMAKE_CURRENT_BINARY_DIR})
|
target_include_directories (clickhouse PRIVATE ${CMAKE_CURRENT_BINARY_DIR})
|
||||||
|
|
||||||
if (ENABLE_CLICKHOUSE_KEEPER)
|
if (ENABLE_CLICKHOUSE_KEEPER)
|
||||||
|
@ -10,7 +10,6 @@ set (CLICKHOUSE_CLIENT_LINK
|
|||||||
clickhouse_common_io
|
clickhouse_common_io
|
||||||
clickhouse_functions
|
clickhouse_functions
|
||||||
clickhouse_parsers
|
clickhouse_parsers
|
||||||
string_utils
|
|
||||||
)
|
)
|
||||||
|
|
||||||
if (TARGET ch_rust::skim)
|
if (TARGET ch_rust::skim)
|
||||||
|
@ -15,7 +15,7 @@
|
|||||||
#include <Parsers/obfuscateQueries.h>
|
#include <Parsers/obfuscateQueries.h>
|
||||||
#include <Parsers/parseQuery.h>
|
#include <Parsers/parseQuery.h>
|
||||||
#include <Common/ErrorCodes.h>
|
#include <Common/ErrorCodes.h>
|
||||||
#include <Common/StringUtils/StringUtils.h>
|
#include <Common/StringUtils.h>
|
||||||
#include <Common/TerminalSize.h>
|
#include <Common/TerminalSize.h>
|
||||||
#include <Core/BaseSettingsProgramOptions.h>
|
#include <Core/BaseSettingsProgramOptions.h>
|
||||||
|
|
||||||
|
@ -14,7 +14,7 @@
|
|||||||
#include <Common/TerminalSize.h>
|
#include <Common/TerminalSize.h>
|
||||||
#include <Common/Exception.h>
|
#include <Common/Exception.h>
|
||||||
#include <Common/SipHash.h>
|
#include <Common/SipHash.h>
|
||||||
#include <Common/StringUtils/StringUtils.h>
|
#include <Common/StringUtils.h>
|
||||||
#include <Common/ShellCommand.h>
|
#include <Common/ShellCommand.h>
|
||||||
#include <Common/re2.h>
|
#include <Common/re2.h>
|
||||||
#include <base/find_symbols.h>
|
#include <base/find_symbols.h>
|
||||||
|
@ -148,6 +148,7 @@ if (BUILD_STANDALONE_KEEPER)
|
|||||||
${CMAKE_CURRENT_SOURCE_DIR}/../../src/Disks/IO/createReadBufferFromFileBase.cpp
|
${CMAKE_CURRENT_SOURCE_DIR}/../../src/Disks/IO/createReadBufferFromFileBase.cpp
|
||||||
${CMAKE_CURRENT_SOURCE_DIR}/../../src/Disks/IO/ReadBufferFromRemoteFSGather.cpp
|
${CMAKE_CURRENT_SOURCE_DIR}/../../src/Disks/IO/ReadBufferFromRemoteFSGather.cpp
|
||||||
${CMAKE_CURRENT_SOURCE_DIR}/../../src/Disks/IO/IOUringReader.cpp
|
${CMAKE_CURRENT_SOURCE_DIR}/../../src/Disks/IO/IOUringReader.cpp
|
||||||
|
${CMAKE_CURRENT_SOURCE_DIR}/../../src/Disks/IO/getIOUringReader.cpp
|
||||||
${CMAKE_CURRENT_SOURCE_DIR}/../../src/Disks/IO/WriteBufferFromTemporaryFile.cpp
|
${CMAKE_CURRENT_SOURCE_DIR}/../../src/Disks/IO/WriteBufferFromTemporaryFile.cpp
|
||||||
${CMAKE_CURRENT_SOURCE_DIR}/../../src/Disks/IO/WriteBufferWithFinalizeCallback.cpp
|
${CMAKE_CURRENT_SOURCE_DIR}/../../src/Disks/IO/WriteBufferWithFinalizeCallback.cpp
|
||||||
${CMAKE_CURRENT_SOURCE_DIR}/../../src/Disks/IO/AsynchronousBoundedReadBuffer.cpp
|
${CMAKE_CURRENT_SOURCE_DIR}/../../src/Disks/IO/AsynchronousBoundedReadBuffer.cpp
|
||||||
|
@ -1,4 +1,4 @@
|
|||||||
#include <Common/StringUtils/StringUtils.h>
|
#include <Common/StringUtils.h>
|
||||||
#include "config_tools.h"
|
#include "config_tools.h"
|
||||||
|
|
||||||
|
|
||||||
|
@ -1,6 +1,6 @@
|
|||||||
#pragma once
|
#pragma once
|
||||||
|
|
||||||
#include <Common/StringUtils/StringUtils.h>
|
#include <Common/StringUtils.h>
|
||||||
#include <Core/Block.h>
|
#include <Core/Block.h>
|
||||||
#include <base/range.h>
|
#include <base/range.h>
|
||||||
|
|
||||||
|
@ -15,7 +15,7 @@
|
|||||||
|
|
||||||
#include "config_tools.h"
|
#include "config_tools.h"
|
||||||
|
|
||||||
#include <Common/StringUtils/StringUtils.h>
|
#include <Common/StringUtils.h>
|
||||||
#include <Common/getHashOfLoadedBinary.h>
|
#include <Common/getHashOfLoadedBinary.h>
|
||||||
#include <Common/IO.h>
|
#include <Common/IO.h>
|
||||||
|
|
||||||
|
@ -19,7 +19,7 @@
|
|||||||
#include <Processors/LimitTransform.h>
|
#include <Processors/LimitTransform.h>
|
||||||
#include <Common/SipHash.h>
|
#include <Common/SipHash.h>
|
||||||
#include <Common/UTF8Helpers.h>
|
#include <Common/UTF8Helpers.h>
|
||||||
#include <Common/StringUtils/StringUtils.h>
|
#include <Common/StringUtils.h>
|
||||||
#include <Common/HashTable/HashMap.h>
|
#include <Common/HashTable/HashMap.h>
|
||||||
#include <Common/typeid_cast.h>
|
#include <Common/typeid_cast.h>
|
||||||
#include <Common/assert_cast.h>
|
#include <Common/assert_cast.h>
|
||||||
|
@ -4,7 +4,7 @@
|
|||||||
#include <Poco/String.h>
|
#include <Poco/String.h>
|
||||||
#include <base/find_symbols.h>
|
#include <base/find_symbols.h>
|
||||||
#include <Common/Exception.h>
|
#include <Common/Exception.h>
|
||||||
#include <Common/StringUtils/StringUtils.h>
|
#include <Common/StringUtils.h>
|
||||||
#include "validateODBCConnectionString.h"
|
#include "validateODBCConnectionString.h"
|
||||||
|
|
||||||
|
|
||||||
|
@ -13,7 +13,6 @@ set (CLICKHOUSE_SERVER_LINK
|
|||||||
clickhouse_parsers
|
clickhouse_parsers
|
||||||
clickhouse_storages_system
|
clickhouse_storages_system
|
||||||
clickhouse_table_functions
|
clickhouse_table_functions
|
||||||
string_utils
|
|
||||||
|
|
||||||
${LINK_RESOURCE_LIB}
|
${LINK_RESOURCE_LIB}
|
||||||
|
|
||||||
|
@ -1,5 +1,5 @@
|
|||||||
#include <Access/User.h>
|
#include <Access/User.h>
|
||||||
#include <Common/StringUtils/StringUtils.h>
|
#include <Common/StringUtils.h>
|
||||||
#include <Core/Protocol.h>
|
#include <Core/Protocol.h>
|
||||||
#include <base/insertAtEnd.h>
|
#include <base/insertAtEnd.h>
|
||||||
|
|
||||||
|
@ -10,7 +10,7 @@
|
|||||||
#include <Dictionaries/IDictionary.h>
|
#include <Dictionaries/IDictionary.h>
|
||||||
#include <Common/Config/ConfigReloader.h>
|
#include <Common/Config/ConfigReloader.h>
|
||||||
#include <Common/SSHWrapper.h>
|
#include <Common/SSHWrapper.h>
|
||||||
#include <Common/StringUtils/StringUtils.h>
|
#include <Common/StringUtils.h>
|
||||||
#include <Common/quoteString.h>
|
#include <Common/quoteString.h>
|
||||||
#include <Common/transformEndianness.h>
|
#include <Common/transformEndianness.h>
|
||||||
#include <Core/Settings.h>
|
#include <Core/Settings.h>
|
||||||
|
@ -1,6 +1,6 @@
|
|||||||
#include "AggregateFunctionCombinatorFactory.h"
|
#include "AggregateFunctionCombinatorFactory.h"
|
||||||
|
|
||||||
#include <Common/StringUtils/StringUtils.h>
|
#include <Common/StringUtils.h>
|
||||||
|
|
||||||
namespace DB
|
namespace DB
|
||||||
{
|
{
|
||||||
|
@ -39,6 +39,7 @@ public:
|
|||||||
std::optional<UUID> backup_uuid;
|
std::optional<UUID> backup_uuid;
|
||||||
bool deduplicate_files = true;
|
bool deduplicate_files = true;
|
||||||
bool allow_s3_native_copy = true;
|
bool allow_s3_native_copy = true;
|
||||||
|
bool allow_azure_native_copy = true;
|
||||||
bool use_same_s3_credentials_for_base_backup = false;
|
bool use_same_s3_credentials_for_base_backup = false;
|
||||||
bool azure_attempt_to_create_container = true;
|
bool azure_attempt_to_create_container = true;
|
||||||
ReadSettings read_settings;
|
ReadSettings read_settings;
|
||||||
|
@ -31,22 +31,28 @@ namespace ErrorCodes
|
|||||||
|
|
||||||
BackupReaderAzureBlobStorage::BackupReaderAzureBlobStorage(
|
BackupReaderAzureBlobStorage::BackupReaderAzureBlobStorage(
|
||||||
StorageAzureBlob::Configuration configuration_,
|
StorageAzureBlob::Configuration configuration_,
|
||||||
|
bool allow_azure_native_copy,
|
||||||
const ReadSettings & read_settings_,
|
const ReadSettings & read_settings_,
|
||||||
const WriteSettings & write_settings_,
|
const WriteSettings & write_settings_,
|
||||||
const ContextPtr & context_)
|
const ContextPtr & context_)
|
||||||
: BackupReaderDefault(read_settings_, write_settings_, getLogger("BackupReaderAzureBlobStorage"))
|
: BackupReaderDefault(read_settings_, write_settings_, getLogger("BackupReaderAzureBlobStorage"))
|
||||||
, data_source_description{DataSourceType::ObjectStorage, ObjectStorageType::Azure, MetadataStorageType::None, configuration_.container, false, false}
|
, data_source_description{DataSourceType::ObjectStorage, ObjectStorageType::Azure, MetadataStorageType::None, configuration_.getConnectionURL().toString(), false, false}
|
||||||
, configuration(configuration_)
|
, configuration(configuration_)
|
||||||
{
|
{
|
||||||
auto client_ptr = StorageAzureBlob::createClient(configuration, /* is_read_only */ false);
|
auto client_ptr = StorageAzureBlob::createClient(configuration, /* is_read_only */ false);
|
||||||
client_ptr->SetClickhouseOptions(Azure::Storage::Blobs::ClickhouseClientOptions{.IsClientForDisk=true});
|
client_ptr->SetClickhouseOptions(Azure::Storage::Blobs::ClickhouseClientOptions{.IsClientForDisk=true});
|
||||||
|
|
||||||
object_storage = std::make_unique<AzureObjectStorage>("BackupReaderAzureBlobStorage",
|
object_storage = std::make_unique<AzureObjectStorage>(
|
||||||
|
"BackupReaderAzureBlobStorage",
|
||||||
std::move(client_ptr),
|
std::move(client_ptr),
|
||||||
StorageAzureBlob::createSettings(context_),
|
StorageAzureBlob::createSettings(context_),
|
||||||
configuration_.container);
|
configuration.container,
|
||||||
|
configuration.getConnectionURL().toString());
|
||||||
|
|
||||||
client = object_storage->getAzureBlobStorageClient();
|
client = object_storage->getAzureBlobStorageClient();
|
||||||
settings = object_storage->getSettings();
|
auto settings_copy = *object_storage->getSettings();
|
||||||
|
settings_copy.use_native_copy = allow_azure_native_copy;
|
||||||
|
settings = std::make_unique<const AzureObjectStorageSettings>(settings_copy);
|
||||||
}
|
}
|
||||||
|
|
||||||
BackupReaderAzureBlobStorage::~BackupReaderAzureBlobStorage() = default;
|
BackupReaderAzureBlobStorage::~BackupReaderAzureBlobStorage() = default;
|
||||||
@ -76,9 +82,9 @@ void BackupReaderAzureBlobStorage::copyFileToDisk(const String & path_in_backup,
|
|||||||
DiskPtr destination_disk, const String & destination_path, WriteMode write_mode)
|
DiskPtr destination_disk, const String & destination_path, WriteMode write_mode)
|
||||||
{
|
{
|
||||||
auto destination_data_source_description = destination_disk->getDataSourceDescription();
|
auto destination_data_source_description = destination_disk->getDataSourceDescription();
|
||||||
if ((destination_data_source_description.type == DataSourceType::ObjectStorage)
|
LOG_TRACE(log, "Source description {}, desctionation description {}", data_source_description.description, destination_data_source_description.description);
|
||||||
&& (destination_data_source_description.object_storage_type == ObjectStorageType::Azure)
|
if (destination_data_source_description.sameKind(data_source_description)
|
||||||
&& (destination_data_source_description.is_encrypted == encrypted_in_backup))
|
&& destination_data_source_description.is_encrypted == encrypted_in_backup)
|
||||||
{
|
{
|
||||||
LOG_TRACE(log, "Copying {} from AzureBlobStorage to disk {}", path_in_backup, destination_disk->getName());
|
LOG_TRACE(log, "Copying {} from AzureBlobStorage to disk {}", path_in_backup, destination_disk->getName());
|
||||||
auto write_blob_function = [&](const Strings & blob_path, WriteMode mode, const std::optional<ObjectAttributes> &) -> size_t
|
auto write_blob_function = [&](const Strings & blob_path, WriteMode mode, const std::optional<ObjectAttributes> &) -> size_t
|
||||||
@ -116,12 +122,13 @@ void BackupReaderAzureBlobStorage::copyFileToDisk(const String & path_in_backup,
|
|||||||
|
|
||||||
BackupWriterAzureBlobStorage::BackupWriterAzureBlobStorage(
|
BackupWriterAzureBlobStorage::BackupWriterAzureBlobStorage(
|
||||||
StorageAzureBlob::Configuration configuration_,
|
StorageAzureBlob::Configuration configuration_,
|
||||||
|
bool allow_azure_native_copy,
|
||||||
const ReadSettings & read_settings_,
|
const ReadSettings & read_settings_,
|
||||||
const WriteSettings & write_settings_,
|
const WriteSettings & write_settings_,
|
||||||
const ContextPtr & context_,
|
const ContextPtr & context_,
|
||||||
bool attempt_to_create_container)
|
bool attempt_to_create_container)
|
||||||
: BackupWriterDefault(read_settings_, write_settings_, getLogger("BackupWriterAzureBlobStorage"))
|
: BackupWriterDefault(read_settings_, write_settings_, getLogger("BackupWriterAzureBlobStorage"))
|
||||||
, data_source_description{DataSourceType::ObjectStorage, ObjectStorageType::Azure, MetadataStorageType::None, configuration_.container, false, false}
|
, data_source_description{DataSourceType::ObjectStorage, ObjectStorageType::Azure, MetadataStorageType::None, configuration_.getConnectionURL().toString(), false, false}
|
||||||
, configuration(configuration_)
|
, configuration(configuration_)
|
||||||
{
|
{
|
||||||
auto client_ptr = StorageAzureBlob::createClient(configuration, /* is_read_only */ false, attempt_to_create_container);
|
auto client_ptr = StorageAzureBlob::createClient(configuration, /* is_read_only */ false, attempt_to_create_container);
|
||||||
@ -130,9 +137,12 @@ BackupWriterAzureBlobStorage::BackupWriterAzureBlobStorage(
|
|||||||
object_storage = std::make_unique<AzureObjectStorage>("BackupWriterAzureBlobStorage",
|
object_storage = std::make_unique<AzureObjectStorage>("BackupWriterAzureBlobStorage",
|
||||||
std::move(client_ptr),
|
std::move(client_ptr),
|
||||||
StorageAzureBlob::createSettings(context_),
|
StorageAzureBlob::createSettings(context_),
|
||||||
configuration_.container);
|
configuration_.container,
|
||||||
|
configuration_.getConnectionURL().toString());
|
||||||
client = object_storage->getAzureBlobStorageClient();
|
client = object_storage->getAzureBlobStorageClient();
|
||||||
settings = object_storage->getSettings();
|
auto settings_copy = *object_storage->getSettings();
|
||||||
|
settings_copy.use_native_copy = allow_azure_native_copy;
|
||||||
|
settings = std::make_unique<const AzureObjectStorageSettings>(settings_copy);
|
||||||
}
|
}
|
||||||
|
|
||||||
void BackupWriterAzureBlobStorage::copyFileFromDisk(const String & path_in_backup, DiskPtr src_disk, const String & src_path,
|
void BackupWriterAzureBlobStorage::copyFileFromDisk(const String & path_in_backup, DiskPtr src_disk, const String & src_path,
|
||||||
@ -140,7 +150,9 @@ void BackupWriterAzureBlobStorage::copyFileFromDisk(const String & path_in_backu
|
|||||||
{
|
{
|
||||||
/// Use the native copy as a more optimal way to copy a file from AzureBlobStorage to AzureBlobStorage if it's possible.
|
/// Use the native copy as a more optimal way to copy a file from AzureBlobStorage to AzureBlobStorage if it's possible.
|
||||||
auto source_data_source_description = src_disk->getDataSourceDescription();
|
auto source_data_source_description = src_disk->getDataSourceDescription();
|
||||||
if (source_data_source_description.sameKind(data_source_description) && (source_data_source_description.is_encrypted == copy_encrypted))
|
LOG_TRACE(log, "Source description {}, desctionation description {}", source_data_source_description.description, data_source_description.description);
|
||||||
|
if (source_data_source_description.sameKind(data_source_description)
|
||||||
|
&& source_data_source_description.is_encrypted == copy_encrypted)
|
||||||
{
|
{
|
||||||
/// getBlobPath() can return more than 3 elements if the file is stored as multiple objects in AzureBlobStorage container.
|
/// getBlobPath() can return more than 3 elements if the file is stored as multiple objects in AzureBlobStorage container.
|
||||||
/// In this case we can't use the native copy.
|
/// In this case we can't use the native copy.
|
||||||
|
@ -16,7 +16,12 @@ namespace DB
|
|||||||
class BackupReaderAzureBlobStorage : public BackupReaderDefault
|
class BackupReaderAzureBlobStorage : public BackupReaderDefault
|
||||||
{
|
{
|
||||||
public:
|
public:
|
||||||
BackupReaderAzureBlobStorage(StorageAzureBlob::Configuration configuration_, const ReadSettings & read_settings_, const WriteSettings & write_settings_, const ContextPtr & context_);
|
BackupReaderAzureBlobStorage(
|
||||||
|
StorageAzureBlob::Configuration configuration_,
|
||||||
|
bool allow_azure_native_copy,
|
||||||
|
const ReadSettings & read_settings_,
|
||||||
|
const WriteSettings & write_settings_,
|
||||||
|
const ContextPtr & context_);
|
||||||
~BackupReaderAzureBlobStorage() override;
|
~BackupReaderAzureBlobStorage() override;
|
||||||
|
|
||||||
bool fileExists(const String & file_name) override;
|
bool fileExists(const String & file_name) override;
|
||||||
@ -37,7 +42,13 @@ private:
|
|||||||
class BackupWriterAzureBlobStorage : public BackupWriterDefault
|
class BackupWriterAzureBlobStorage : public BackupWriterDefault
|
||||||
{
|
{
|
||||||
public:
|
public:
|
||||||
BackupWriterAzureBlobStorage(StorageAzureBlob::Configuration configuration_, const ReadSettings & read_settings_, const WriteSettings & write_settings_, const ContextPtr & context_, bool attempt_to_create_container);
|
BackupWriterAzureBlobStorage(
|
||||||
|
StorageAzureBlob::Configuration configuration_,
|
||||||
|
bool allow_azure_native_copy,
|
||||||
|
const ReadSettings & read_settings_,
|
||||||
|
const WriteSettings & write_settings_,
|
||||||
|
const ContextPtr & context_,
|
||||||
|
bool attempt_to_create_container);
|
||||||
~BackupWriterAzureBlobStorage() override;
|
~BackupWriterAzureBlobStorage() override;
|
||||||
|
|
||||||
bool fileExists(const String & file_name) override;
|
bool fileExists(const String & file_name) override;
|
||||||
|
@ -4,7 +4,7 @@
|
|||||||
#include <Backups/BackupIO.h>
|
#include <Backups/BackupIO.h>
|
||||||
#include <Backups/IBackupEntry.h>
|
#include <Backups/IBackupEntry.h>
|
||||||
#include <Common/ProfileEvents.h>
|
#include <Common/ProfileEvents.h>
|
||||||
#include <Common/StringUtils/StringUtils.h>
|
#include <Common/StringUtils.h>
|
||||||
#include <base/hex.h>
|
#include <base/hex.h>
|
||||||
#include <Common/logger_useful.h>
|
#include <Common/logger_useful.h>
|
||||||
#include <Common/quoteString.h>
|
#include <Common/quoteString.h>
|
||||||
|
@ -27,6 +27,7 @@ namespace ErrorCodes
|
|||||||
M(Bool, decrypt_files_from_encrypted_disks) \
|
M(Bool, decrypt_files_from_encrypted_disks) \
|
||||||
M(Bool, deduplicate_files) \
|
M(Bool, deduplicate_files) \
|
||||||
M(Bool, allow_s3_native_copy) \
|
M(Bool, allow_s3_native_copy) \
|
||||||
|
M(Bool, allow_azure_native_copy) \
|
||||||
M(Bool, use_same_s3_credentials_for_base_backup) \
|
M(Bool, use_same_s3_credentials_for_base_backup) \
|
||||||
M(Bool, azure_attempt_to_create_container) \
|
M(Bool, azure_attempt_to_create_container) \
|
||||||
M(Bool, read_from_filesystem_cache) \
|
M(Bool, read_from_filesystem_cache) \
|
||||||
|
@ -44,6 +44,9 @@ struct BackupSettings
|
|||||||
/// Whether native copy is allowed (optimization for cloud storages, that sometimes could have bugs)
|
/// Whether native copy is allowed (optimization for cloud storages, that sometimes could have bugs)
|
||||||
bool allow_s3_native_copy = true;
|
bool allow_s3_native_copy = true;
|
||||||
|
|
||||||
|
/// Whether native copy is allowed (optimization for cloud storages, that sometimes could have bugs)
|
||||||
|
bool allow_azure_native_copy = true;
|
||||||
|
|
||||||
/// Whether base backup to S3 should inherit credentials from the BACKUP query.
|
/// Whether base backup to S3 should inherit credentials from the BACKUP query.
|
||||||
bool use_same_s3_credentials_for_base_backup = false;
|
bool use_same_s3_credentials_for_base_backup = false;
|
||||||
|
|
||||||
|
@ -598,6 +598,7 @@ void BackupsWorker::doBackup(
|
|||||||
backup_create_params.backup_uuid = backup_settings.backup_uuid;
|
backup_create_params.backup_uuid = backup_settings.backup_uuid;
|
||||||
backup_create_params.deduplicate_files = backup_settings.deduplicate_files;
|
backup_create_params.deduplicate_files = backup_settings.deduplicate_files;
|
||||||
backup_create_params.allow_s3_native_copy = backup_settings.allow_s3_native_copy;
|
backup_create_params.allow_s3_native_copy = backup_settings.allow_s3_native_copy;
|
||||||
|
backup_create_params.allow_azure_native_copy = backup_settings.allow_azure_native_copy;
|
||||||
backup_create_params.use_same_s3_credentials_for_base_backup = backup_settings.use_same_s3_credentials_for_base_backup;
|
backup_create_params.use_same_s3_credentials_for_base_backup = backup_settings.use_same_s3_credentials_for_base_backup;
|
||||||
backup_create_params.azure_attempt_to_create_container = backup_settings.azure_attempt_to_create_container;
|
backup_create_params.azure_attempt_to_create_container = backup_settings.azure_attempt_to_create_container;
|
||||||
backup_create_params.read_settings = getReadSettingsForBackup(context, backup_settings);
|
backup_create_params.read_settings = getReadSettingsForBackup(context, backup_settings);
|
||||||
|
@ -135,7 +135,9 @@ void registerBackupEngineAzureBlobStorage(BackupFactory & factory)
|
|||||||
|
|
||||||
if (params.open_mode == IBackup::OpenMode::READ)
|
if (params.open_mode == IBackup::OpenMode::READ)
|
||||||
{
|
{
|
||||||
auto reader = std::make_shared<BackupReaderAzureBlobStorage>(configuration,
|
auto reader = std::make_shared<BackupReaderAzureBlobStorage>(
|
||||||
|
configuration,
|
||||||
|
params.allow_azure_native_copy,
|
||||||
params.read_settings,
|
params.read_settings,
|
||||||
params.write_settings,
|
params.write_settings,
|
||||||
params.context);
|
params.context);
|
||||||
@ -150,7 +152,9 @@ void registerBackupEngineAzureBlobStorage(BackupFactory & factory)
|
|||||||
}
|
}
|
||||||
else
|
else
|
||||||
{
|
{
|
||||||
auto writer = std::make_shared<BackupWriterAzureBlobStorage>(configuration,
|
auto writer = std::make_shared<BackupWriterAzureBlobStorage>(
|
||||||
|
configuration,
|
||||||
|
params.allow_azure_native_copy,
|
||||||
params.read_settings,
|
params.read_settings,
|
||||||
params.write_settings,
|
params.write_settings,
|
||||||
params.context,
|
params.context,
|
||||||
|
@ -6,7 +6,7 @@
|
|||||||
|
|
||||||
#include <Common/ErrorHandlers.h>
|
#include <Common/ErrorHandlers.h>
|
||||||
#include <Common/SensitiveDataMasker.h>
|
#include <Common/SensitiveDataMasker.h>
|
||||||
#include <Common/StringUtils/StringUtils.h>
|
#include <Common/StringUtils.h>
|
||||||
#include <Common/logger_useful.h>
|
#include <Common/logger_useful.h>
|
||||||
#include <Formats/registerFormats.h>
|
#include <Formats/registerFormats.h>
|
||||||
#include <IO/ReadHelpers.h>
|
#include <IO/ReadHelpers.h>
|
||||||
|
@ -307,7 +307,6 @@ endif()
|
|||||||
|
|
||||||
target_link_libraries (clickhouse_common_io
|
target_link_libraries (clickhouse_common_io
|
||||||
PRIVATE
|
PRIVATE
|
||||||
string_utils
|
|
||||||
widechar_width
|
widechar_width
|
||||||
${LINK_LIBRARIES_ONLY_ON_X86_64}
|
${LINK_LIBRARIES_ONLY_ON_X86_64}
|
||||||
PUBLIC
|
PUBLIC
|
||||||
@ -320,7 +319,6 @@ target_link_libraries (clickhouse_common_io
|
|||||||
|
|
||||||
target_link_libraries (clickhouse_compression
|
target_link_libraries (clickhouse_compression
|
||||||
PUBLIC
|
PUBLIC
|
||||||
string_utils
|
|
||||||
pcg_random
|
pcg_random
|
||||||
clickhouse_parsers
|
clickhouse_parsers
|
||||||
PRIVATE
|
PRIVATE
|
||||||
@ -410,7 +408,6 @@ dbms_target_link_libraries (
|
|||||||
clickhouse_parsers
|
clickhouse_parsers
|
||||||
ch_contrib::lz4
|
ch_contrib::lz4
|
||||||
Poco::JSON
|
Poco::JSON
|
||||||
string_utils
|
|
||||||
PUBLIC
|
PUBLIC
|
||||||
boost::system
|
boost::system
|
||||||
clickhouse_common_io
|
clickhouse_common_io
|
||||||
@ -645,7 +642,6 @@ if (ENABLE_TESTS)
|
|||||||
dbms
|
dbms
|
||||||
clickhouse_common_config
|
clickhouse_common_config
|
||||||
clickhouse_common_zookeeper
|
clickhouse_common_zookeeper
|
||||||
string_utils
|
|
||||||
hilite_comparator)
|
hilite_comparator)
|
||||||
|
|
||||||
if (TARGET ch_contrib::simdjson)
|
if (TARGET ch_contrib::simdjson)
|
||||||
|
@ -18,7 +18,7 @@
|
|||||||
#include <Common/typeid_cast.h>
|
#include <Common/typeid_cast.h>
|
||||||
#include <Common/TerminalSize.h>
|
#include <Common/TerminalSize.h>
|
||||||
#include <Common/clearPasswordFromCommandLine.h>
|
#include <Common/clearPasswordFromCommandLine.h>
|
||||||
#include <Common/StringUtils/StringUtils.h>
|
#include <Common/StringUtils.h>
|
||||||
#include <Common/filesystemHelpers.h>
|
#include <Common/filesystemHelpers.h>
|
||||||
#include <Common/NetException.h>
|
#include <Common/NetException.h>
|
||||||
#include <Columns/ColumnString.h>
|
#include <Columns/ColumnString.h>
|
||||||
@ -710,8 +710,8 @@ void ClientBase::adjustSettings()
|
|||||||
settings.input_format_values_allow_data_after_semicolon.changed = false;
|
settings.input_format_values_allow_data_after_semicolon.changed = false;
|
||||||
}
|
}
|
||||||
|
|
||||||
/// Do not limit pretty format output in case of --pager specified.
|
/// Do not limit pretty format output in case of --pager specified or in case of stdout is not a tty.
|
||||||
if (!pager.empty())
|
if (!pager.empty() || !stdout_is_a_tty)
|
||||||
{
|
{
|
||||||
if (!global_context->getSettingsRef().output_format_pretty_max_rows.changed)
|
if (!global_context->getSettingsRef().output_format_pretty_max_rows.changed)
|
||||||
{
|
{
|
||||||
|
@ -20,7 +20,7 @@
|
|||||||
#include <Common/NetException.h>
|
#include <Common/NetException.h>
|
||||||
#include <Common/CurrentMetrics.h>
|
#include <Common/CurrentMetrics.h>
|
||||||
#include <Common/DNSResolver.h>
|
#include <Common/DNSResolver.h>
|
||||||
#include <Common/StringUtils/StringUtils.h>
|
#include <Common/StringUtils.h>
|
||||||
#include <Common/OpenSSLHelpers.h>
|
#include <Common/OpenSSLHelpers.h>
|
||||||
#include <Common/randomSeed.h>
|
#include <Common/randomSeed.h>
|
||||||
#include <Common/logger_useful.h>
|
#include <Common/logger_useful.h>
|
||||||
|
@ -1,5 +1,3 @@
|
|||||||
add_subdirectory(StringUtils)
|
|
||||||
|
|
||||||
if (ENABLE_BENCHMARKS)
|
if (ENABLE_BENCHMARKS)
|
||||||
add_subdirectory(benchmarks)
|
add_subdirectory(benchmarks)
|
||||||
endif()
|
endif()
|
||||||
|
@ -13,8 +13,6 @@ target_link_libraries(clickhouse_common_config
|
|||||||
clickhouse_common_zookeeper
|
clickhouse_common_zookeeper
|
||||||
common
|
common
|
||||||
Poco::XML
|
Poco::XML
|
||||||
PRIVATE
|
|
||||||
string_utils
|
|
||||||
)
|
)
|
||||||
|
|
||||||
add_library(clickhouse_common_config_no_zookeeper_log ${SRCS})
|
add_library(clickhouse_common_config_no_zookeeper_log ${SRCS})
|
||||||
@ -23,8 +21,6 @@ target_link_libraries(clickhouse_common_config_no_zookeeper_log
|
|||||||
clickhouse_common_zookeeper_no_log
|
clickhouse_common_zookeeper_no_log
|
||||||
common
|
common
|
||||||
Poco::XML
|
Poco::XML
|
||||||
PRIVATE
|
|
||||||
string_utils
|
|
||||||
)
|
)
|
||||||
|
|
||||||
if (TARGET ch_contrib::yaml_cpp)
|
if (TARGET ch_contrib::yaml_cpp)
|
||||||
|
@ -18,7 +18,7 @@
|
|||||||
#include <Poco/NumberParser.h>
|
#include <Poco/NumberParser.h>
|
||||||
#include <Common/ZooKeeper/ZooKeeperNodeCache.h>
|
#include <Common/ZooKeeper/ZooKeeperNodeCache.h>
|
||||||
#include <Common/ZooKeeper/KeeperException.h>
|
#include <Common/ZooKeeper/KeeperException.h>
|
||||||
#include <Common/StringUtils/StringUtils.h>
|
#include <Common/StringUtils.h>
|
||||||
#include <Common/Exception.h>
|
#include <Common/Exception.h>
|
||||||
#include <Common/XMLUtils.h>
|
#include <Common/XMLUtils.h>
|
||||||
#include <Common/logger_useful.h>
|
#include <Common/logger_useful.h>
|
||||||
|
@ -289,7 +289,9 @@
|
|||||||
\
|
\
|
||||||
M(AddressesActive, "Total count of addresses which are used for creation connections with connection pools") \
|
M(AddressesActive, "Total count of addresses which are used for creation connections with connection pools") \
|
||||||
M(AddressesBanned, "Total count of addresses which are banned as faulty for creation connections with connection pools") \
|
M(AddressesBanned, "Total count of addresses which are banned as faulty for creation connections with connection pools") \
|
||||||
|
\
|
||||||
|
M(FilteringMarksWithPrimaryKey, "Number of threads currently doing filtering of mark ranges by the primary key") \
|
||||||
|
M(FilteringMarksWithSecondaryKeys, "Number of threads currently doing filtering of mark ranges by secondary keys") \
|
||||||
|
|
||||||
#ifdef APPLY_FOR_EXTERNAL_METRICS
|
#ifdef APPLY_FOR_EXTERNAL_METRICS
|
||||||
#define APPLY_FOR_METRICS(M) APPLY_FOR_BUILTIN_METRICS(M) APPLY_FOR_EXTERNAL_METRICS(M)
|
#define APPLY_FOR_METRICS(M) APPLY_FOR_BUILTIN_METRICS(M) APPLY_FOR_EXTERNAL_METRICS(M)
|
||||||
|
@ -12,7 +12,7 @@
|
|||||||
|
|
||||||
#include <Common/Arena.h>
|
#include <Common/Arena.h>
|
||||||
#include <Common/HashTable/HashMap.h>
|
#include <Common/HashTable/HashMap.h>
|
||||||
#include <Common/StringUtils/StringUtils.h>
|
#include <Common/StringUtils.h>
|
||||||
#include <IO/ReadBufferFromFile.h>
|
#include <IO/ReadBufferFromFile.h>
|
||||||
#include <IO/ReadBufferFromString.h>
|
#include <IO/ReadBufferFromString.h>
|
||||||
#include <IO/ReadHelpers.h>
|
#include <IO/ReadHelpers.h>
|
||||||
|
@ -1,5 +1,5 @@
|
|||||||
#include <Common/HTTPHeaderFilter.h>
|
#include <Common/HTTPHeaderFilter.h>
|
||||||
#include <Common/StringUtils/StringUtils.h>
|
#include <Common/StringUtils.h>
|
||||||
#include <Common/Exception.h>
|
#include <Common/Exception.h>
|
||||||
#include <Common/re2.h>
|
#include <Common/re2.h>
|
||||||
|
|
||||||
|
@ -360,6 +360,7 @@ The server successfully detected this situation and will download merged part fr
|
|||||||
M(QueryProfilerSignalOverruns, "Number of times we drop processing of a query profiler signal due to overrun plus the number of signals that OS has not delivered due to overrun.") \
|
M(QueryProfilerSignalOverruns, "Number of times we drop processing of a query profiler signal due to overrun plus the number of signals that OS has not delivered due to overrun.") \
|
||||||
M(QueryProfilerConcurrencyOverruns, "Number of times we drop processing of a query profiler signal due to too many concurrent query profilers in other threads, which may indicate overload.") \
|
M(QueryProfilerConcurrencyOverruns, "Number of times we drop processing of a query profiler signal due to too many concurrent query profilers in other threads, which may indicate overload.") \
|
||||||
M(QueryProfilerRuns, "Number of times QueryProfiler had been run.") \
|
M(QueryProfilerRuns, "Number of times QueryProfiler had been run.") \
|
||||||
|
M(QueryProfilerErrors, "Invalid memory accesses during asynchronous stack unwinding.") \
|
||||||
\
|
\
|
||||||
M(CreatedLogEntryForMerge, "Successfully created log entry to merge parts in ReplicatedMergeTree.") \
|
M(CreatedLogEntryForMerge, "Successfully created log entry to merge parts in ReplicatedMergeTree.") \
|
||||||
M(NotCreatedLogEntryForMerge, "Log entry to merge parts in ReplicatedMergeTree is not created due to concurrent log update by another replica.") \
|
M(NotCreatedLogEntryForMerge, "Log entry to merge parts in ReplicatedMergeTree is not created due to concurrent log update by another replica.") \
|
||||||
|
@ -4,7 +4,7 @@
|
|||||||
#include <Common/Exception.h>
|
#include <Common/Exception.h>
|
||||||
#include <Common/ProxyListConfigurationResolver.h>
|
#include <Common/ProxyListConfigurationResolver.h>
|
||||||
#include <Common/RemoteProxyConfigurationResolver.h>
|
#include <Common/RemoteProxyConfigurationResolver.h>
|
||||||
#include <Common/StringUtils/StringUtils.h>
|
#include <Common/StringUtils.h>
|
||||||
#include <Common/logger_useful.h>
|
#include <Common/logger_useful.h>
|
||||||
|
|
||||||
namespace DB
|
namespace DB
|
||||||
|
@ -1,6 +1,6 @@
|
|||||||
#include <Common/ProxyListConfigurationResolver.h>
|
#include <Common/ProxyListConfigurationResolver.h>
|
||||||
|
|
||||||
#include <Common/StringUtils/StringUtils.h>
|
#include <Common/StringUtils.h>
|
||||||
#include <Common/logger_useful.h>
|
#include <Common/logger_useful.h>
|
||||||
#include <Poco/URI.h>
|
#include <Poco/URI.h>
|
||||||
|
|
||||||
|
@ -12,7 +12,6 @@
|
|||||||
#include <Common/logger_useful.h>
|
#include <Common/logger_useful.h>
|
||||||
#include <Common/thread_local_rng.h>
|
#include <Common/thread_local_rng.h>
|
||||||
|
|
||||||
#include <random>
|
|
||||||
|
|
||||||
namespace CurrentMetrics
|
namespace CurrentMetrics
|
||||||
{
|
{
|
||||||
@ -25,6 +24,7 @@ namespace ProfileEvents
|
|||||||
extern const Event QueryProfilerSignalOverruns;
|
extern const Event QueryProfilerSignalOverruns;
|
||||||
extern const Event QueryProfilerConcurrencyOverruns;
|
extern const Event QueryProfilerConcurrencyOverruns;
|
||||||
extern const Event QueryProfilerRuns;
|
extern const Event QueryProfilerRuns;
|
||||||
|
extern const Event QueryProfilerErrors;
|
||||||
}
|
}
|
||||||
|
|
||||||
namespace DB
|
namespace DB
|
||||||
@ -84,11 +84,29 @@ namespace
|
|||||||
#endif
|
#endif
|
||||||
|
|
||||||
const auto signal_context = *reinterpret_cast<ucontext_t *>(context);
|
const auto signal_context = *reinterpret_cast<ucontext_t *>(context);
|
||||||
const StackTrace stack_trace(signal_context);
|
std::optional<StackTrace> stack_trace;
|
||||||
|
|
||||||
|
#if defined(SANITIZER)
|
||||||
|
constexpr bool sanitizer = true;
|
||||||
|
#else
|
||||||
|
constexpr bool sanitizer = false;
|
||||||
|
#endif
|
||||||
|
|
||||||
|
asynchronous_stack_unwinding = true;
|
||||||
|
if (sanitizer || 0 == sigsetjmp(asynchronous_stack_unwinding_signal_jump_buffer, 1))
|
||||||
|
{
|
||||||
|
stack_trace.emplace(signal_context);
|
||||||
|
}
|
||||||
|
else
|
||||||
|
{
|
||||||
|
ProfileEvents::incrementNoTrace(ProfileEvents::QueryProfilerErrors);
|
||||||
|
}
|
||||||
|
asynchronous_stack_unwinding = false;
|
||||||
|
|
||||||
|
if (stack_trace)
|
||||||
|
TraceSender::send(trace_type, *stack_trace, {});
|
||||||
|
|
||||||
TraceSender::send(trace_type, stack_trace, {});
|
|
||||||
ProfileEvents::incrementNoTrace(ProfileEvents::QueryProfilerRuns);
|
ProfileEvents::incrementNoTrace(ProfileEvents::QueryProfilerRuns);
|
||||||
|
|
||||||
errno = saved_errno;
|
errno = saved_errno;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -1,7 +1,7 @@
|
|||||||
#include <Poco/URI.h>
|
#include <Poco/URI.h>
|
||||||
#include <Poco/Util/AbstractConfiguration.h>
|
#include <Poco/Util/AbstractConfiguration.h>
|
||||||
#include <Common/RemoteHostFilter.h>
|
#include <Common/RemoteHostFilter.h>
|
||||||
#include <Common/StringUtils/StringUtils.h>
|
#include <Common/StringUtils.h>
|
||||||
#include <Common/Exception.h>
|
#include <Common/Exception.h>
|
||||||
#include <Common/re2.h>
|
#include <Common/re2.h>
|
||||||
#include <IO/WriteHelpers.h>
|
#include <IO/WriteHelpers.h>
|
||||||
|
@ -5,7 +5,7 @@
|
|||||||
#include <Common/Scheduler/ISchedulerQueue.h>
|
#include <Common/Scheduler/ISchedulerQueue.h>
|
||||||
|
|
||||||
#include <Common/Exception.h>
|
#include <Common/Exception.h>
|
||||||
#include <Common/StringUtils/StringUtils.h>
|
#include <Common/StringUtils.h>
|
||||||
|
|
||||||
#include <map>
|
#include <map>
|
||||||
#include <tuple>
|
#include <tuple>
|
||||||
|
@ -10,7 +10,7 @@
|
|||||||
#include <Common/re2.h>
|
#include <Common/re2.h>
|
||||||
|
|
||||||
#include <Common/Exception.h>
|
#include <Common/Exception.h>
|
||||||
#include <Common/StringUtils/StringUtils.h>
|
#include <Common/StringUtils.h>
|
||||||
#include <Common/ProfileEvents.h>
|
#include <Common/ProfileEvents.h>
|
||||||
|
|
||||||
#ifndef NDEBUG
|
#ifndef NDEBUG
|
||||||
|
@ -560,3 +560,7 @@ void StackTrace::dropCache()
|
|||||||
std::lock_guard lock{stacktrace_cache_mutex};
|
std::lock_guard lock{stacktrace_cache_mutex};
|
||||||
cacheInstance().clear();
|
cacheInstance().clear();
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
|
thread_local bool asynchronous_stack_unwinding = false;
|
||||||
|
thread_local sigjmp_buf asynchronous_stack_unwinding_signal_jump_buffer;
|
||||||
|
@ -8,6 +8,7 @@
|
|||||||
#include <optional>
|
#include <optional>
|
||||||
#include <functional>
|
#include <functional>
|
||||||
#include <csignal>
|
#include <csignal>
|
||||||
|
#include <csetjmp>
|
||||||
|
|
||||||
#ifdef OS_DARWIN
|
#ifdef OS_DARWIN
|
||||||
// ucontext is not available without _XOPEN_SOURCE
|
// ucontext is not available without _XOPEN_SOURCE
|
||||||
@ -87,3 +88,8 @@ protected:
|
|||||||
};
|
};
|
||||||
|
|
||||||
std::string signalToErrorMessage(int sig, const siginfo_t & info, const ucontext_t & context);
|
std::string signalToErrorMessage(int sig, const siginfo_t & info, const ucontext_t & context);
|
||||||
|
|
||||||
|
/// Special handling for errors during asynchronous stack unwinding,
|
||||||
|
/// Which is used in Query Profiler
|
||||||
|
extern thread_local bool asynchronous_stack_unwinding;
|
||||||
|
extern thread_local sigjmp_buf asynchronous_stack_unwinding_signal_jump_buffer;
|
||||||
|
@ -2,7 +2,7 @@
|
|||||||
|
|
||||||
#include <base/getPageSize.h>
|
#include <base/getPageSize.h>
|
||||||
#include <Common/Exception.h>
|
#include <Common/Exception.h>
|
||||||
#include <Common/StringUtils/StringUtils.h>
|
#include <Common/StringUtils.h>
|
||||||
#include <Common/UTF8Helpers.h>
|
#include <Common/UTF8Helpers.h>
|
||||||
#include <Core/Defines.h>
|
#include <Core/Defines.h>
|
||||||
#include <Poco/Unicode.h>
|
#include <Poco/Unicode.h>
|
||||||
|
87
src/Common/StringUtils.cpp
Normal file
87
src/Common/StringUtils.cpp
Normal file
@ -0,0 +1,87 @@
|
|||||||
|
#include <Common/StringUtils.h>
|
||||||
|
|
||||||
|
#include <Common/TargetSpecific.h>
|
||||||
|
|
||||||
|
#if USE_MULTITARGET_CODE
|
||||||
|
#include <immintrin.h>
|
||||||
|
#endif
|
||||||
|
|
||||||
|
|
||||||
|
namespace impl
{

/// Checks whether `s` begins with the `prefix_size` bytes pointed to by `prefix`.
/// The comparison is byte-wise; a string shorter than the prefix never matches.
bool startsWith(const std::string & s, const char * prefix, size_t prefix_size)
{
    if (s.size() < prefix_size)
        return false;

    return memcmp(s.data(), prefix, prefix_size) == 0;
}

/// Checks whether `s` ends with the `suffix_size` bytes pointed to by `suffix`.
/// The comparison is byte-wise; a string shorter than the suffix never matches.
bool endsWith(const std::string & s, const char * suffix, size_t suffix_size)
{
    if (s.size() < suffix_size)
        return false;

    /// Start of the last `suffix_size` bytes of the string.
    const char * tail = s.data() + (s.size() - suffix_size);
    return memcmp(tail, suffix, suffix_size) == 0;
}

}
|
||||||
|
|
||||||
|
DECLARE_DEFAULT_CODE(
|
||||||
|
bool isAllASCII(const UInt8 * data, size_t size)
|
||||||
|
{
|
||||||
|
UInt8 mask = 0;
|
||||||
|
for (size_t i = 0; i < size; ++i)
|
||||||
|
mask |= data[i];
|
||||||
|
|
||||||
|
return !(mask & 0x80);
|
||||||
|
})
|
||||||
|
|
||||||
|
DECLARE_SSE42_SPECIFIC_CODE(
|
||||||
|
/// Copy from https://github.com/lemire/fastvalidate-utf-8/blob/master/include/simdasciicheck.h
|
||||||
|
bool isAllASCII(const UInt8 * data, size_t size)
|
||||||
|
{
|
||||||
|
__m128i masks = _mm_setzero_si128();
|
||||||
|
|
||||||
|
size_t i = 0;
|
||||||
|
for (; i + 16 <= size; i += 16)
|
||||||
|
{
|
||||||
|
__m128i bytes = _mm_loadu_si128(reinterpret_cast<const __m128i *>(data + i));
|
||||||
|
masks = _mm_or_si128(masks, bytes);
|
||||||
|
}
|
||||||
|
int mask = _mm_movemask_epi8(masks);
|
||||||
|
|
||||||
|
UInt8 tail_mask = 0;
|
||||||
|
for (; i < size; i++)
|
||||||
|
tail_mask |= data[i];
|
||||||
|
|
||||||
|
mask |= (tail_mask & 0x80);
|
||||||
|
return !mask;
|
||||||
|
})
|
||||||
|
|
||||||
|
DECLARE_AVX2_SPECIFIC_CODE(
|
||||||
|
bool isAllASCII(const UInt8 * data, size_t size)
|
||||||
|
{
|
||||||
|
__m256i masks = _mm256_setzero_si256();
|
||||||
|
|
||||||
|
size_t i = 0;
|
||||||
|
for (; i + 32 <= size; i += 32)
|
||||||
|
{
|
||||||
|
__m256i bytes = _mm256_loadu_si256(reinterpret_cast<const __m256i *>(data + i));
|
||||||
|
masks = _mm256_or_si256(masks, bytes);
|
||||||
|
}
|
||||||
|
int mask = _mm256_movemask_epi8(masks);
|
||||||
|
|
||||||
|
UInt8 tail_mask = 0;
|
||||||
|
for (; i < size; i++)
|
||||||
|
tail_mask |= data[i];
|
||||||
|
|
||||||
|
mask |= (tail_mask & 0x80);
|
||||||
|
return !mask;
|
||||||
|
})
|
||||||
|
|
||||||
|
bool isAllASCII(const UInt8 * data, size_t size)
|
||||||
|
{
|
||||||
|
#if USE_MULTITARGET_CODE
|
||||||
|
if (isArchSupported(DB::TargetArch::AVX2))
|
||||||
|
return TargetSpecific::AVX2::isAllASCII(data, size);
|
||||||
|
if (isArchSupported(DB::TargetArch::SSE42))
|
||||||
|
return TargetSpecific::SSE42::isAllASCII(data, size);
|
||||||
|
#endif
|
||||||
|
return TargetSpecific::Default::isAllASCII(data, size);
|
||||||
|
}
|
@ -7,8 +7,10 @@
|
|||||||
#include <cstdint>
|
#include <cstdint>
|
||||||
#include <type_traits>
|
#include <type_traits>
|
||||||
|
|
||||||
|
#include <base/types.h>
|
||||||
|
|
||||||
namespace detail
|
|
||||||
|
namespace impl
|
||||||
{
|
{
|
||||||
bool startsWith(const std::string & s, const char * prefix, size_t prefix_size);
|
bool startsWith(const std::string & s, const char * prefix, size_t prefix_size);
|
||||||
bool endsWith(const std::string & s, const char * suffix, size_t suffix_size);
|
bool endsWith(const std::string & s, const char * suffix, size_t suffix_size);
|
||||||
@ -17,12 +19,12 @@ namespace detail
|
|||||||
|
|
||||||
inline bool startsWith(const std::string & s, const std::string & prefix)
|
inline bool startsWith(const std::string & s, const std::string & prefix)
|
||||||
{
|
{
|
||||||
return detail::startsWith(s, prefix.data(), prefix.size());
|
return impl::startsWith(s, prefix.data(), prefix.size());
|
||||||
}
|
}
|
||||||
|
|
||||||
inline bool endsWith(const std::string & s, const std::string & suffix)
|
inline bool endsWith(const std::string & s, const std::string & suffix)
|
||||||
{
|
{
|
||||||
return detail::endsWith(s, suffix.data(), suffix.size());
|
return impl::endsWith(s, suffix.data(), suffix.size());
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
@ -30,12 +32,12 @@ inline bool endsWith(const std::string & s, const std::string & suffix)
|
|||||||
/// string that is known at compile time.
|
/// string that is known at compile time.
|
||||||
inline bool startsWith(const std::string & s, const char * prefix)
|
inline bool startsWith(const std::string & s, const char * prefix)
|
||||||
{
|
{
|
||||||
return detail::startsWith(s, prefix, strlen(prefix));
|
return impl::startsWith(s, prefix, strlen(prefix));
|
||||||
}
|
}
|
||||||
|
|
||||||
inline bool endsWith(const std::string & s, const char * suffix)
|
inline bool endsWith(const std::string & s, const char * suffix)
|
||||||
{
|
{
|
||||||
return detail::endsWith(s, suffix, strlen(suffix));
|
return impl::endsWith(s, suffix, strlen(suffix));
|
||||||
}
|
}
|
||||||
|
|
||||||
/// Given an integer, return the adequate suffix for
|
/// Given an integer, return the adequate suffix for
|
||||||
@ -315,6 +317,9 @@ inline void trim(std::string & str, char c = ' ')
|
|||||||
trimLeft(str, c);
|
trimLeft(str, c);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/// If all characters in the string are ASCII, return true
|
||||||
|
bool isAllASCII(const UInt8 * data, size_t size);
|
||||||
|
|
||||||
constexpr bool containsGlobs(const std::string & str)
|
constexpr bool containsGlobs(const std::string & str)
|
||||||
{
|
{
|
||||||
return str.find_first_of("*?{") != std::string::npos;
|
return str.find_first_of("*?{") != std::string::npos;
|
@ -1,8 +0,0 @@
|
|||||||
# These files are located in separate library, because they are used by separate products
|
|
||||||
# in places when no dependency on whole "dbms" library is possible.
|
|
||||||
|
|
||||||
include("${ClickHouse_SOURCE_DIR}/cmake/dbms_glob_sources.cmake")
|
|
||||||
|
|
||||||
add_headers_and_sources(clickhouse_common_stringutils .)
|
|
||||||
|
|
||||||
add_library(string_utils ${clickhouse_common_stringutils_headers} ${clickhouse_common_stringutils_sources})
|
|
@ -1,17 +0,0 @@
|
|||||||
#include "StringUtils.h"
|
|
||||||
|
|
||||||
|
|
||||||
namespace detail
|
|
||||||
{
|
|
||||||
|
|
||||||
bool startsWith(const std::string & s, const char * prefix, size_t prefix_size)
|
|
||||||
{
|
|
||||||
return s.size() >= prefix_size && 0 == memcmp(s.data(), prefix, prefix_size);
|
|
||||||
}
|
|
||||||
|
|
||||||
bool endsWith(const std::string & s, const char * suffix, size_t suffix_size)
|
|
||||||
{
|
|
||||||
return s.size() >= suffix_size && 0 == memcmp(s.data() + s.size() - suffix_size, suffix, suffix_size);
|
|
||||||
}
|
|
||||||
|
|
||||||
}
|
|
@ -1,5 +1,5 @@
|
|||||||
#include <Common/TLDListsHolder.h>
|
#include <Common/TLDListsHolder.h>
|
||||||
#include <Common/StringUtils/StringUtils.h>
|
#include <Common/StringUtils.h>
|
||||||
#include <Common/logger_useful.h>
|
#include <Common/logger_useful.h>
|
||||||
#include <IO/ReadBufferFromFile.h>
|
#include <IO/ReadBufferFromFile.h>
|
||||||
#include <IO/ReadHelpers.h>
|
#include <IO/ReadHelpers.h>
|
||||||
|
@ -1,14 +1,9 @@
|
|||||||
#include <Common/StringUtils/StringUtils.h>
|
|
||||||
#include <Common/TargetSpecific.h>
|
|
||||||
#include <Common/UTF8Helpers.h>
|
#include <Common/UTF8Helpers.h>
|
||||||
|
#include <Common/StringUtils.h>
|
||||||
|
|
||||||
#include <widechar_width.h>
|
#include <widechar_width.h>
|
||||||
#include <bit>
|
#include <bit>
|
||||||
|
|
||||||
#if USE_MULTITARGET_CODE
|
|
||||||
#include <immintrin.h>
|
|
||||||
#endif
|
|
||||||
|
|
||||||
namespace DB
|
namespace DB
|
||||||
{
|
{
|
||||||
namespace UTF8
|
namespace UTF8
|
||||||
@ -208,7 +203,6 @@ size_t computeWidthImpl(const UInt8 * data, size_t size, size_t prefix, size_t l
|
|||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
size_t computeWidth(const UInt8 * data, size_t size, size_t prefix) noexcept
|
size_t computeWidth(const UInt8 * data, size_t size, size_t prefix) noexcept
|
||||||
{
|
{
|
||||||
return computeWidthImpl<Width>(data, size, prefix, 0);
|
return computeWidthImpl<Width>(data, size, prefix, 0);
|
||||||
@ -219,71 +213,5 @@ size_t computeBytesBeforeWidth(const UInt8 * data, size_t size, size_t prefix, s
|
|||||||
return computeWidthImpl<BytesBeforeLimit>(data, size, prefix, limit);
|
return computeWidthImpl<BytesBeforeLimit>(data, size, prefix, limit);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
DECLARE_DEFAULT_CODE(
|
|
||||||
bool isAllASCII(const UInt8 * data, size_t size)
|
|
||||||
{
|
|
||||||
UInt8 mask = 0;
|
|
||||||
for (size_t i = 0; i < size; ++i)
|
|
||||||
mask |= data[i];
|
|
||||||
|
|
||||||
return !(mask & 0x80);
|
|
||||||
})
|
|
||||||
|
|
||||||
DECLARE_SSE42_SPECIFIC_CODE(
|
|
||||||
/// Copy from https://github.com/lemire/fastvalidate-utf-8/blob/master/include/simdasciicheck.h
|
|
||||||
bool isAllASCII(const UInt8 * data, size_t size)
|
|
||||||
{
|
|
||||||
__m128i masks = _mm_setzero_si128();
|
|
||||||
|
|
||||||
size_t i = 0;
|
|
||||||
for (; i + 16 <= size; i += 16)
|
|
||||||
{
|
|
||||||
__m128i bytes = _mm_loadu_si128(reinterpret_cast<const __m128i *>(data + i));
|
|
||||||
masks = _mm_or_si128(masks, bytes);
|
|
||||||
}
|
|
||||||
int mask = _mm_movemask_epi8(masks);
|
|
||||||
|
|
||||||
UInt8 tail_mask = 0;
|
|
||||||
for (; i < size; i++)
|
|
||||||
tail_mask |= data[i];
|
|
||||||
|
|
||||||
mask |= (tail_mask & 0x80);
|
|
||||||
return !mask;
|
|
||||||
})
|
|
||||||
|
|
||||||
DECLARE_AVX2_SPECIFIC_CODE(
|
|
||||||
bool isAllASCII(const UInt8 * data, size_t size)
|
|
||||||
{
|
|
||||||
__m256i masks = _mm256_setzero_si256();
|
|
||||||
|
|
||||||
size_t i = 0;
|
|
||||||
for (; i + 32 <= size; i += 32)
|
|
||||||
{
|
|
||||||
__m256i bytes = _mm256_loadu_si256(reinterpret_cast<const __m256i *>(data + i));
|
|
||||||
masks = _mm256_or_si256(masks, bytes);
|
|
||||||
}
|
|
||||||
int mask = _mm256_movemask_epi8(masks);
|
|
||||||
|
|
||||||
UInt8 tail_mask = 0;
|
|
||||||
for (; i < size; i++)
|
|
||||||
tail_mask |= data[i];
|
|
||||||
|
|
||||||
mask |= (tail_mask & 0x80);
|
|
||||||
return !mask;
|
|
||||||
})
|
|
||||||
|
|
||||||
bool isAllASCII(const UInt8* data, size_t size)
|
|
||||||
{
|
|
||||||
#if USE_MULTITARGET_CODE
|
|
||||||
if (isArchSupported(TargetArch::AVX2))
|
|
||||||
return TargetSpecific::AVX2::isAllASCII(data, size);
|
|
||||||
if (isArchSupported(TargetArch::SSE42))
|
|
||||||
return TargetSpecific::SSE42::isAllASCII(data, size);
|
|
||||||
#endif
|
|
||||||
return TargetSpecific::Default::isAllASCII(data, size);
|
|
||||||
}
|
|
||||||
|
|
||||||
|
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
@ -136,10 +136,6 @@ size_t computeWidth(const UInt8 * data, size_t size, size_t prefix = 0) noexcept
|
|||||||
*/
|
*/
|
||||||
size_t computeBytesBeforeWidth(const UInt8 * data, size_t size, size_t prefix, size_t limit) noexcept;
|
size_t computeBytesBeforeWidth(const UInt8 * data, size_t size, size_t prefix, size_t limit) noexcept;
|
||||||
|
|
||||||
|
|
||||||
/// If all the characters in the string are ASCII, return true.
|
|
||||||
bool isAllASCII(const UInt8* data, size_t size);
|
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
}
|
}
|
||||||
|
@ -7,7 +7,7 @@
|
|||||||
#include <base/types.h>
|
#include <base/types.h>
|
||||||
#include <Poco/Unicode.h>
|
#include <Poco/Unicode.h>
|
||||||
#include <Common/StringSearcher.h>
|
#include <Common/StringSearcher.h>
|
||||||
#include <Common/StringUtils/StringUtils.h>
|
#include <Common/StringUtils.h>
|
||||||
#include <Common/UTF8Helpers.h>
|
#include <Common/UTF8Helpers.h>
|
||||||
#include <base/unaligned.h>
|
#include <base/unaligned.h>
|
||||||
|
|
||||||
|
@ -12,8 +12,6 @@ target_link_libraries (clickhouse_common_zookeeper
|
|||||||
clickhouse_common_io
|
clickhouse_common_io
|
||||||
clickhouse_compression
|
clickhouse_compression
|
||||||
common
|
common
|
||||||
PRIVATE
|
|
||||||
string_utils
|
|
||||||
)
|
)
|
||||||
|
|
||||||
# for examples -- no logging (to avoid extra dependencies)
|
# for examples -- no logging (to avoid extra dependencies)
|
||||||
@ -23,8 +21,6 @@ target_link_libraries (clickhouse_common_zookeeper_no_log
|
|||||||
clickhouse_common_io
|
clickhouse_common_io
|
||||||
clickhouse_compression
|
clickhouse_compression
|
||||||
common
|
common
|
||||||
PRIVATE
|
|
||||||
string_utils
|
|
||||||
)
|
)
|
||||||
if (ENABLE_EXAMPLES)
|
if (ENABLE_EXAMPLES)
|
||||||
add_subdirectory(examples)
|
add_subdirectory(examples)
|
||||||
|
@ -1,7 +1,7 @@
|
|||||||
#include "Common/ZooKeeper/IKeeper.h"
|
#include "Common/ZooKeeper/IKeeper.h"
|
||||||
#include <Common/ZooKeeper/TestKeeper.h>
|
#include <Common/ZooKeeper/TestKeeper.h>
|
||||||
#include <Common/setThreadName.h>
|
#include <Common/setThreadName.h>
|
||||||
#include <Common/StringUtils/StringUtils.h>
|
#include <Common/StringUtils.h>
|
||||||
#include <base/types.h>
|
#include <base/types.h>
|
||||||
#include <functional>
|
#include <functional>
|
||||||
|
|
||||||
|
@ -19,7 +19,7 @@
|
|||||||
#include <Core/ServerUUID.h>
|
#include <Core/ServerUUID.h>
|
||||||
#include "Common/ZooKeeper/IKeeper.h"
|
#include "Common/ZooKeeper/IKeeper.h"
|
||||||
#include <Common/DNSResolver.h>
|
#include <Common/DNSResolver.h>
|
||||||
#include <Common/StringUtils/StringUtils.h>
|
#include <Common/StringUtils.h>
|
||||||
#include <Common/Exception.h>
|
#include <Common/Exception.h>
|
||||||
|
|
||||||
#include <Poco/Net/NetException.h>
|
#include <Poco/Net/NetException.h>
|
||||||
|
@ -4,7 +4,7 @@
|
|||||||
#include <base/getFQDNOrHostName.h>
|
#include <base/getFQDNOrHostName.h>
|
||||||
#include <Poco/Util/AbstractConfiguration.h>
|
#include <Poco/Util/AbstractConfiguration.h>
|
||||||
#include <Common/isLocalAddress.h>
|
#include <Common/isLocalAddress.h>
|
||||||
#include <Common/StringUtils/StringUtils.h>
|
#include <Common/StringUtils.h>
|
||||||
#include <Poco/String.h>
|
#include <Poco/String.h>
|
||||||
|
|
||||||
namespace DB
|
namespace DB
|
||||||
|
@ -7,7 +7,6 @@ clickhouse_add_executable(zkutil_test_commands_new_lib zkutil_test_commands_new_
|
|||||||
target_link_libraries(zkutil_test_commands_new_lib PRIVATE
|
target_link_libraries(zkutil_test_commands_new_lib PRIVATE
|
||||||
clickhouse_common_zookeeper_no_log
|
clickhouse_common_zookeeper_no_log
|
||||||
clickhouse_compression
|
clickhouse_compression
|
||||||
string_utils
|
|
||||||
dbms)
|
dbms)
|
||||||
|
|
||||||
clickhouse_add_executable(zkutil_test_async zkutil_test_async.cpp)
|
clickhouse_add_executable(zkutil_test_async zkutil_test_async.cpp)
|
||||||
|
@ -1,7 +1,7 @@
|
|||||||
#include <Poco/ConsoleChannel.h>
|
#include <Poco/ConsoleChannel.h>
|
||||||
#include <Poco/Logger.h>
|
#include <Poco/Logger.h>
|
||||||
#include <Poco/Event.h>
|
#include <Poco/Event.h>
|
||||||
#include <Common/StringUtils/StringUtils.h>
|
#include <Common/StringUtils.h>
|
||||||
#include <Common/ZooKeeper/ZooKeeperImpl.h>
|
#include <Common/ZooKeeper/ZooKeeperImpl.h>
|
||||||
#include <Common/typeid_cast.h>
|
#include <Common/typeid_cast.h>
|
||||||
#include <iostream>
|
#include <iostream>
|
||||||
|
@ -1,5 +1,5 @@
|
|||||||
#include <base/hex.h>
|
#include <base/hex.h>
|
||||||
#include <Common/StringUtils/StringUtils.h>
|
#include <Common/StringUtils.h>
|
||||||
#include <Common/escapeForFileName.h>
|
#include <Common/escapeForFileName.h>
|
||||||
|
|
||||||
namespace DB
|
namespace DB
|
||||||
|
@ -87,3 +87,6 @@ if (ENABLE_SSL)
|
|||||||
clickhouse_add_executable (encrypt_decrypt encrypt_decrypt.cpp)
|
clickhouse_add_executable (encrypt_decrypt encrypt_decrypt.cpp)
|
||||||
target_link_libraries (encrypt_decrypt PRIVATE dbms)
|
target_link_libraries (encrypt_decrypt PRIVATE dbms)
|
||||||
endif()
|
endif()
|
||||||
|
|
||||||
|
clickhouse_add_executable (check_pointer_valid check_pointer_valid.cpp)
|
||||||
|
target_link_libraries (check_pointer_valid PRIVATE clickhouse_common_io)
|
||||||
|
53
src/Common/examples/check_pointer_valid.cpp
Normal file
53
src/Common/examples/check_pointer_valid.cpp
Normal file
@ -0,0 +1,53 @@
|
|||||||
|
#include <csetjmp>
|
||||||
|
#include <csignal>
|
||||||
|
#include <cstring>
|
||||||
|
#include <iostream>
|
||||||
|
|
||||||
|
|
||||||
|
/// This example demonstrates how is it possible to check if a pointer to memory is readable using a signal handler.
|
||||||
|
|
||||||
|
/// Set by isPointerValid while it probes memory, so that the SIGSEGV handler knows the fault is expected.
thread_local bool checking_pointer = false;

/// Jump target shared between isPointerValid and the SIGSEGV handler.
/// It is filled by sigsetjmp and consumed by siglongjmp, which operate on sigjmp_buf;
/// plain jmp_buf is only specified for setjmp/longjmp and may be a different (smaller) type.
thread_local sigjmp_buf signal_jump_buffer;
|
||||||
|
|
||||||
|
|
||||||
|
void signalHandler(int sig, siginfo_t *, void *)
|
||||||
|
{
|
||||||
|
if (checking_pointer && sig == SIGSEGV)
|
||||||
|
siglongjmp(signal_jump_buffer, 1);
|
||||||
|
}
|
||||||
|
|
||||||
|
bool isPointerValid(const void * ptr)
|
||||||
|
{
|
||||||
|
checking_pointer = true;
|
||||||
|
if (0 == sigsetjmp(signal_jump_buffer, 1))
|
||||||
|
{
|
||||||
|
char res;
|
||||||
|
memcpy(&res, ptr, 1);
|
||||||
|
__asm__ __volatile__("" :: "r"(res) : "memory");
|
||||||
|
checking_pointer = false;
|
||||||
|
return true;
|
||||||
|
}
|
||||||
|
else
|
||||||
|
{
|
||||||
|
checking_pointer = false;
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
int main(int, char **)
|
||||||
|
{
|
||||||
|
struct sigaction sa;
|
||||||
|
memset(&sa, 0, sizeof(sa));
|
||||||
|
sa.sa_sigaction = signalHandler;
|
||||||
|
sa.sa_flags = SA_SIGINFO;
|
||||||
|
|
||||||
|
if (sigemptyset(&sa.sa_mask)
|
||||||
|
|| sigaddset(&sa.sa_mask, SIGSEGV)
|
||||||
|
|| sigaction(SIGSEGV, &sa, nullptr))
|
||||||
|
return 1;
|
||||||
|
|
||||||
|
std::cerr << isPointerValid(reinterpret_cast<const void *>(0x123456789)) << "\n";
|
||||||
|
std::cerr << isPointerValid(&sa) << "\n";
|
||||||
|
|
||||||
|
return 0;
|
||||||
|
}
|
@ -3,7 +3,7 @@
|
|||||||
#include <base/types.h>
|
#include <base/types.h>
|
||||||
#include <Common/Exception.h>
|
#include <Common/Exception.h>
|
||||||
#include <Common/PODArray.h>
|
#include <Common/PODArray.h>
|
||||||
#include <Common/StringUtils/StringUtils.h>
|
#include <Common/StringUtils.h>
|
||||||
|
|
||||||
namespace DB
|
namespace DB
|
||||||
{
|
{
|
||||||
|
@ -1,6 +1,6 @@
|
|||||||
#include <Common/formatIPv6.h>
|
#include <Common/formatIPv6.h>
|
||||||
#include <base/hex.h>
|
#include <base/hex.h>
|
||||||
#include <Common/StringUtils/StringUtils.h>
|
#include <Common/StringUtils.h>
|
||||||
|
|
||||||
#include <base/range.h>
|
#include <base/range.h>
|
||||||
#include <array>
|
#include <array>
|
||||||
|
@ -7,7 +7,7 @@
|
|||||||
#include <base/hex.h>
|
#include <base/hex.h>
|
||||||
#include <base/types.h>
|
#include <base/types.h>
|
||||||
#include <base/unaligned.h>
|
#include <base/unaligned.h>
|
||||||
#include <Common/StringUtils/StringUtils.h>
|
#include <Common/StringUtils.h>
|
||||||
|
|
||||||
constexpr size_t IPV4_BINARY_LENGTH = 4;
|
constexpr size_t IPV4_BINARY_LENGTH = 4;
|
||||||
constexpr size_t IPV6_BINARY_LENGTH = 16;
|
constexpr size_t IPV6_BINARY_LENGTH = 16;
|
||||||
|
@ -3,7 +3,7 @@
|
|||||||
|
|
||||||
#if defined(OS_LINUX)
|
#if defined(OS_LINUX)
|
||||||
|
|
||||||
#include <Common/StringUtils/StringUtils.h>
|
#include <Common/StringUtils.h>
|
||||||
#include <base/hex.h>
|
#include <base/hex.h>
|
||||||
#include <IO/ReadBufferFromFile.h>
|
#include <IO/ReadBufferFromFile.h>
|
||||||
#include <IO/ReadHelpers.h>
|
#include <IO/ReadHelpers.h>
|
||||||
|
@ -1,7 +1,7 @@
|
|||||||
#include <Common/getMultipleKeysFromConfig.h>
|
#include <Common/getMultipleKeysFromConfig.h>
|
||||||
|
|
||||||
#include <Poco/Util/AbstractConfiguration.h>
|
#include <Poco/Util/AbstractConfiguration.h>
|
||||||
#include <Common/StringUtils/StringUtils.h>
|
#include <Common/StringUtils.h>
|
||||||
|
|
||||||
namespace DB
|
namespace DB
|
||||||
{
|
{
|
||||||
|
@ -8,7 +8,7 @@
|
|||||||
#include <Poco/Path.h>
|
#include <Poco/Path.h>
|
||||||
#include <Common/getCurrentProcessFDCount.h>
|
#include <Common/getCurrentProcessFDCount.h>
|
||||||
#include <Common/getMaxFileDescriptorCount.h>
|
#include <Common/getMaxFileDescriptorCount.h>
|
||||||
#include <Common/StringUtils/StringUtils.h>
|
#include <Common/StringUtils.h>
|
||||||
#include <Common/config_version.h>
|
#include <Common/config_version.h>
|
||||||
#include "Coordination/KeeperFeatureFlags.h"
|
#include "Coordination/KeeperFeatureFlags.h"
|
||||||
#include <Coordination/Keeper4LWInfo.h>
|
#include <Coordination/Keeper4LWInfo.h>
|
||||||
|
@ -11,7 +11,7 @@
|
|||||||
#include <Common/ZooKeeper/ZooKeeperCommon.h>
|
#include <Common/ZooKeeper/ZooKeeperCommon.h>
|
||||||
#include <Common/SipHash.h>
|
#include <Common/SipHash.h>
|
||||||
#include <Common/ZooKeeper/ZooKeeperConstants.h>
|
#include <Common/ZooKeeper/ZooKeeperConstants.h>
|
||||||
#include <Common/StringUtils/StringUtils.h>
|
#include <Common/StringUtils.h>
|
||||||
#include <Common/ZooKeeper/IKeeper.h>
|
#include <Common/ZooKeeper/IKeeper.h>
|
||||||
#include <base/hex.h>
|
#include <base/hex.h>
|
||||||
#include <base/scope_guard.h>
|
#include <base/scope_guard.h>
|
||||||
|
@ -5,6 +5,7 @@
|
|||||||
#include <Common/ThreadPool.h>
|
#include <Common/ThreadPool.h>
|
||||||
#include <Common/callOnce.h>
|
#include <Common/callOnce.h>
|
||||||
#include <Disks/IO/IOUringReader.h>
|
#include <Disks/IO/IOUringReader.h>
|
||||||
|
#include <Disks/IO/getIOUringReader.h>
|
||||||
|
|
||||||
#include <Core/ServerSettings.h>
|
#include <Core/ServerSettings.h>
|
||||||
|
|
||||||
@ -303,10 +304,10 @@ IAsynchronousReader & Context::getThreadPoolReader(FilesystemReaderType type) co
|
|||||||
}
|
}
|
||||||
|
|
||||||
#if USE_LIBURING
|
#if USE_LIBURING
|
||||||
IOUringReader & Context::getIOURingReader() const
|
IOUringReader & Context::getIOUringReader() const
|
||||||
{
|
{
|
||||||
callOnce(shared->io_uring_reader_initialized, [&] {
|
callOnce(shared->io_uring_reader_initialized, [&] {
|
||||||
shared->io_uring_reader = std::make_unique<IOUringReader>(512);
|
shared->io_uring_reader = createIOUringReader();
|
||||||
});
|
});
|
||||||
|
|
||||||
return *shared->io_uring_reader;
|
return *shared->io_uring_reader;
|
||||||
|
@ -137,7 +137,7 @@ public:
|
|||||||
|
|
||||||
IAsynchronousReader & getThreadPoolReader(FilesystemReaderType type) const;
|
IAsynchronousReader & getThreadPoolReader(FilesystemReaderType type) const;
|
||||||
#if USE_LIBURING
|
#if USE_LIBURING
|
||||||
IOUringReader & getIOURingReader() const;
|
IOUringReader & getIOUringReader() const;
|
||||||
#endif
|
#endif
|
||||||
std::shared_ptr<AsyncReadCounters> getAsyncReadCounters() const;
|
std::shared_ptr<AsyncReadCounters> getAsyncReadCounters() const;
|
||||||
ThreadPool & getThreadPoolWriter() const;
|
ThreadPool & getThreadPoolWriter() const;
|
||||||
|
@ -92,7 +92,7 @@ void applySettingsQuirks(Settings & settings, LoggerPtr log)
|
|||||||
|
|
||||||
void doSettingsSanityCheckClamp(Settings & current_settings, LoggerPtr log)
|
void doSettingsSanityCheckClamp(Settings & current_settings, LoggerPtr log)
|
||||||
{
|
{
|
||||||
auto getCurrentValue = [&current_settings](const std::string_view name) -> Field
|
auto get_current_value = [&current_settings](const std::string_view name) -> Field
|
||||||
{
|
{
|
||||||
Field current_value;
|
Field current_value;
|
||||||
bool has_current_value = current_settings.tryGet(name, current_value);
|
bool has_current_value = current_settings.tryGet(name, current_value);
|
||||||
@ -100,7 +100,7 @@ void doSettingsSanityCheckClamp(Settings & current_settings, LoggerPtr log)
|
|||||||
return current_value;
|
return current_value;
|
||||||
};
|
};
|
||||||
|
|
||||||
UInt64 max_threads = getCurrentValue("max_threads").get<UInt64>();
|
UInt64 max_threads = get_current_value("max_threads").get<UInt64>();
|
||||||
UInt64 max_threads_max_value = 256 * getNumberOfPhysicalCPUCores();
|
UInt64 max_threads_max_value = 256 * getNumberOfPhysicalCPUCores();
|
||||||
if (max_threads > max_threads_max_value)
|
if (max_threads > max_threads_max_value)
|
||||||
{
|
{
|
||||||
@ -109,7 +109,7 @@ void doSettingsSanityCheckClamp(Settings & current_settings, LoggerPtr log)
|
|||||||
current_settings.set("max_threads", max_threads_max_value);
|
current_settings.set("max_threads", max_threads_max_value);
|
||||||
}
|
}
|
||||||
|
|
||||||
constexpr UInt64 max_sane_block_rows_size = 4294967296; // 2^32
|
static constexpr UInt64 max_sane_block_rows_size = 4294967296; // 2^32
|
||||||
std::unordered_set<String> block_rows_settings{
|
std::unordered_set<String> block_rows_settings{
|
||||||
"max_block_size",
|
"max_block_size",
|
||||||
"max_insert_block_size",
|
"max_insert_block_size",
|
||||||
@ -120,13 +120,21 @@ void doSettingsSanityCheckClamp(Settings & current_settings, LoggerPtr log)
|
|||||||
"input_format_parquet_max_block_size"};
|
"input_format_parquet_max_block_size"};
|
||||||
for (auto const & setting : block_rows_settings)
|
for (auto const & setting : block_rows_settings)
|
||||||
{
|
{
|
||||||
auto block_size = getCurrentValue(setting).get<UInt64>();
|
if (auto block_size = get_current_value(setting).get<UInt64>();
|
||||||
if (block_size > max_sane_block_rows_size)
|
block_size > max_sane_block_rows_size)
|
||||||
{
|
{
|
||||||
if (log)
|
if (log)
|
||||||
LOG_WARNING(log, "Sanity check: '{}' value is too high ({}). Reduced to {}", setting, block_size, max_sane_block_rows_size);
|
LOG_WARNING(log, "Sanity check: '{}' value is too high ({}). Reduced to {}", setting, block_size, max_sane_block_rows_size);
|
||||||
current_settings.set(setting, max_sane_block_rows_size);
|
current_settings.set(setting, max_sane_block_rows_size);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
if (auto max_block_size = get_current_value("max_block_size").get<UInt64>(); max_block_size == 0)
|
||||||
|
{
|
||||||
|
if (log)
|
||||||
|
LOG_WARNING(log, "Sanity check: 'max_block_size' cannot be 0. Set to default value {}", DEFAULT_BLOCK_SIZE);
|
||||||
|
current_settings.set("max_block_size", DEFAULT_BLOCK_SIZE);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
}
|
||||||
|
@ -144,6 +144,9 @@ static std::atomic_flag fatal_error_printed;
|
|||||||
*/
|
*/
|
||||||
static void signalHandler(int sig, siginfo_t * info, void * context)
|
static void signalHandler(int sig, siginfo_t * info, void * context)
|
||||||
{
|
{
|
||||||
|
if (asynchronous_stack_unwinding && sig == SIGSEGV)
|
||||||
|
siglongjmp(asynchronous_stack_unwinding_signal_jump_buffer, 1);
|
||||||
|
|
||||||
DENY_ALLOCATIONS_IN_SCOPE;
|
DENY_ALLOCATIONS_IN_SCOPE;
|
||||||
auto saved_errno = errno; /// We must restore previous value of errno in signal handler.
|
auto saved_errno = errno; /// We must restore previous value of errno in signal handler.
|
||||||
|
|
||||||
@ -185,6 +188,7 @@ static void signalHandler(int sig, siginfo_t * info, void * context)
|
|||||||
errno = saved_errno;
|
errno = saved_errno;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
static bool getenvBool(const char * name)
|
static bool getenvBool(const char * name)
|
||||||
{
|
{
|
||||||
bool res = false;
|
bool res = false;
|
||||||
|
@ -7,7 +7,7 @@
|
|||||||
#include <Parsers/ASTLiteral.h>
|
#include <Parsers/ASTLiteral.h>
|
||||||
#include <Common/typeid_cast.h>
|
#include <Common/typeid_cast.h>
|
||||||
#include <Poco/String.h>
|
#include <Poco/String.h>
|
||||||
#include <Common/StringUtils/StringUtils.h>
|
#include <Common/StringUtils.h>
|
||||||
#include <IO/WriteHelpers.h>
|
#include <IO/WriteHelpers.h>
|
||||||
#include <Core/Defines.h>
|
#include <Core/Defines.h>
|
||||||
#include <Common/CurrentThread.h>
|
#include <Common/CurrentThread.h>
|
||||||
|
@ -1,5 +1,5 @@
|
|||||||
#include <base/map.h>
|
#include <base/map.h>
|
||||||
#include <Common/StringUtils/StringUtils.h>
|
#include <Common/StringUtils.h>
|
||||||
#include <Columns/ColumnMap.h>
|
#include <Columns/ColumnMap.h>
|
||||||
#include <Core/Field.h>
|
#include <Core/Field.h>
|
||||||
#include <DataTypes/DataTypeMap.h>
|
#include <DataTypes/DataTypeMap.h>
|
||||||
|
@ -1,6 +1,6 @@
|
|||||||
#include <base/map.h>
|
#include <base/map.h>
|
||||||
#include <base/range.h>
|
#include <base/range.h>
|
||||||
#include <Common/StringUtils/StringUtils.h>
|
#include <Common/StringUtils.h>
|
||||||
#include <Columns/ColumnTuple.h>
|
#include <Columns/ColumnTuple.h>
|
||||||
#include <Columns/ColumnConst.h>
|
#include <Columns/ColumnConst.h>
|
||||||
#include <Core/Field.h>
|
#include <Core/Field.h>
|
||||||
|
@ -3,7 +3,7 @@
|
|||||||
|
|
||||||
#include <Common/typeid_cast.h>
|
#include <Common/typeid_cast.h>
|
||||||
#include <Common/assert_cast.h>
|
#include <Common/assert_cast.h>
|
||||||
#include <Common/StringUtils/StringUtils.h>
|
#include <Common/StringUtils.h>
|
||||||
#include "Columns/IColumn.h"
|
#include "Columns/IColumn.h"
|
||||||
|
|
||||||
#include <DataTypes/DataTypeArray.h>
|
#include <DataTypes/DataTypeArray.h>
|
||||||
|
@ -2,7 +2,7 @@
|
|||||||
#include <DataTypes/Serializations/SerializationNullable.h>
|
#include <DataTypes/Serializations/SerializationNullable.h>
|
||||||
#include <DataTypes/DataTypeMap.h>
|
#include <DataTypes/DataTypeMap.h>
|
||||||
|
|
||||||
#include <Common/StringUtils/StringUtils.h>
|
#include <Common/StringUtils.h>
|
||||||
#include <Columns/ColumnMap.h>
|
#include <Columns/ColumnMap.h>
|
||||||
#include <Core/Field.h>
|
#include <Core/Field.h>
|
||||||
#include <Formats/FormatSettings.h>
|
#include <Formats/FormatSettings.h>
|
||||||
|
@ -26,6 +26,8 @@
|
|||||||
#include <Common/escapeForFileName.h>
|
#include <Common/escapeForFileName.h>
|
||||||
#include <Common/filesystemHelpers.h>
|
#include <Common/filesystemHelpers.h>
|
||||||
#include <Common/logger_useful.h>
|
#include <Common/logger_useful.h>
|
||||||
|
#include <Common/setThreadName.h>
|
||||||
|
|
||||||
|
|
||||||
namespace fs = std::filesystem;
|
namespace fs = std::filesystem;
|
||||||
|
|
||||||
@ -665,6 +667,7 @@ void DatabaseOnDisk::iterateMetadataFiles(ContextPtr local_context, const Iterat
|
|||||||
pool.scheduleOrThrowOnError(
|
pool.scheduleOrThrowOnError(
|
||||||
[batch, &process_metadata_file, &process_tmp_drop_metadata_file]() mutable
|
[batch, &process_metadata_file, &process_tmp_drop_metadata_file]() mutable
|
||||||
{
|
{
|
||||||
|
setThreadName("DatabaseOnDisk");
|
||||||
for (const auto & file : batch)
|
for (const auto & file : batch)
|
||||||
if (file.second)
|
if (file.second)
|
||||||
process_metadata_file(file.first);
|
process_metadata_file(file.first);
|
||||||
|
@ -76,6 +76,20 @@ static void setReplicatedEngine(ASTCreateQuery * create_query, ContextPtr contex
|
|||||||
String replica_path = server_settings.default_replica_path;
|
String replica_path = server_settings.default_replica_path;
|
||||||
String replica_name = server_settings.default_replica_name;
|
String replica_name = server_settings.default_replica_name;
|
||||||
|
|
||||||
|
/// Check that replica path doesn't exist
|
||||||
|
Macros::MacroExpansionInfo info;
|
||||||
|
StorageID table_id = StorageID(create_query->getDatabase(), create_query->getTable(), create_query->uuid);
|
||||||
|
info.table_id = table_id;
|
||||||
|
info.expand_special_macros_only = false;
|
||||||
|
|
||||||
|
String zookeeper_path = context->getMacros()->expand(replica_path, info);
|
||||||
|
if (context->getZooKeeper()->exists(zookeeper_path))
|
||||||
|
throw Exception(
|
||||||
|
ErrorCodes::LOGICAL_ERROR,
|
||||||
|
"Found existing ZooKeeper path {} while trying to convert table {} to replicated. Table will not be converted.",
|
||||||
|
zookeeper_path, backQuote(table_id.getFullTableName())
|
||||||
|
);
|
||||||
|
|
||||||
auto args = std::make_shared<ASTExpressionList>();
|
auto args = std::make_shared<ASTExpressionList>();
|
||||||
args->children.push_back(std::make_shared<ASTLiteral>(replica_path));
|
args->children.push_back(std::make_shared<ASTLiteral>(replica_path));
|
||||||
args->children.push_back(std::make_shared<ASTLiteral>(replica_name));
|
args->children.push_back(std::make_shared<ASTLiteral>(replica_name));
|
||||||
|
@ -944,6 +944,13 @@ void DatabaseReplicated::recoverLostReplica(const ZooKeeperPtr & current_zookeep
|
|||||||
query_context->setSetting("allow_hyperscan", 1);
|
query_context->setSetting("allow_hyperscan", 1);
|
||||||
query_context->setSetting("allow_simdjson", 1);
|
query_context->setSetting("allow_simdjson", 1);
|
||||||
query_context->setSetting("allow_deprecated_syntax_for_merge_tree", 1);
|
query_context->setSetting("allow_deprecated_syntax_for_merge_tree", 1);
|
||||||
|
query_context->setSetting("allow_suspicious_primary_key", 1);
|
||||||
|
query_context->setSetting("allow_suspicious_ttl_expressions", 1);
|
||||||
|
query_context->setSetting("allow_suspicious_variant_types", 1);
|
||||||
|
query_context->setSetting("enable_deflate_qpl_codec", 1);
|
||||||
|
query_context->setSetting("enable_zstd_qat_codec", 1);
|
||||||
|
query_context->setSetting("allow_create_index_without_type", 1);
|
||||||
|
query_context->setSetting("allow_experimental_s3queue", 1);
|
||||||
|
|
||||||
auto txn = std::make_shared<ZooKeeperMetadataTransaction>(current_zookeeper, zookeeper_path, false, "");
|
auto txn = std::make_shared<ZooKeeperMetadataTransaction>(current_zookeeper, zookeeper_path, false, "");
|
||||||
query_context->initZooKeeperMetadataTransaction(txn);
|
query_context->initZooKeeperMetadataTransaction(txn);
|
||||||
|
@ -39,7 +39,6 @@ target_link_libraries(clickhouse_dictionaries
|
|||||||
Poco::Data
|
Poco::Data
|
||||||
Poco::MongoDB
|
Poco::MongoDB
|
||||||
Poco::Redis
|
Poco::Redis
|
||||||
string_utils
|
|
||||||
)
|
)
|
||||||
|
|
||||||
target_link_libraries(clickhouse_dictionaries PUBLIC ch_contrib::abseil_swiss_tables)
|
target_link_libraries(clickhouse_dictionaries PUBLIC ch_contrib::abseil_swiss_tables)
|
||||||
|
@ -7,7 +7,7 @@
|
|||||||
#include <IO/WriteHelpers.h>
|
#include <IO/WriteHelpers.h>
|
||||||
#include <IO/Operators.h>
|
#include <IO/Operators.h>
|
||||||
|
|
||||||
#include <Common/StringUtils/StringUtils.h>
|
#include <Common/StringUtils.h>
|
||||||
|
|
||||||
#include <Formats/FormatSettings.h>
|
#include <Formats/FormatSettings.h>
|
||||||
#include <Columns/IColumn.h>
|
#include <Columns/IColumn.h>
|
||||||
|
@ -1,6 +1,6 @@
|
|||||||
#include "FileDictionarySource.h"
|
#include "FileDictionarySource.h"
|
||||||
#include <Common/logger_useful.h>
|
#include <Common/logger_useful.h>
|
||||||
#include <Common/StringUtils/StringUtils.h>
|
#include <Common/StringUtils.h>
|
||||||
#include <Common/filesystemHelpers.h>
|
#include <Common/filesystemHelpers.h>
|
||||||
#include <IO/ReadBufferFromFile.h>
|
#include <IO/ReadBufferFromFile.h>
|
||||||
#include <Interpreters/Context.h>
|
#include <Interpreters/Context.h>
|
||||||
|
@ -69,6 +69,15 @@ public:
|
|||||||
return dictionary_id.getNameForLogs();
|
return dictionary_id.getNameForLogs();
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/// Returns fully qualified unquoted dictionary name
|
||||||
|
std::string getQualifiedName() const
|
||||||
|
{
|
||||||
|
std::lock_guard lock{mutex};
|
||||||
|
if (dictionary_id.database_name.empty())
|
||||||
|
return dictionary_id.table_name;
|
||||||
|
return dictionary_id.database_name + "." + dictionary_id.table_name;
|
||||||
|
}
|
||||||
|
|
||||||
StorageID getDictionaryID() const
|
StorageID getDictionaryID() const
|
||||||
{
|
{
|
||||||
std::lock_guard lock{mutex};
|
std::lock_guard lock{mutex};
|
||||||
|
@ -32,8 +32,16 @@ bool DataSourceDescription::operator==(const DataSourceDescription & other) cons
|
|||||||
|
|
||||||
bool DataSourceDescription::sameKind(const DataSourceDescription & other) const
|
bool DataSourceDescription::sameKind(const DataSourceDescription & other) const
|
||||||
{
|
{
|
||||||
return std::tie(type, object_storage_type, description)
|
std::string_view our_description = description;
|
||||||
== std::tie(other.type, other.object_storage_type, other.description);
|
if (our_description.ends_with('/') && our_description.length() > 1)
|
||||||
|
our_description = our_description.substr(0, our_description.length() - 1);
|
||||||
|
|
||||||
|
std::string_view other_description = other.description;
|
||||||
|
if (other_description.ends_with('/') && other_description.length() > 1)
|
||||||
|
other_description = other_description.substr(0, other_description.length() - 1);
|
||||||
|
|
||||||
|
return std::tie(type, object_storage_type, our_description)
|
||||||
|
== std::tie(other.type, other.object_storage_type, other_description);
|
||||||
}
|
}
|
||||||
|
|
||||||
std::string DataSourceDescription::toString() const
|
std::string DataSourceDescription::toString() const
|
||||||
|
@ -1,5 +1,4 @@
|
|||||||
#include "IOUringReader.h"
|
#include "IOUringReader.h"
|
||||||
#include <memory>
|
|
||||||
|
|
||||||
#if USE_LIBURING
|
#if USE_LIBURING
|
||||||
|
|
||||||
@ -13,6 +12,7 @@
|
|||||||
#include <Common/ThreadPool.h>
|
#include <Common/ThreadPool.h>
|
||||||
#include <Common/logger_useful.h>
|
#include <Common/logger_useful.h>
|
||||||
#include <future>
|
#include <future>
|
||||||
|
#include <memory>
|
||||||
|
|
||||||
namespace ProfileEvents
|
namespace ProfileEvents
|
||||||
{
|
{
|
||||||
|
@ -4,9 +4,9 @@
|
|||||||
#include <IO/MMapReadBufferFromFileWithCache.h>
|
#include <IO/MMapReadBufferFromFileWithCache.h>
|
||||||
#include <IO/AsynchronousReadBufferFromFile.h>
|
#include <IO/AsynchronousReadBufferFromFile.h>
|
||||||
#include <Disks/IO/IOUringReader.h>
|
#include <Disks/IO/IOUringReader.h>
|
||||||
|
#include <Disks/IO/getIOUringReader.h>
|
||||||
#include <Disks/IO/ThreadPoolReader.h>
|
#include <Disks/IO/ThreadPoolReader.h>
|
||||||
#include <Disks/IO/getThreadPoolReader.h>
|
#include <Disks/IO/getThreadPoolReader.h>
|
||||||
#include <IO/SynchronousReader.h>
|
|
||||||
#include <IO/AsynchronousReader.h>
|
#include <IO/AsynchronousReader.h>
|
||||||
#include <Common/ProfileEvents.h>
|
#include <Common/ProfileEvents.h>
|
||||||
#include "config.h"
|
#include "config.h"
|
||||||
@ -100,14 +100,7 @@ std::unique_ptr<ReadBufferFromFileBase> createReadBufferFromFileBase(
|
|||||||
else if (settings.local_fs_method == LocalFSReadMethod::io_uring)
|
else if (settings.local_fs_method == LocalFSReadMethod::io_uring)
|
||||||
{
|
{
|
||||||
#if USE_LIBURING
|
#if USE_LIBURING
|
||||||
auto global_context = Context::getGlobalContextInstance();
|
auto & reader = getIOUringReaderOrThrow();
|
||||||
if (!global_context)
|
|
||||||
throw Exception(ErrorCodes::LOGICAL_ERROR, "Cannot obtain io_uring reader (global context not initialized)");
|
|
||||||
|
|
||||||
auto & reader = global_context->getIOURingReader();
|
|
||||||
if (!reader.isSupported())
|
|
||||||
throw Exception(ErrorCodes::UNSUPPORTED_METHOD, "io_uring is not supported by this system");
|
|
||||||
|
|
||||||
res = std::make_unique<AsynchronousReadBufferFromFileWithDescriptorsCache>(
|
res = std::make_unique<AsynchronousReadBufferFromFileWithDescriptorsCache>(
|
||||||
reader,
|
reader,
|
||||||
settings.priority,
|
settings.priority,
|
||||||
|
41
src/Disks/IO/getIOUringReader.cpp
Normal file
41
src/Disks/IO/getIOUringReader.cpp
Normal file
@ -0,0 +1,41 @@
|
|||||||
|
#include <Disks/IO/getIOUringReader.h>
|
||||||
|
|
||||||
|
#if USE_LIBURING
|
||||||
|
|
||||||
|
#include <Interpreters/Context.h>
|
||||||
|
#include <Common/ErrorCodes.h>
|
||||||
|
|
||||||
|
namespace DB
|
||||||
|
{
|
||||||
|
|
||||||
|
namespace ErrorCodes
|
||||||
|
{
|
||||||
|
extern const int LOGICAL_ERROR;
|
||||||
|
extern const int UNSUPPORTED_METHOD;
|
||||||
|
}
|
||||||
|
|
||||||
|
std::unique_ptr<IOUringReader> createIOUringReader()
|
||||||
|
{
|
||||||
|
return std::make_unique<IOUringReader>(512);
|
||||||
|
}
|
||||||
|
|
||||||
|
IOUringReader & getIOUringReaderOrThrow(ContextPtr context)
|
||||||
|
{
|
||||||
|
auto & reader = context->getIOUringReader();
|
||||||
|
if (!reader.isSupported())
|
||||||
|
{
|
||||||
|
throw Exception(ErrorCodes::UNSUPPORTED_METHOD, "io_uring is not supported by this system");
|
||||||
|
}
|
||||||
|
return reader;
|
||||||
|
}
|
||||||
|
|
||||||
|
IOUringReader & getIOUringReaderOrThrow()
|
||||||
|
{
|
||||||
|
auto context = Context::getGlobalContextInstance();
|
||||||
|
if (!context)
|
||||||
|
throw Exception(ErrorCodes::LOGICAL_ERROR, "Global context not initialized");
|
||||||
|
return getIOUringReaderOrThrow(context);
|
||||||
|
}
|
||||||
|
|
||||||
|
}
|
||||||
|
#endif
|
21
src/Disks/IO/getIOUringReader.h
Normal file
21
src/Disks/IO/getIOUringReader.h
Normal file
@ -0,0 +1,21 @@
|
|||||||
|
#pragma once
|
||||||
|
|
||||||
|
#include "config.h"
|
||||||
|
|
||||||
|
#if USE_LIBURING
|
||||||
|
|
||||||
|
#include <Interpreters/Context_fwd.h>
|
||||||
|
#include <Disks/IO/IOUringReader.h>
|
||||||
|
#include <memory>
|
||||||
|
|
||||||
|
namespace DB
|
||||||
|
{
|
||||||
|
|
||||||
|
std::unique_ptr<IOUringReader> createIOUringReader();
|
||||||
|
|
||||||
|
IOUringReader & getIOUringReaderOrThrow(ContextPtr);
|
||||||
|
|
||||||
|
IOUringReader & getIOUringReaderOrThrow();
|
||||||
|
|
||||||
|
}
|
||||||
|
#endif
|
Some files were not shown because too many files have changed in this diff Show More
Loading…
Reference in New Issue
Block a user