Convert skip_list.json into first-line comments.

Vitaly Baranov 2021-09-12 15:35:00 +03:00
parent a4153e5629
commit bbb192ee85
13 changed files with 739 additions and 320 deletions
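
This change moves the per-test information that used to live in skip_list.json (and in the fasttest TESTS_TO_SKIP list) into the test files themselves, as tag comments on their first lines. For illustration, a hypothetical .sql test would now start like this (tag name and description taken from this commit):

-- Tags: long, zookeeper, no-fasttest
-- Tag no-fasttest: requires mysql client

SELECT 1;

Shell, Python and expect tests use the same header with '#' as the comment sign. clickhouse-test reads these tags directly (see read_test_tags below) instead of the removed --use-skip-list / --skip-list-path options.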


@ -80,7 +80,7 @@ LLVM_PROFILE_FILE='client_coverage_%5m.profraw' clickhouse-client --query "RENAM
LLVM_PROFILE_FILE='client_coverage_%5m.profraw' clickhouse-client --query "RENAME TABLE datasets.visits_v1 TO test.visits"
LLVM_PROFILE_FILE='client_coverage_%5m.profraw' clickhouse-client --query "SHOW TABLES FROM test"
LLVM_PROFILE_FILE='client_coverage_%5m.profraw' clickhouse-test -j 8 --testname --shard --zookeeper --print-time --use-skip-list 2>&1 | ts '%Y-%m-%d %H:%M:%S' | tee /test_result.txt
LLVM_PROFILE_FILE='client_coverage_%5m.profraw' clickhouse-test -j 8 --testname --shard --zookeeper --print-time 2>&1 | ts '%Y-%m-%d %H:%M:%S' | tee /test_result.txt
readarray -t FAILED_TESTS < <(awk '/FAIL|TIMEOUT|ERROR/ { print substr($3, 1, length($3)-1) }' "/test_result.txt")
@ -97,7 +97,7 @@ then
echo "Going to run again: ${FAILED_TESTS[*]}"
LLVM_PROFILE_FILE='client_coverage_%5m.profraw' clickhouse-test --order=random --testname --shard --zookeeper --use-skip-list "${FAILED_TESTS[@]}" 2>&1 | ts '%Y-%m-%d %H:%M:%S' | tee -a /test_result.txt
LLVM_PROFILE_FILE='client_coverage_%5m.profraw' clickhouse-test --order=random --testname --shard --zookeeper "${FAILED_TESTS[@]}" 2>&1 | ts '%Y-%m-%d %H:%M:%S' | tee -a /test_result.txt
else
echo "No failed tests"
fi


@ -275,11 +275,10 @@ function run_tests
00834_cancel_http_readonly_queries_on_client_close
00911_tautological_compare
# Hyperscan
00926_multimatch
00929_multi_match_edit_distance
01681_hyperscan_debug_assertion
02004_max_hyperscan_regex_length
00926_multimatch # Hyperscan
00929_multi_match_edit_distance # Hyperscan
01681_hyperscan_debug_assertion # Hyperscan
02004_max_hyperscan_regex_length # Hyperscan
01176_mysql_client_interactive # requires mysql client
01031_mutations_interpreter_and_context
@ -344,70 +343,54 @@ function run_tests
sha256
xz
# Not sure why these two fail even in sequential mode. Disabled for now
# to make some progress.
00646_url_engine
00974_query_profiler
00646_url_engine # Not sure why it fails even in sequential mode. Disabled for now to make some progress.
00974_query_profiler # Not sure why it fails even in sequential mode. Disabled for now to make some progress.
# In fasttest, ENABLE_LIBRARIES=0, so rocksdb engine is not enabled by default
01504_rocksdb
01686_rocksdb
01504_rocksdb # In fasttest, ENABLE_LIBRARIES=0, so rocksdb engine is not enabled by default
01686_rocksdb # In fasttest, ENABLE_LIBRARIES=0, so rocksdb engine is not enabled by default
# Look at DistributedFilesToInsert, so cannot run in parallel.
01460_DistributedFilesToInsert
01460_DistributedFilesToInsert # Look at DistributedFilesToInsert, so cannot run in parallel.
01541_max_memory_usage_for_user_long
# Require python libraries like scipy, pandas and numpy
01322_ttest_scipy
01561_mann_whitney_scipy
01322_ttest_scipy # Require python libraries like scipy, pandas and numpy
01561_mann_whitney_scipy # Require python libraries like scipy, pandas and numpy
01545_system_errors
# Checks system.errors
01563_distributed_query_finish
01545_system_errors # Checks system.errors
01563_distributed_query_finish # Checks system.errors
# nc - command not found
01601_proxy_protocol
01622_defaults_for_url_engine
01601_proxy_protocol # nc - command not found
01622_defaults_for_url_engine # nc - command not found
# JSON functions
01666_blns
01666_blns # JSON functions
# Requires postgresql-client
01802_test_postgresql_protocol_with_row_policy
01802_test_postgresql_protocol_with_row_policy # Requires postgresql-client
# Depends on AWS
01801_s3_cluster
02012_settings_clause_for_s3
01801_s3_cluster # Depends on AWS
02012_settings_clause_for_s3 # Depends on AWS
# needs psql
01889_postgresql_protocol_null_fields
01889_postgresql_protocol_null_fields # needs psql
# needs pv
01923_network_receive_time_metric_insert
01923_network_receive_time_metric_insert # needs pv
01889_sqlite_read_write
# needs s2
01849_geoToS2
01851_s2_to_geo
01852_s2_get_neighbours
01853_s2_cells_intersect
01854_s2_cap_contains
01854_s2_cap_union
01849_geoToS2 # needs s2
01851_s2_to_geo # needs s2
01852_s2_get_neighbours # needs s2
01853_s2_cells_intersect # needs s2
01854_s2_cap_contains # needs s2
01854_s2_cap_union # needs s2
# needs s3
01944_insert_partition_by
01944_insert_partition_by # needs s3
# depends on Go
02013_zlib_read_after_eof
02013_zlib_read_after_eof # depends on Go
# Accesses CH via mysql table function (which is unavailable)
01747_system_session_log_long
01747_system_session_log_long # Accesses CH via mysql table function (which is unavailable)
)
time clickhouse-test --hung-check -j 8 --order=random --use-skip-list \
--no-long --testname --shard --zookeeper --skip "${TESTS_TO_SKIP[@]}" \
time clickhouse-test --hung-check -j 8 --order=random \
--fast-tests-only --no-long --testname --shard --zookeeper \
-- "$FASTTEST_FOCUS" 2>&1 \
| ts '%Y-%m-%d %H:%M:%S' \
| tee "$FASTTEST_OUTPUT/test_log.txt"


@ -108,7 +108,7 @@ function run_tests()
ADDITIONAL_OPTIONS+=('--replicated-database')
fi
clickhouse-test --testname --shard --zookeeper --no-stateless --hung-check --use-skip-list --print-time "${ADDITIONAL_OPTIONS[@]}" \
clickhouse-test --testname --shard --zookeeper --no-stateless --hung-check --print-time "${ADDITIONAL_OPTIONS[@]}" \
"$SKIP_TESTS_OPTION" 2>&1 | ts '%Y-%m-%d %H:%M:%S' | tee test_output/test_result.txt
}


@ -97,7 +97,7 @@ function run_tests()
fi
clickhouse-test --testname --shard --zookeeper --hung-check --print-time \
--use-skip-list --test-runs "$NUM_TRIES" "${ADDITIONAL_OPTIONS[@]}" 2>&1 \
--test-runs "$NUM_TRIES" "${ADDITIONAL_OPTIONS[@]}" 2>&1 \
| ts '%Y-%m-%d %H:%M:%S' \
| tee -a test_output/test_result.txt
}


@ -13,8 +13,4 @@ dpkg -i package_folder/clickhouse-test_*.deb
service clickhouse-server start && sleep 5
if grep -q -- "--use-skip-list" /usr/bin/clickhouse-test; then
SKIP_LIST_OPT="--use-skip-list"
fi
clickhouse-test --testname --shard --zookeeper "$SKIP_LIST_OPT" "$ADDITIONAL_OPTIONS" "$SKIP_TESTS_OPTION" 2>&1 | ts '%Y-%m-%d %H:%M:%S' | tee test_output/test_result.txt
clickhouse-test --testname --shard --zookeeper "$ADDITIONAL_OPTIONS" "$SKIP_TESTS_OPTION" 2>&1 | ts '%Y-%m-%d %H:%M:%S' | tee test_output/test_result.txt


@ -10,14 +10,6 @@ import logging
import time
def get_skip_list_cmd(path):
with open(path, 'r') as f:
for line in f:
if '--use-skip-list' in line:
return '--use-skip-list'
return ''
def get_options(i):
options = []
client_options = []
@ -56,8 +48,6 @@ def get_options(i):
def run_func_test(cmd, output_prefix, num_processes, skip_tests_option, global_time_limit):
skip_list_opt = get_skip_list_cmd(cmd)
global_time_limit_option = ''
if global_time_limit:
global_time_limit_option = "--global_time_limit={}".format(global_time_limit)
@ -66,7 +56,7 @@ def run_func_test(cmd, output_prefix, num_processes, skip_tests_option, global_t
pipes = []
for i in range(0, len(output_paths)):
f = open(output_paths[i], 'w')
full_command = "{} {} {} {} {}".format(cmd, skip_list_opt, get_options(i), global_time_limit_option, skip_tests_option)
full_command = "{} {} {} {}".format(cmd, get_options(i), global_time_limit_option, skip_tests_option)
logging.info("Run func tests '%s'", full_command)
p = Popen(full_command, shell=True, stdout=f, stderr=f)
pipes.append(p)


@ -4,6 +4,7 @@ set (CLICKHOUSE_CLIENT_SOURCES
QueryFuzzer.cpp
Suggest.cpp
TestHint.cpp
TestTags.cpp
)
set (CLICKHOUSE_CLIENT_LINK


@ -6,6 +6,7 @@
#include "QueryFuzzer.h"
#include "Suggest.h"
#include "TestHint.h"
#include "TestTags.h"
#if USE_REPLXX
# include <common/ReplxxLineReader.h>
@ -1078,12 +1079,17 @@ private:
bool echo_query = echo_queries;
/// Test tags start with "--" so they are interpreted as comments anyway.
/// But if echo is enabled, we have to remove the test tags from `all_queries_text`
/// because we don't want them to be echoed.
size_t test_tags_length = test_mode ? getTestTagsLength(all_queries_text) : 0;
/// Several queries separated by ';'.
/// INSERT data is ended by the end of line, not ';'.
/// An exception is VALUES format where we also support semicolon in
/// addition to end of line.
const char * this_query_begin = all_queries_text.data();
const char * this_query_begin = all_queries_text.data() + test_tags_length;
const char * all_queries_end = all_queries_text.data() + all_queries_text.size();
while (this_query_begin < all_queries_end)


@ -0,0 +1,50 @@
#include "TestTags.h"
namespace DB
{
size_t getTestTagsLength(const String & multiline_query)
{
const String & text = multiline_query;
size_t pos = 0;
bool first_line = true;
while (true)
{
size_t line_start = pos;
/// Skip spaces.
while ((pos != text.length()) && (text[pos] == ' ' || text[pos] == '\t'))
++pos;
/// Skip comment "--".
static constexpr const char comment[] = "--";
if (text.compare(pos, strlen(comment), comment) != 0)
return line_start;
pos += strlen(comment);
/// Skip the prefix "Tags:" if it's the first line.
if (first_line)
{
while ((pos != text.length()) && (text[pos] == ' ' || text[pos] == '\t'))
++pos;
static constexpr const char tags_prefix[] = "Tags:";
if (text.compare(pos, strlen(tags_prefix), tags_prefix) != 0)
return 0;
pos += strlen(tags_prefix);
first_line = false;
}
/// Skip end-of-line.
size_t eol_pos = text.find_first_of("\r\n", pos);
if (eol_pos == String::npos)
return text.length();
bool two_chars_eol = (eol_pos + 1 < text.length()) && ((text[eol_pos + 1] == '\r') || (text[eol_pos + 1] == '\n')) && (text[eol_pos + 1] != text[eol_pos]);
size_t eol_length = two_chars_eol ? 2 : 1;
pos = eol_pos + eol_length;
}
}
}
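
For example, when the client runs in test mode and the query text begins with the following hypothetical input:

-- Tags: long, zookeeper
-- Tag long: the test runs for several minutes

SELECT 1;

getTestTagsLength() consumes the two leading "--" lines and returns their total length (the offset of the blank line that follows), so the tag lines are excluded both from parsing and, when echo is enabled, from the echoed output.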


@ -0,0 +1,18 @@
#pragma once
#include <Core/Types.h>
namespace DB
{
/// Returns the length of a text looking like
/// -- Tags: x, y, z
/// -- Tag x: explanation of tag x
/// -- Tag y: explanation of tag y
/// -- Tag z: explanation of tag z
///
/// at the beginning of a multiline query.
/// If there are no test tags in the multiline query the function returns 0.
size_t getTestTagsLength(const String & multiline_query);
}


@ -6,12 +6,11 @@ import os
import os.path
import signal
import re
import json
import copy
import traceback
from argparse import ArgumentParser
from typing import Tuple, Union, Optional, TextIO
from typing import Tuple, Union, Optional, TextIO, Dict, Set, List
import shlex
import subprocess
from subprocess import Popen
@ -83,76 +82,6 @@ def stop_tests():
os.killpg(os.getpgid(os.getpid()), signal.SIGTERM)
signal.signal(signal.SIGTERM, signal.SIG_DFL)
def json_minify(string):
"""
Removes all js-style comments from json string. Allows to have comments in skip_list.json.
The code was taken from https://github.com/getify/JSON.minify/tree/python under the MIT license.
"""
tokenizer = re.compile(r'"|(/\*)|(\*/)|(//)|\n|\r')
end_slashes_re = re.compile(r'(\\)*$')
in_string = False
in_multi = False
in_single = False
new_str = []
index = 0
for match in re.finditer(tokenizer, string):
if not (in_multi or in_single):
tmp = string[index:match.start()]
new_str.append(tmp)
else:
# Replace comments with white space so that the JSON parser reports
# the correct column numbers on parsing errors.
new_str.append(' ' * (match.start() - index))
index = match.end()
val = match.group()
if val == '"' and not (in_multi or in_single):
escaped = end_slashes_re.search(string, 0, match.start())
# start of string or unescaped quote character to end string
if not in_string or (escaped is None or len(escaped.group()) % 2 == 0): # noqa
in_string = not in_string
index -= 1 # include " character in next catch
elif not (in_string or in_multi or in_single):
if val == '/*':
in_multi = True
elif val == '//':
in_single = True
elif val == '*/' and in_multi and not (in_string or in_single):
in_multi = False
new_str.append(' ' * len(val))
elif val in '\r\n' and not (in_multi or in_string) and in_single:
in_single = False
elif not in_multi or in_single: # noqa
new_str.append(val)
if val in '\r\n':
new_str.append(val)
elif in_multi or in_single:
new_str.append(' ' * len(val))
new_str.append(string[index:])
return ''.join(new_str)
def remove_control_characters(s):
"""
https://github.com/html5lib/html5lib-python/issues/96#issuecomment-43438438
"""
def str_to_int(s, default, base=10):
if int(s, base) < 0x10000:
return chr(int(s, base))
return default
s = re.sub(r"&#(\d+);?", lambda c: str_to_int(c.group(1), c.group(0)), s)
s = re.sub(r"&#[xX]([0-9a-fA-F]+);?", lambda c: str_to_int(c.group(1), c.group(0), base=16), s)
s = re.sub(r"[\x00-\x08\x0b\x0e-\x1f\x7f]", "", s)
return s
def get_db_engine(args, database_name):
if args.replicated_database:
@ -429,48 +358,69 @@ def print_test_time(test_time) -> str:
return ''
def should_skip_test_by_name(name: str, test_ext: str) -> Tuple[bool, str]:
if args.skip and any(s in name for s in args.skip):
return True, "skip"
if not args.zookeeper and ('zookeeper' in name or 'replica' in name):
return True, "no zookeeper"
if not args.shard and \
('shard' in name or 'distributed' in name or 'global' in name):
return True, "no shard"
# Tests for races and deadlocks usually are run in a loop for a significant
# amount of time
if args.no_long and \
('long' in name or 'deadlock' in name or 'race' in name):
return True, "no long"
if not USE_JINJA and test_ext.endswith("j2"):
return True, "no jinja"
return False, ""
def should_skip_disabled_test(name: str, suite_dir: str) -> Tuple[bool, str]:
disabled_file = os.path.join(suite_dir, name) + '.disabled'
if os.path.exists(disabled_file) and not args.disabled:
return True, open(disabled_file, 'r').read()
return False, ""
# should skip test, should increment skipped_total, skip reason
def should_skip_test(name: str, test_ext: str, suite_dir: str) -> Tuple[bool, bool, str]:
should_skip, skip_reason = should_skip_test_by_name(name, test_ext)
def should_skip_test(name: str, test_ext: str, suite_dir: str, all_tags: Dict[str, Set[str]]) -> Tuple[bool, bool, str]:
tags = all_tags.get(name + test_ext)
if should_skip:
return True, True, skip_reason
should_skip = False
increment_skip_count = False
skip_reason = ''
should_skip, skip_reason = should_skip_disabled_test(name, suite_dir)
if tags and ('disabled' in tags) and not args.disabled:
should_skip = True
increment_skip_count = False
skip_reason = 'disabled'
return should_skip, False, skip_reason
elif os.path.exists(os.path.join(suite_dir, name) + '.disabled') and not args.disabled:
should_skip = True
increment_skip_count = False
skip_reason = 'disabled'
elif args.skip and any(s in name for s in args.skip):
should_skip = True
increment_skip_count = True
skip_reason = 'skip'
elif not USE_JINJA and test_ext.endswith("j2"):
should_skip = True
increment_skip_count = True
skip_reason = 'no jinja'
elif tags and (('zookeeper' in tags) or ('replica' in tags)) and not args.zookeeper:
should_skip = True
increment_skip_count = True
skip_reason = 'no zookeeper'
elif tags and (('shard' in tags) or ('distributed' in tags) or ('global' in tags)) and not args.shard:
should_skip = True
increment_skip_count = True
skip_reason = 'no shard'
elif tags and ('no-fasttest' in tags) and args.fast_tests_only:
should_skip = True
increment_skip_count = True
skip_reason = 'running fast tests only'
elif tags and (('long' in tags) or ('deadlock' in tags) or ('race' in tags)) and args.no_long:
# Tests for races and deadlocks usually are run in a loop for a significant amount of time
should_skip = True
increment_skip_count = True
skip_reason = 'not running long tests'
elif tags and ('no-replicated-database' in tags) and args.replicated_database:
should_skip = True
increment_skip_count = True
skip_reason = 'replicated-database'
elif tags:
for build_flag in args.build_flags:
if 'no-' + build_flag in tags:
should_skip = True
increment_skip_count = True
skip_reason = build_flag
break
return should_skip, increment_skip_count, skip_reason
def send_test_name_failed(suite: str, case: str) -> bool:
@ -491,9 +441,9 @@ def send_test_name_failed(suite: str, case: str) -> bool:
restarted_tests = [] # (test, stderr)
# def run_tests_array(all_tests, suite, suite_dir, suite_tmp_dir, run_total):
# def run_tests_array(all_tests, num_tests, suite, suite_dir, suite_tmp_dir, all_tags):
def run_tests_array(all_tests_with_params):
all_tests, num_tests, suite, suite_dir, suite_tmp_dir = all_tests_with_params
all_tests, num_tests, suite, suite_dir, suite_tmp_dir, all_tags = all_tests_with_params
global stop_time
global exit_code
global server_died
@ -558,7 +508,7 @@ def run_tests_array(all_tests_with_params):
status = "{0:72}".format(removesuffix(name, ".gen", ".sql") + ": ")
skip_test, increment_skip_count, skip_reason = \
should_skip_test(name, ext, suite_dir)
should_skip_test(name, ext, suite_dir, all_tags)
if skip_test:
status += MSG_SKIPPED + f" - {skip_reason}\n"
@ -782,16 +732,15 @@ def check_server_started(client, retry_count):
class BuildFlags():
THREAD = 'thread-sanitizer'
ADDRESS = 'address-sanitizer'
UNDEFINED = 'ub-sanitizer'
MEMORY = 'memory-sanitizer'
DEBUG = 'debug-build'
UNBUNDLED = 'unbundled-build'
RELEASE = 'release-build'
DATABASE_ORDINARY = 'database-ordinary'
THREAD = 'tsan'
ADDRESS = 'asan'
UNDEFINED = 'ubsan'
MEMORY = 'msan'
DEBUG = 'debug'
UNBUNDLED = 'unbundled'
RELEASE = 'release'
ORDINARY_DATABASE = 'ordinary-database'
POLYMORPHIC_PARTS = 'polymorphic-parts'
DATABASE_REPLICATED = 'database-replicated'
def collect_build_flags(client):
@ -836,7 +785,7 @@ def collect_build_flags(client):
if clickhouse_proc.returncode == 0:
if b'Ordinary' in stdout:
result.append(BuildFlags.DATABASE_ORDINARY)
result.append(BuildFlags.ORDINARY_DATABASE)
else:
raise Exception("Cannot get information about build from server errorcode {}, stderr {}".format(clickhouse_proc.returncode, stderr))
@ -902,7 +851,7 @@ def open_client_process(
def do_run_tests(jobs, suite, suite_dir, suite_tmp_dir, all_tests, parallel_tests, sequential_tests, parallel):
def do_run_tests(jobs, suite, suite_dir, suite_tmp_dir, all_tests, all_tags, parallel_tests, sequential_tests, parallel):
if jobs > 1 and len(parallel_tests) > 0:
print("Found", len(parallel_tests), "parallel tests and", len(sequential_tests), "sequential tests")
run_n, run_total = parallel.split('/')
@ -920,7 +869,7 @@ def do_run_tests(jobs, suite, suite_dir, suite_tmp_dir, all_tests, parallel_test
batch_size = max(1, len(parallel_tests) // jobs)
parallel_tests_array = []
for _ in range(jobs):
parallel_tests_array.append((None, batch_size, suite, suite_dir, suite_tmp_dir))
parallel_tests_array.append((None, batch_size, suite, suite_dir, suite_tmp_dir, all_tags))
with closing(multiprocessing.Pool(processes=jobs)) as pool:
pool.map_async(run_tests_array, parallel_tests_array)
@ -935,11 +884,11 @@ def do_run_tests(jobs, suite, suite_dir, suite_tmp_dir, all_tests, parallel_test
pool.join()
run_tests_array((sequential_tests, len(sequential_tests), suite, suite_dir, suite_tmp_dir))
run_tests_array((sequential_tests, len(sequential_tests), suite, suite_dir, suite_tmp_dir, all_tags))
return len(sequential_tests) + len(parallel_tests)
else:
num_tests = len(all_tests)
run_tests_array((all_tests, num_tests, suite, suite_dir, suite_tmp_dir))
run_tests_array((all_tests, num_tests, suite, suite_dir, suite_tmp_dir, all_tags))
return num_tests
@ -1053,23 +1002,10 @@ def main(args):
"Server is not responding. Cannot execute 'SELECT 1' query. \
If you are using split build, you have to specify -c option.")
build_flags = collect_build_flags(args.client)
if args.replicated_database:
build_flags.append(BuildFlags.DATABASE_REPLICATED)
if args.use_skip_list:
tests_to_skip_from_list = collect_tests_to_skip(args.skip_list_path, build_flags)
else:
tests_to_skip_from_list = set()
args.build_flags = collect_build_flags(args.client)
if args.skip:
args.skip = set(args.skip) | tests_to_skip_from_list
else:
args.skip = tests_to_skip_from_list
if args.use_skip_list and not args.sequential:
args.sequential = collect_sequential_list(args.skip_list_path)
args.skip = set(args.skip)
base_dir = os.path.abspath(args.queries)
tmp_dir = os.path.abspath(args.tmp)
@ -1148,19 +1084,21 @@ def main(args):
all_tests = get_tests_list(
suite_dir, args.test, args.test_runs, tests_in_suite_key_func)
jobs = args.jobs
all_tags = read_test_tags(suite_dir, all_tests)
parallel_tests = []
sequential_tests = []
if args.sequential:
for test in all_tests:
if any(s in test for s in args.sequential):
sequential_tests.append(test)
else:
sequential_tests = collect_sequential_list(all_tags)
for test in all_tests:
if any(s in test for s in args.sequential):
sequential_tests.append(test)
else:
parallel_tests.append(test)
sequential_tests_set = set(sequential_tests)
parallel_tests = [test for test in all_tests if test not in sequential_tests_set]
total_tests_run += do_run_tests(
jobs, suite, suite_dir, suite_tmp_dir, all_tests, parallel_tests, sequential_tests, args.parallel)
args.jobs, suite, suite_dir, suite_tmp_dir, all_tests, all_tags, parallel_tests, sequential_tests, args.parallel)
if server_died.is_set():
exit_code.value = 1
@ -1232,40 +1170,58 @@ def get_additional_client_options_url(args):
return ''
def collect_tests_to_skip(skip_list_path, build_flags):
result = set([])
def read_test_tags(suite_dir: str, all_tests: List[str]) -> Dict[str, Set[str]]:
def get_comment_sign(filename):
if filename.endswith('.sql') or filename.endswith('.sql.j2'):
return '--'
elif filename.endswith('.sh') or filename.endswith('.py') or filename.endswith('.expect'):
return '#'
else:
raise Exception(f'Unknown file_extension: {filename}')
if not os.path.exists(skip_list_path):
return result
def parse_tags_from_line(line, comment_sign):
if not line.startswith(comment_sign):
return None
tags_str = line[len(comment_sign):].lstrip()
tags_prefix = "Tags:"
if not tags_str.startswith(tags_prefix):
return None
tags_str = tags_str[len(tags_prefix):]
tags = tags_str.split(',')
tags = {tag.strip() for tag in tags}
return tags
with open(skip_list_path, 'r') as skip_list_file:
content = skip_list_file.read()
def is_shebang(line):
return line.startswith('#!')
# allows to have comments in skip_list.json
skip_dict = json.loads(json_minify(content))
def load_tags_from_file(filepath):
with open(filepath, 'r') as file:
try:
line = file.readline()
if is_shebang(line):
line = file.readline()
except UnicodeDecodeError:
return []
return parse_tags_from_line(line, get_comment_sign(filepath))
for build_flag in build_flags:
result |= set(skip_dict[build_flag])
count = len(result)
if count > 0:
print(f"Found file with skip-list {skip_list_path}, {count} test will be skipped")
return result
all_tags = {}
start_time = datetime.now()
for test_name in all_tests:
tags = load_tags_from_file(os.path.join(suite_dir, test_name))
if tags:
all_tags[test_name] = tags
elapsed = (datetime.now() - start_time).total_seconds()
if elapsed > 1:
print(f"Tags for suite {suite_dir} read in {elapsed:.2f} seconds")
return all_tags
def collect_sequential_list(skip_list_path):
if not os.path.exists(skip_list_path):
return set([])
with open(skip_list_path, 'r') as skip_list_file:
content = skip_list_file.read()
# allows to have comments in skip_list.json
skip_dict = json.loads(json_minify(content))
if 'parallel' in skip_dict:
return skip_dict['parallel']
return set([])
def collect_sequential_list(all_tags: Dict[str, Set[str]]) -> List[str]:
res = []
for test_name, tags in all_tags.items():
if ('no-parallel' in tags) or ('sequential' in tags):
res.append(test_name)
return res
if __name__ == '__main__':
@ -1308,10 +1264,9 @@ if __name__ == '__main__':
parser.add_argument('--test-runs', default=1, nargs='?', type=int, help='Run each test many times (useful for e.g. flaky check)')
parser.add_argument('-U', '--unified', default=3, type=int, help='output NUM lines of unified context')
parser.add_argument('-r', '--server-check-retries', default=30, type=int, help='Num of tries to execute SELECT 1 before tests started')
parser.add_argument('--skip-list-path', help="Path to skip-list file")
parser.add_argument('--use-skip-list', action='store_true', default=False, help="Use skip list to skip tests if found")
parser.add_argument('--db-engine', help='Database engine name')
parser.add_argument('--replicated-database', action='store_true', default=False, help='Run tests with Replicated database engine')
parser.add_argument('--fast-tests-only', action='store_true', default=False, help='Run only fast tests (the tests without the "no-fasttest" tag)')
parser.add_argument('--no-stateless', action='store_true', help='Disable all stateless tests')
parser.add_argument('--no-stateful', action='store_true', help='Disable all stateful tests')
parser.add_argument('--skip', nargs='+', help="Skip these tests")
@ -1358,12 +1313,6 @@ if __name__ == '__main__':
print("Using queries from '" + args.queries + "' directory")
if args.skip_list_path is None:
args.skip_list_path = os.path.join(args.queries, 'skip_list.json')
if args.sequential is None:
args.sequential = set([])
if args.tmp is None:
args.tmp = args.queries
if args.client is None:

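To make the new flow concrete, here is a minimal standalone sketch (hypothetical test names; the helper bodies are simplified copies of parse_tags_from_line and collect_sequential_list above):

def parse_tags_from_line(line, comment_sign):
    # Returns the set of tags from a first-line comment like "-- Tags: a, b", or None.
    if not line.startswith(comment_sign):
        return None
    tags_str = line[len(comment_sign):].lstrip()
    if not tags_str.startswith("Tags:"):
        return None
    return {tag.strip() for tag in tags_str[len("Tags:"):].split(',')}

def collect_sequential_list(all_tags):
    # Tests tagged no-parallel/sequential must not run in parallel with others.
    return [name for name, tags in all_tags.items()
            if ('no-parallel' in tags) or ('sequential' in tags)]

all_tags = {
    '01234_example.sql': parse_tags_from_line('-- Tags: long, no-parallel', '--'),
    '01235_example.sh': parse_tags_from_line('# Tags: no-fasttest', '#'),
}
print(collect_sequential_list(all_tags))  # ['01234_example.sql']
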
View File

@ -112,12 +112,10 @@
"01153_attach_mv_uuid",
"01157_replace_table",
"01185_create_or_replace_table",
/// Sometimes cannot lock file most likely due to concurrent or adjacent tests, but we don't care how it works in Ordinary database.
"rocksdb",
"rocksdb", /// Sometimes cannot lock file most likely due to concurrent or adjacent tests, but we don't care how it works in Ordinary database
"01914_exchange_dictionaries" /// Requires Atomic database
],
"database-replicated": [
/// Unclassified
"memory_tracking",
"memory_usage",
"live_view",
@ -125,68 +123,67 @@
"01269_create_with_null",
"01451_replicated_detach_drop_and_quorum",
"01188_attach_table_from_path",
/// ON CLUSTER is not allowed
"01181_db_atomic_drop_on_cluster",
"01175_distributed_ddl_output_mode",
"01181_db_atomic_drop_on_cluster", /// ON CLUSTER is not allowed
"01175_distributed_ddl_output_mode", /// ON CLUSTER is not allowed
"01415_sticking_mutations",
/// user_files
"01721_engine_file_truncate_on_insert",
/// Fails due to additional replicas or shards
"quorum",
"01650_drop_part_and_deduplication_zookeeper",
"01532_execute_merges_on_single_replica",
"00652_replicated_mutations_default_database_zookeeper",
"00620_optimize_on_nonleader_replica_zookeeper",
"01158_zookeeper_log",
/// grep -c
"01018_ddl_dictionaries_bad_queries",
"00908_bloom_filter_index",
/// Unsupported type of ALTER query
"01650_fetch_patition_with_macro_in_zk_path",
"01451_detach_drop_part",
"01451_replicated_detach_drop_part",
"01417_freeze_partition_verbose",
"01417_freeze_partition_verbose_zookeeper",
"01130_in_memory_parts_partitons",
"01060_shutdown_table_after_detach",
"01021_only_tuple_columns",
"01015_attach_part",
"00955_test_final_mark",
"00753_alter_attach",
"00626_replace_partition_from_table_zookeeper",
"00626_replace_partition_from_table",
"00152_insert_different_granularity",
"00054_merge_tree_partitions",
"01781_merge_tree_deduplication",
"00980_zookeeper_merge_tree_alter_settings",
"00980_merge_alter_settings",
"02009_array_join_partition",
"02012_changed_enum_type_non_replicated",
"02012_zookeeper_changed_enum_type",
"02012_zookeeper_changed_enum_type_incompatible",
/// Old syntax is not allowed
"01062_alter_on_mutataion_zookeeper",
"00925_zookeeper_empty_replicated_merge_tree_optimize_final",
"00754_alter_modify_order_by_replicated_zookeeper",
"00652_replicated_mutations_zookeeper",
"00623_replicated_truncate_table_zookeeper",
"00516_deduplication_after_drop_partition_zookeeper",
"00446_clear_column_in_partition_concurrent_zookeeper",
"00236_replicated_drop_on_non_leader_zookeeper",
"00226_zookeeper_deduplication_and_unexpected_parts",
"00215_primary_key_order_zookeeper",
"00121_drop_column_zookeeper",
"00083_create_merge_tree_zookeeper",
"00062_replicated_merge_tree_alter_zookeeper",
/// Does not support renaming of multiple tables in single query
"00634_rename_view",
"00140_rename",
/// Different query_id
"01943_query_id_check",
/// Requires investigation
"00953_zookeeper_suetin_deduplication_bug",
"01783_http_chunk_size",
"00166_explain_estimate"
"01721_engine_file_truncate_on_insert", /// user_files
"quorum", /// Fails due to additional replicas or shards
"01650_drop_part_and_deduplication_zookeeper", /// Fails due to additional replicas or shards
"01532_execute_merges_on_single_replica", /// Fails due to additional replicas or shards
"00652_replicated_mutations_default_database_zookeeper", /// Fails due to additional replicas or shards
"00620_optimize_on_nonleader_replica_zookeeper", /// Fails due to additional replicas or shards
"01158_zookeeper_log", /// Fails due to additional replicas or shards
"01018_ddl_dictionaries_bad_queries", /// grep -c
"00908_bloom_filter_index", /// grep -c
"01650_fetch_patition_with_macro_in_zk_path", /// Unsupported type of ALTER query
"01451_detach_drop_part", /// Unsupported type of ALTER query
"01451_replicated_detach_drop_part", /// Unsupported type of ALTER query
"01417_freeze_partition_verbose", /// Unsupported type of ALTER query
"01417_freeze_partition_verbose_zookeeper", /// Unsupported type of ALTER query
"01130_in_memory_parts_partitons", /// Unsupported type of ALTER query
"01060_shutdown_table_after_detach", /// Unsupported type of ALTER query
"01021_only_tuple_columns", /// Unsupported type of ALTER query
"01015_attach_part", /// Unsupported type of ALTER query
"00955_test_final_mark", /// Unsupported type of ALTER query
"00753_alter_attach", /// Unsupported type of ALTER query
"00626_replace_partition_from_table_zookeeper", /// Unsupported type of ALTER query
"00626_replace_partition_from_table", /// Unsupported type of ALTER query
"00152_insert_different_granularity", /// Unsupported type of ALTER query
"00054_merge_tree_partitions", /// Unsupported type of ALTER query
"01781_merge_tree_deduplication", /// Unsupported type of ALTER query
"00980_zookeeper_merge_tree_alter_settings", /// Unsupported type of ALTER query
"00980_merge_alter_settings", /// Unsupported type of ALTER query
"02009_array_join_partition", /// Unsupported type of ALTER query
"02012_changed_enum_type_non_replicated", /// Unsupported type of ALTER query
"02012_zookeeper_changed_enum_type", /// Unsupported type of ALTER query
"02012_zookeeper_changed_enum_type_incompatible", /// Unsupported type of ALTER query
"01062_alter_on_mutataion_zookeeper", /// Old syntax is not allowed
"00925_zookeeper_empty_replicated_merge_tree_optimize_final", /// Old syntax is not allowed
"00754_alter_modify_order_by_replicated_zookeeper", /// Old syntax is not allowed
"00652_replicated_mutations_zookeeper", /// Old syntax is not allowed
"00623_replicated_truncate_table_zookeeper", /// Old syntax is not allowed
"00516_deduplication_after_drop_partition_zookeeper", /// Old syntax is not allowed
"00446_clear_column_in_partition_concurrent_zookeeper", /// Old syntax is not allowed
"00236_replicated_drop_on_non_leader_zookeeper", /// Old syntax is not allowed
"00226_zookeeper_deduplication_and_unexpected_parts", /// Old syntax is not allowed
"00215_primary_key_order_zookeeper", /// Old syntax is not allowed
"00121_drop_column_zookeeper", /// Old syntax is not allowed
"00083_create_merge_tree_zookeeper", /// Old syntax is not allowed
"00062_replicated_merge_tree_alter_zookeeper", /// Old syntax is not allowed
"00634_rename_view", /// Does not support renaming of multiple tables in single query
"00140_rename", /// Does not support renaming of multiple tables in single query
"01943_query_id_check", /// Different query_id
"00953_zookeeper_suetin_deduplication_bug", /// Requires investigation
"01783_http_chunk_size", /// Requires investigation
"00166_explain_estimate" /// Requires investigation
],
"polymorphic-parts": [
"01508_partition_pruning_long", /// bug, shoud be fixed


@ -0,0 +1,429 @@
#!/usr/bin/python3
import os
import time
TEST_FILE_EXTENSIONS = ['.sql', '.sql.j2', '.sh', '.py', '.expect']
TEST_FILE_EXTENSIONS += [ext + '.disabled' for ext in TEST_FILE_EXTENSIONS]
TAGS_PREFIX = "Tags:"
def parse_skip_list_json(text):
pos = 0
def skip_spaces():
nonlocal pos
start_pos = pos
while pos < len(text) and text[pos].isspace():
pos += 1
return pos > start_pos
def skip_comment():
nonlocal pos
if text.startswith('//', pos):
end_of_line = text.find('\n', pos + 1)
if end_of_line == -1:
pos = len(text)
return True
pos = end_of_line + 1
return True
elif text.startswith('/*', pos):
end_of_comment = text.find('*/', pos + 2)
if end_of_comment == -1:
raise Exception(f'Not found the end of a comment at pos {pos}')
pos = end_of_comment + 2
return True
else:
return False
def skip_spaces_or_comments():
while skip_spaces() or skip_comment():
pass
def skip_char_only(c):
nonlocal pos
if not text.startswith(c, pos):
return False
pos += 1
return True
def skip_char(c):
skip_spaces_or_comments()
return skip_char_only(c)
def expect_char(c):
nonlocal pos
skip_spaces_or_comments()
if not text.startswith(c, pos):
raise Exception(f"Expected '{c}' at pos {pos}")
pos += 1
def parse_quoted_string():
nonlocal pos
skip_spaces_or_comments()
expect_char('"')
end_of_string = text.find('"', pos)
if end_of_string == -1:
raise Exception(f'Not found the end of a quoted string at pos {pos-1}')
str = text[pos:end_of_string]
pos = end_of_string + 1
return str
def parse_description_comment():
nonlocal pos
while pos < len(text) and (text[pos] == ' ' or text[pos] == '\t'):
pos += 1
if not text.startswith('///', pos):
return None
end_of_line = text.find('\n', pos + 3)
if end_of_line == -1:
description = text[pos+3:]
pos = len(text)
else:
description = text[pos+3:end_of_line]
pos = end_of_line + 1
description = description.strip()
return description
res = {}
expect_char('{')
while not skip_char('}'):
build_flag = parse_quoted_string()
expect_char(':')
expect_char('[')
patterns = []
while not skip_char(']'):
pattern = parse_quoted_string()
skip_char_only(',')
description = parse_description_comment()
patterns.append((pattern, description))
skip_char(',')
res[build_flag] = patterns
return res
def load_skip_list_json(path):
if not os.path.exists(path):
raise Exception(f'File {path} not found')
with open(path, 'r') as file:
contents = file.read()
skip_dict = parse_skip_list_json(contents)
return skip_dict
def parse_fasttest_run_sh(text):
mark = 'TESTS_TO_SKIP=('
pos = text.find(mark)
if pos == -1:
raise Exception('TESTS_TO_SKIP not found in fasttest/run.sh')
pos += len(mark)
def skip_spaces():
nonlocal pos
start_pos = pos
while pos < len(text) and text[pos].isspace():
pos += 1
return pos > start_pos
def skip_comment():
nonlocal pos
if text.startswith('#', pos):
end_of_line = text.find('\n', pos + 1)
if end_of_line == -1:
pos = len(text)
return True
pos = end_of_line + 1
return True
else:
return False
def skip_spaces_or_comments():
while skip_spaces() or skip_comment():
pass
def skip_char(c):
nonlocal pos
skip_spaces_or_comments()
if not text.startswith(c, pos):
return False
pos += 1
return True
def parse_test_pattern():
nonlocal pos
skip_spaces_or_comments()
cur_pos = pos
while (cur_pos < len(text)) and (text[cur_pos].isalnum() or text[cur_pos] == '_'):
cur_pos += 1
if cur_pos == pos:
raise Exception(f"Couldn't read a test's name or pattern at pos {pos}")
pattern = text[pos:cur_pos]
pos = cur_pos
return pattern
def parse_description_comment():
nonlocal pos
while pos < len(text) and (text[pos] == ' ' or text[pos] == '\t'):
pos += 1
if not text.startswith('#', pos):
return None
end_of_line = text.find('\n', pos + 1)
if end_of_line == -1:
description = text[pos+1:]
pos = len(text)
else:
description = text[pos+1:end_of_line]
pos = end_of_line + 1
description = description.strip()
return description
patterns = []
while not skip_char(')'):
pattern = parse_test_pattern()
description = parse_description_comment()
patterns.append((pattern, description))
return {"fasttest": patterns}
def load_fasttest_run_sh(path):
if not os.path.exists(path):
raise Exception(f'File {path} not found')
with open(path, 'r') as file:
contents = file.read()
skip_dict = parse_fasttest_run_sh(contents)
return skip_dict
def get_comment_sign(filename):
if filename.endswith('.disabled'):
filename = filename[:-len('.disabled')]
if filename.endswith('.sql') or filename.endswith('.sql.j2'):
return '--'
elif filename.endswith('.sh') or filename.endswith('.py') or filename.endswith('.expect'):
return '#'
else:
raise Exception(f'Unknown file_extension: {filename}')
def is_shebang(line):
return line.startswith('#!')
def parse_tags_from_line(line, comment_sign):
if not line.startswith(comment_sign):
return None
tags_str = line[len(comment_sign):].lstrip()
if not tags_str.startswith(TAGS_PREFIX):
return None
tags_str = tags_str[len(TAGS_PREFIX):]
tags = tags_str.split(',')
tags = [tag.strip() for tag in tags]
return tags
def format_tags_to_line(tags, comment_sign):
return comment_sign + ' ' + TAGS_PREFIX + ' ' + ', '.join(tags) + '\n'
def load_tags_from_file(filepath):
with open(filepath, 'r') as file:
try:
line = file.readline()
if is_shebang(line):
line = file.readline()
except UnicodeDecodeError:
return []
return parse_tags_from_line(line, get_comment_sign(filepath))
def save_tags_to_file(filepath, tags, description = {}):
if not tags:
return
with open(filepath, 'r') as file:
contents = file.read()
# Skip shebang.
shebang_line = ''
eol = contents.find('\n')
if eol != -1 and is_shebang(contents[:eol+1]):
shebang_line = contents[:eol+1]
contents = contents[eol+1:]
# Skip tag line with description lines.
eol = contents.find('\n')
comment_sign = get_comment_sign(filepath)
if eol != -1 and parse_tags_from_line(contents[:eol+1], comment_sign):
contents = contents[eol+1:]
while True:
eol = contents.find('\n')
if eol == -1 or contents[:eol+1].isspace():
break
contents = contents[eol+1:]
# Skip an empty line after tags.
eol = contents.find('\n')
if eol != -1 and contents[:eol+1].isspace():
contents = contents[eol+1:]
empty_line = '\n'
# New tags line.
tags_line = format_tags_to_line(tags, comment_sign)
# New description lines.
tags_with_descriptions = []
for tag in tags:
if description.get(tag):
tags_with_descriptions.append(tag)
description_lines = ''
if tags_with_descriptions:
for tag in tags_with_descriptions:
description_lines += comment_sign + ' Tag ' + tag + ': ' + description[tag] + '\n'
contents = shebang_line + tags_line + description_lines + empty_line + contents
with open(filepath, 'w') as file:
file.write(contents)
print(f'Changed {filepath}')
def build_flag_to_tag(build_flag):
if build_flag == "thread-sanitizer":
return "no-tsan"
elif build_flag == "address-sanitizer":
return "no-asan"
elif build_flag == "ub-sanitizer":
return "no-ubsan"
elif build_flag == "memory-sanitizer":
return "no-msan"
elif build_flag == "database-replicated":
return "no-replicated-database"
elif build_flag == "database-ordinary":
return "no-ordinary-database"
elif build_flag == "debug-build":
return "no-debug"
elif build_flag == "release-build":
return "no-release"
elif build_flag == "unbundled-build":
return "no-unbundled"
else:
return "no-" + build_flag
def get_tags(test_name, skip_list):
tags = []
descriptions = {}
if test_name.endswith('.disabled'):
tags.append("disabled")
if 'deadlock' in test_name:
tags.append("deadlock")
elif 'race' in test_name:
tags.append("race")
elif 'long' in test_name:
tags.append("long")
if 'replica' in test_name:
tags.append("replica")
elif 'zookeeper' in test_name:
tags.append("zookeeper")
if 'distributed' in test_name:
tags.append("distributed")
elif 'shard' in test_name:
tags.append("shard")
elif 'global' in test_name:
tags.append("global")
for build_flag, patterns in skip_list.items():
for pattern, description in patterns:
if pattern in test_name:
tag = build_flag_to_tag(build_flag)
if not tag in tags:
tags.append(tag)
if description:
descriptions[tag] = description
return tags, descriptions
def load_all_tags(base_dir):
def get_comment_sign(filename):
if filename.endswith('.sql') or filename.endswith('.sql.j2'):
return '--'
elif filename.endswith('.sh') or filename.endswith('.py') or filename.endswith('.expect'):
return '#'
else:
raise Exception(f'Unknown file_extension: {filename}')
def parse_tags_from_line(line, comment_sign):
if not line.startswith(comment_sign):
return None
tags_str = line[len(comment_sign):].lstrip()
tags_prefix = "Tags:"
if not tags_str.startswith(tags_prefix):
return None
tags_str = tags_str[len(tags_prefix):]
tags = tags_str.split(',')
tags = {tag.strip() for tag in tags}
return tags
def is_shebang(line):
return line.startswith('#!')
def load_tags_from_file(filepath):
with open(filepath, 'r') as file:
try:
line = file.readline()
if is_shebang(line):
line = file.readline()
except UnicodeDecodeError:
return []
return parse_tags_from_line(line, get_comment_sign(filepath))
all_tags = {}
for suite in os.listdir(base_dir):
suite_dir = os.path.join(base_dir, suite)
if not os.path.isdir(suite_dir):
continue
for test_name in os.listdir(suite_dir):
test_path = os.path.join(suite_dir, test_name)
if not os.path.isfile(test_path) or all(not test_path.endswith(supported_ext) for supported_ext in TEST_FILE_EXTENSIONS):
continue
tags = load_tags_from_file(test_path)
if tags:
all_tags[test_path] = tags
return all_tags
def load_all_tags_timing(base_dir):
start_time = time.time()
print(type(load_all_tags(base_dir)))
print("--- %s seconds ---" % (time.time() - start_time))
def main():
base_dir = os.path.dirname(__file__)
print(f'base_dir={base_dir}')
#return load_all_tags_timing(base_dir)
skip_dict = load_skip_list_json(os.path.join(base_dir, 'skip_list.json'))
skip_dict_from_fasttest_run_sh = load_fasttest_run_sh(os.path.join(base_dir, '../../docker/test/fasttest/run.sh'))
skip_dict = {**skip_dict, **skip_dict_from_fasttest_run_sh}
#print(f'skip_dict={skip_dict}')
for suite in os.listdir(base_dir):
suite_dir = os.path.join(base_dir, suite)
if not os.path.isdir(suite_dir):
continue
for test_name in os.listdir(suite_dir):
test_path = os.path.join(suite_dir, test_name)
if not os.path.isfile(test_path) or all(not test_path.endswith(supported_ext) for supported_ext in TEST_FILE_EXTENSIONS):
continue
tags, descriptions = get_tags(test_path, skip_dict)
save_tags_to_file(test_path, tags, descriptions)
if __name__ == '__main__':
main()
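
As a rough usage sketch of the conversion above (made-up test name, a skip-list entry taken from this commit, and assuming the helpers defined in this file are in scope):

tags, descriptions = get_tags(
    '01234_example_zookeeper.sql',
    {'database-replicated': [('01234_example', 'ON CLUSTER is not allowed')]})
# tags == ['zookeeper', 'no-replicated-database']
# descriptions == {'no-replicated-database': 'ON CLUSTER is not allowed'}
print(format_tags_to_line(tags, get_comment_sign('01234_example_zookeeper.sql')), end='')
# prints: -- Tags: zookeeper, no-replicated-database

save_tags_to_file() would then prepend that line (plus a "-- Tag no-replicated-database: ..." description line and a blank line) to the test file.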