2021-09-10 11:52:21 +00:00
|
|
|
#!/usr/bin/env python3
|
2022-07-19 13:17:05 +00:00
|
|
|
import argparse
|
2022-07-19 11:31:43 +00:00
|
|
|
import csv
|
2021-09-10 11:52:21 +00:00
|
|
|
import logging
|
|
|
|
import os
|
2024-03-11 08:45:58 +00:00
|
|
|
import shutil
|
2022-07-19 11:31:43 +00:00
|
|
|
import subprocess
|
2021-12-01 14:23:51 +00:00
|
|
|
import sys
|
2024-03-11 12:07:39 +00:00
|
|
|
from concurrent.futures import ProcessPoolExecutor
|
2023-01-03 14:23:19 +00:00
|
|
|
from pathlib import Path
|
2024-03-21 20:23:06 +00:00
|
|
|
from typing import List, Tuple
|
2021-12-01 14:23:51 +00:00
|
|
|
|
2023-12-18 12:21:13 +00:00
|
|
|
from docker_images_helper import get_docker_image, pull_image
|
2024-03-11 08:45:58 +00:00
|
|
|
from env_helper import CI, REPO_COPY, TEMP_PATH
|
2023-12-18 08:07:22 +00:00
|
|
|
from git_helper import GIT_PREFIX, git_runner
|
2022-07-19 11:31:43 +00:00
|
|
|
from pr_info import PRInfo
|
2024-02-06 12:39:34 +00:00
|
|
|
from report import ERROR, FAILURE, SUCCESS, JobReport, TestResults, read_test_results
|
2022-07-19 13:17:05 +00:00
|
|
|
from ssh import SSHKey
|
2022-07-19 11:31:43 +00:00
|
|
|
from stopwatch import Stopwatch
|
2021-09-10 14:27:03 +00:00
|
|
|
|
|
|
|
|
2022-11-14 19:02:33 +00:00
|
|
|
def process_result(
    result_directory: Path,
) -> Tuple[str, str, TestResults, List[Path]]:
    """Collect the outcome of a finished check from ``result_directory``.

    The directory is expected to contain ``check_status.tsv`` holding exactly
    one row with two tab-separated columns (state, description) and
    ``test_results.tsv`` that is parsed by ``read_test_results``.

    Args:
        result_directory: directory the check wrote its output files to.

    Returns:
        A ``(state, description, test_results, additional_files)`` tuple.
        ``additional_files`` lists every regular file found directly in
        ``result_directory``. When the status file is missing or malformed the
        state is ``ERROR`` with the description "Invalid check_status.tsv".
        When the test results cannot be read or are empty, a ``SUCCESS`` state
        is downgraded to ``ERROR``; any other state is returned unchanged.
    """
    test_results: TestResults = []
    additional_files: List[Path] = []
    # Just upload all files from result_directory.
    # If task provides processed results, then it's responsible
    # for content of result_directory.
    # is_dir() rather than exists(): iterdir() raises on a regular file.
    if result_directory.is_dir():
        additional_files = [p for p in result_directory.iterdir() if p.is_file()]

    status: List[List[str]] = []
    status_path = result_directory / "check_status.tsv"
    if status_path.exists():
        logging.info("Found check_status.tsv")
        with open(status_path, "r", encoding="utf-8") as status_file:
            status = list(csv.reader(status_file, delimiter="\t"))
    if len(status) != 1 or len(status[0]) != 2:
        # os.listdir() raises when the directory is absent; this diagnostic
        # must not turn an "invalid status" report into a crash.
        found = os.listdir(result_directory) if result_directory.is_dir() else []
        logging.info("Files in result folder %s", found)
        return ERROR, "Invalid check_status.tsv", test_results, additional_files
    state, description = status[0]

    results_path = result_directory / "test_results.tsv"
    try:
        test_results = read_test_results(results_path)
    except Exception:
        # The failure is reported through the returned state below; keep the
        # traceback in the log so the cause is not lost.
        logging.exception("Failed to read %s", results_path)

    if not test_results:
        # Unreadable and empty results are handled the same way: a check that
        # claims success without any results is reported as an error, while
        # an already failed state keeps its original description.
        if state == SUCCESS:
            state, description = ERROR, "Failed to read test_results.tsv"

    return state, description, test_results, additional_files
|
|
|
|
|
2021-11-29 14:17:17 +00:00
|
|
|
|
2022-07-19 13:17:05 +00:00
|
|
|
def parse_args():
    """Parse the command line of the style check script.

    Returns:
        The parsed ``argparse.Namespace``. Its ``push`` attribute is ``True``
        unless ``--no-push`` is given, in which case it is ``False``.
    """
    # NOTE: the text is passed positionally, i.e. as ArgumentParser's `prog`.
    cli = argparse.ArgumentParser("Check and report style issues in the repository")

    # Hidden option; it is what gives `push` its default value of True.
    cli.add_argument("--push", help=argparse.SUPPRESS, default=True)

    # The visible switch writes to the same destination and declares no default
    # of its own, so the default of the hidden option stays in effect.
    no_push_options = {
        "dest": "push",
        "action": "store_false",
        "default": argparse.SUPPRESS,
        "help": "do not commit and push automatic fixes",
    }
    cli.add_argument("--no-push", **no_push_options)

    namespace = cli.parse_args()
    return namespace
|
|
|
|
|
|
|
|
|
2022-11-14 19:02:33 +00:00
|
|
|
def commit_push_staged(pr_info: PRInfo) -> None:
    """Commit the staged changes and push them to the pull request branch.

    It works ONLY for PRs, and only over ssh, so either
    ROBOT_CLICKHOUSE_SSH_KEY should be set or ssh-agent should work.

    Nothing is done when the PR head and base names differ or when nothing
    is staged.

    Args:
        pr_info: description of the pull request; its number must be truthy.
    """
    assert pr_info.number
    same_repository = pr_info.head_name == pr_info.base_name
    if not same_repository:
        # We can't push to forks, sorry folks
        return

    staged_files = git_runner("git diff --cached --name-only")
    if not staged_files:
        return

    remote_url = pr_info.event["pull_request"]["base"]["repo"]["ssh_url"]
    # Remember the current commit before the automatic one is created
    head = git_runner("git rev-parse HEAD^{}")
    git_runner(f"{GIT_PREFIX} commit -m 'Automatic style fix'")

    commands = (
        # The fetch to avoid issue 'pushed branch tip is behind its remote'
        f"{GIT_PREFIX} fetch {remote_url} --no-recurse-submodules --depth=2 {head}",
        f"{GIT_PREFIX} push {remote_url} HEAD:{pr_info.head_ref}",
    )

    def fetch_and_push() -> None:
        for command in commands:
            git_runner(command)

    if os.getenv("ROBOT_CLICKHOUSE_SSH_KEY", ""):
        # Use the robot key for the duration of the network operations
        with SSHKey("ROBOT_CLICKHOUSE_SSH_KEY"):
            fetch_and_push()
            return

    # No dedicated key configured: run the same commands as is
    fetch_and_push()
|
2022-07-19 13:17:05 +00:00
|
|
|
|
|
|
|
|
2024-03-21 20:23:06 +00:00
|
|
|
def is_python(file: str) -> bool:
    """Tell whether a changed repository file is a python script.

    The decision is made purely on the ``.py`` file name suffix.

    WARNING: MIME detection through python-magic is deliberately not used:
    python-magic v2:0.4.24-2 is used in ubuntu 22.04, and
    `Support os.PathLike values in magic.from_file` is only from 0.4.25.
    """
    python_suffix = ".py"
    return file.endswith(python_suffix)
|
|
|
|
|
|
|
|
|
|
|
|
def is_shell(file: str) -> bool:
    """Tell whether a changed repository file is a shell script.

    The decision is made purely on the ``.sh`` file name suffix.

    WARNING: MIME detection through python-magic is deliberately not used:
    python-magic v2:0.4.24-2 is used in ubuntu 22.04, and
    `Support os.PathLike values in magic.from_file` is only from 0.4.25.
    """
    shell_suffix = ".sh"
    return file.endswith(shell_suffix)
|
2023-12-18 12:21:13 +00:00
|
|
|
|
|
|
|
|
2023-01-03 14:23:19 +00:00
|
|
|
def main():
    """Run the style checks in docker, process their output and report.

    Steps, in order:
      1. recreate the temporary output directory;
      2. decide which checks to run (all of them unless running in CI for a
         pull request, where the changed files decide);
      3. run the selected check scripts one after another in the
         ``clickhouse/style-test`` image;
      4. commit and push staged changes unless ``--no-push`` was given;
      5. post-process the output, dump a ``JobReport`` and exit with code 1
         when the resulting state is ``ERROR`` or ``FAILURE``.
    """
    logging.basicConfig(level=logging.INFO)
    logging.getLogger("git_helper").setLevel(logging.DEBUG)
    args = parse_args()

    stopwatch = Stopwatch()

    repo_path = Path(REPO_COPY)
    temp_path = Path(TEMP_PATH)
    # Always start from an empty output directory
    if temp_path.is_dir():
        shutil.rmtree(temp_path)
    temp_path.mkdir(parents=True, exist_ok=True)

    pr_info = PRInfo()
    # By default everything is checked; in CI for a PR the set of checks is
    # narrowed down according to the kinds of the changed files
    check_cpp = check_shell = check_python = True
    if CI and pr_info.number > 0:
        pr_info.fetch_changed_files()
        # Anything that is neither python nor shell triggers the source check
        check_cpp = any(
            not is_python(path) and not is_shell(path)
            for path in pr_info.changed_files
        )
        check_shell = any(is_shell(path) for path in pr_info.changed_files)
        check_python = any(is_python(path) for path in pr_info.changed_files)

    image_name = "clickhouse/style-test"
    image = pull_image(get_docker_image(image_name))
    docker_command = (
        f"docker run -u $(id -u ${{USER}}):$(id -g ${{USER}}) --cap-add=SYS_PTRACE "
        f"--volume={repo_path}:/ClickHouse --volume={temp_path}:/test_output "
        f"--entrypoint= -w/ClickHouse/utils/check-style {image}"
    )

    # (enabled, log format, command) for every check, in execution order;
    # the docs check is unconditional
    checks = (
        (True, "Run docs files check: %s", f"{docker_command} ./check_docs.sh"),
        (check_cpp, "Run source files check: %s", f"{docker_command} ./check_cpp.sh"),
        (check_python, "Run py files check: %s", f"{docker_command} ./check_py.sh"),
        (check_shell, "Run shellcheck check: %s", f"{docker_command} ./check_shell.sh"),
    )

    with ProcessPoolExecutor(max_workers=2) as executor:
        for enabled, log_format, command in checks:
            if not enabled:
                continue
            logging.info(log_format, command)
            # Parallelization does not make it faster - run subsequently
            executor.submit(subprocess.run, command, shell=True).result()

    if args.push:
        commit_push_staged(pr_info)

    # Convert the raw output into test_results.tsv and check_status.tsv; when
    # the converter itself fails, a failure status is written instead
    subprocess.check_call(
        f"python3 ../../utils/check-style/process_style_check_result.py --in-results-dir {temp_path} "
        f"--out-results-file {temp_path}/test_results.tsv --out-status-file {temp_path}/check_status.tsv || "
        f'echo -e "failure\tCannot parse results" > {temp_path}/check_status.tsv',
        shell=True,
    )

    state, description, test_results, additional_files = process_result(temp_path)

    report = JobReport(
        description=description,
        test_results=test_results,
        status=state,
        start_time=stopwatch.start_time_str,
        duration=stopwatch.duration_seconds,
        additional_files=additional_files,
    )
    report.dump()

    if state in (ERROR, FAILURE):
        print(f"Style check failed: [{description}]")
        sys.exit(1)
|
2023-01-03 14:23:19 +00:00
|
|
|
|
|
|
|
|
|
|
|
# Run the style check only when the file is executed as a script,
# not when it is imported as a module.
if __name__ == "__main__":
    main()
|