ClickHouse/tests/integration/test_catboost_model_reload/test.py

133 lines
3.9 KiB
Python
Raw Normal View History

2021-04-18 10:38:36 +00:00
import os
import subprocess
import sys
import time

import pytest
sys.path.insert(0, os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
SCRIPT_DIR = os.path.dirname(os.path.realpath(__file__))
from helpers.cluster import ClickHouseCluster
# Single-instance cluster shared by every test in this module.
cluster = ClickHouseCluster(__file__)

# The instance is started with the model and CatBoost library configs.
# NOTE(review): stay_alive=True is presumably required so that the fixture
# can call node.restart_clickhouse() - confirm against helpers.cluster.
node = cluster.add_instance(
    "node",
    main_configs=["config/models_config.xml", "config/catboost_lib.xml"],
    stay_alive=True,
)
2021-04-18 10:38:36 +00:00
def copy_file_to_container(local_path, dist_path, container_id):
    """Copy a local file or directory into a Docker container via ``docker cp``.

    Args:
        local_path: Source path on the host.
        dist_path: Destination path inside the container.
        container_id: ID (or name) of the target container.

    Raises:
        subprocess.CalledProcessError: If ``docker cp`` exits with a non-zero
            status. The previous ``os.system`` call discarded the exit status,
            so a failed copy went unnoticed until a later query failed.
    """
    # Pass an argv list instead of a shell string so that paths containing
    # spaces or shell metacharacters are handed to docker unchanged.
    subprocess.check_call(
        [
            "docker",
            "cp",
            local_path,
            "{cont_id}:{dist}".format(cont_id=container_id, dist=dist_path),
        ]
    )
2021-04-18 10:38:36 +00:00
@pytest.fixture(scope="module")
def started_cluster():
    """Start the cluster once per module, seed it, and shut it down afterwards.

    Setup copies the local ``model`` directory into the container, creates and
    fills the ``binary`` table with all four combinations of two bits, and
    restarts the server.

    Yields:
        The started ``cluster`` object.
    """
    try:
        cluster.start()

        # The trailing "/." asks `docker cp` to copy the directory's contents
        # rather than the directory itself.
        copy_file_to_container(
            os.path.join(SCRIPT_DIR, "model/."),
            "/etc/clickhouse-server/model",
            node.docker_id,
        )

        # Truth-table inputs evaluated by the tests, in insertion order.
        node.query("CREATE TABLE binary (x UInt64, y UInt64) ENGINE = TinyLog()")
        node.query("INSERT INTO binary VALUES (1, 1), (1, 0), (0, 1), (0, 0)")

        # NOTE(review): presumably restarts so the server comes up with the
        # copied model files already in place - confirm.
        node.restart_clickhouse()

        yield cluster
    finally:
        # Runs even when startup or seeding fails, so the cluster is always
        # shut down.
        cluster.shutdown()
2021-04-18 10:38:36 +00:00
def test_model_reload(started_cluster):
    """Check that ``SYSTEM RELOAD MODEL model`` picks up a replaced model file.

    ``model.cbm`` is hard-linked first to ``conjunction.cbm`` and then to
    ``disjunction.cbm``. After each swap the model is reloaded and evaluated
    over the rows of the ``binary`` table, and the thresholded predictions are
    compared with the expected output.
    """
    if node.is_built_with_memory_sanitizer():
        pytest.skip("Memory Sanitizer cannot work with third-party shared libraries")

    model_dir = "/etc/clickhouse-server/model"
    active_model = model_dir + "/model.cbm"

    # The raw model output is mapped through exp(p) / (1 + exp(p)) and
    # thresholded at 0.5 to get a 0/1 answer per row.
    predict_query = """
        WITH modelEvaluate('model', toFloat64(x), toFloat64(y)) as prediction, exp(prediction) / (1 + exp(prediction)) as probability
        SELECT if(probability > 0.5, 1, 0) FROM binary;
    """

    # (model file to activate, expected output for rows (1,1), (1,0), (0,1), (0,0))
    cases = (
        ("conjunction.cbm", "1\n0\n0\n0\n"),
        ("disjunction.cbm", "1\n1\n1\n0\n"),
    )

    for model_file, expected in cases:
        # Drop whatever model.cbm currently points at; -f keeps the step
        # valid when no link exists yet.
        node.exec_in_container(["bash", "-c", "rm -f " + active_model])
        node.exec_in_container(
            [
                "bash",
                "-c",
                "ln {src} {dst}".format(
                    src=model_dir + "/" + model_file, dst=active_model
                ),
            ]
        )

        node.query("SYSTEM RELOAD MODEL model")

        result = node.query(predict_query)
        assert result == expected
2021-04-18 10:38:36 +00:00
def test_models_reload(started_cluster):
    """Check that ``SYSTEM RELOAD MODELS`` picks up a replaced model file.

    ``model.cbm`` is hard-linked first to ``conjunction.cbm`` and then to
    ``disjunction.cbm``. After each swap all models are reloaded and the model
    is evaluated over the rows of the ``binary`` table; the thresholded
    predictions are compared with the expected output.
    """
    if node.is_built_with_memory_sanitizer():
        pytest.skip("Memory Sanitizer cannot work with third-party shared libraries")

    model_dir = "/etc/clickhouse-server/model"
    active_model = model_dir + "/model.cbm"

    # The raw model output is mapped through exp(p) / (1 + exp(p)) and
    # thresholded at 0.5 to get a 0/1 answer per row.
    predict_query = """
        WITH modelEvaluate('model', toFloat64(x), toFloat64(y)) as prediction, exp(prediction) / (1 + exp(prediction)) as probability
        SELECT if(probability > 0.5, 1, 0) FROM binary;
    """

    # (model file to activate, expected output for rows (1,1), (1,0), (0,1), (0,0))
    cases = (
        ("conjunction.cbm", "1\n0\n0\n0\n"),
        ("disjunction.cbm", "1\n1\n1\n0\n"),
    )

    for model_file, expected in cases:
        # Drop whatever model.cbm currently points at; -f keeps the step
        # valid when no link exists yet.
        node.exec_in_container(["bash", "-c", "rm -f " + active_model])
        node.exec_in_container(
            [
                "bash",
                "-c",
                "ln {src} {dst}".format(
                    src=model_dir + "/" + model_file, dst=active_model
                ),
            ]
        )

        node.query("SYSTEM RELOAD MODELS")

        result = node.query(predict_query)
        assert result == expected