# ClickHouse/tests/integration/test_dictionaries_mysql/test.py
#
# Requires PyMySQL: sudo -H pip install PyMySQL
import warnings
import pymysql.cursors
import pytest
from helpers.cluster import ClickHouseCluster
import time
import logging
# Configuration files handed to the ClickHouse instance below.
DICTS = ["configs/dictionaries/mysql_dict1.xml", "configs/dictionaries/mysql_dict2.xml"]
CONFIG_FILES = ["configs/remote_servers.xml", "configs/named_collections.xml"]
USER_CONFIGS = ["configs/users.xml"]

# The single ClickHouse instance used by every test in this module,
# registered with MySQL support enabled (with_mysql=True).
cluster = ClickHouseCluster(__file__)
instance = cluster.add_instance(
    "instance",
    main_configs=CONFIG_FILES,
    user_configs=USER_CONFIGS,
    with_mysql=True,
    dictionaries=DICTS,
)
# MySQL DDL for a two-column (id, value) table in the `test` database.
# The single `{}` placeholder is the table name.
create_table_mysql_template = """
    CREATE TABLE IF NOT EXISTS `test`.`{}` (
        `id` int(11) NOT NULL,
        `value` varchar(50) NOT NULL,
        PRIMARY KEY (`id`)
    ) ENGINE=InnoDB;
    """

# ClickHouse DDL for a table with ENGINE = Dictionary.
# First `{}` is the suffix of the `dict_table_` table name, second `{}` is the
# dictionary name passed to the Dictionary engine.
create_clickhouse_dictionary_table_template = """
    CREATE TABLE IF NOT EXISTS `test`.`dict_table_{}` (`id` UInt64, `value` String) ENGINE = Dictionary({})
    """
@pytest.fixture(scope="module")
def started_cluster():
    """Start the cluster once per module and create the databases the tests use.

    Creates the MySQL database ``test``, the ClickHouse database ``test`` and
    the ClickHouse database ``clickhouse_mysql`` (MySQL engine, pointing at the
    MySQL ``test`` database).

    Yields:
        The started module-level ``cluster`` object.
    """
    try:
        cluster.start()

        # Create a MySQL database
        mysql_connection = get_mysql_conn(cluster)
        try:
            create_mysql_db(mysql_connection, "test")
        finally:
            # Close the connection even if database creation fails.
            mysql_connection.close()

        # Create database in ClickHouse
        instance.query("CREATE DATABASE IF NOT EXISTS test")

        # Create database in ClickHouse using MySQL protocol (will be used for data insertion)
        instance.query(
            "CREATE DATABASE clickhouse_mysql ENGINE = MySQL('mysql57:3306', 'test', 'root', 'clickhouse')"
        )

        yield cluster
    finally:
        cluster.shutdown()
def test_mysql_dictionaries_custom_query_full_load(started_cluster):
    """A FLAT dictionary whose MySQL source is a custom QUERY joining two tables.

    Inserts one row into each MySQL table, creates the dictionary and checks
    that selecting from it returns the joined row.
    """
    mysql_connection = get_mysql_conn(started_cluster)
    query = instance.query

    try:
        execute_mysql_query(
            mysql_connection,
            "CREATE TABLE IF NOT EXISTS test.test_table_1 (id Integer, value_1 Text);",
        )
        execute_mysql_query(
            mysql_connection,
            "CREATE TABLE IF NOT EXISTS test.test_table_2 (id Integer, value_2 Text);",
        )
        execute_mysql_query(
            mysql_connection, "INSERT INTO test.test_table_1 VALUES (1, 'Value_1');"
        )
        execute_mysql_query(
            mysql_connection, "INSERT INTO test.test_table_2 VALUES (1, 'Value_2');"
        )

        query(
            """
            CREATE DICTIONARY test_dictionary_custom_query
            (
                id UInt64,
                value_1 String,
                value_2 String
            )
            PRIMARY KEY id
            LAYOUT(FLAT())
            SOURCE(MYSQL(
                HOST 'mysql57'
                PORT 3306
                USER 'root'
                PASSWORD 'clickhouse'
                QUERY $doc$SELECT id, value_1, value_2 FROM test.test_table_1 INNER JOIN test.test_table_2 USING (id);$doc$))
            LIFETIME(0)
            """
        )

        result = query("SELECT id, value_1, value_2 FROM test_dictionary_custom_query")
        assert result == "1\tValue_1\tValue_2\n"
    finally:
        # Clean up even when the test fails: the sibling tests reuse these
        # table and dictionary names. IF EXISTS keeps the cleanup from masking
        # the original failure when an object was never created.
        try:
            query("DROP DICTIONARY IF EXISTS test_dictionary_custom_query;")
            execute_mysql_query(
                mysql_connection, "DROP TABLE IF EXISTS test.test_table_1;"
            )
            execute_mysql_query(
                mysql_connection, "DROP TABLE IF EXISTS test.test_table_2;"
            )
        finally:
            mysql_connection.close()
def test_mysql_dictionaries_custom_query_partial_load_simple_key(started_cluster):
    """A DIRECT dictionary with a custom QUERY containing a ``{condition}`` placeholder.

    Inserts one row into each MySQL table, creates the dictionary and checks
    that ``dictGet`` for key 1 returns both attribute values.
    """
    mysql_connection = get_mysql_conn(started_cluster)
    query = instance.query

    try:
        execute_mysql_query(
            mysql_connection,
            "CREATE TABLE IF NOT EXISTS test.test_table_1 (id Integer, value_1 Text);",
        )
        execute_mysql_query(
            mysql_connection,
            "CREATE TABLE IF NOT EXISTS test.test_table_2 (id Integer, value_2 Text);",
        )
        execute_mysql_query(
            mysql_connection, "INSERT INTO test.test_table_1 VALUES (1, 'Value_1');"
        )
        execute_mysql_query(
            mysql_connection, "INSERT INTO test.test_table_2 VALUES (1, 'Value_2');"
        )

        # `{condition}` is sent to ClickHouse literally (this is not a Python
        # format string).
        query(
            """
            CREATE DICTIONARY test_dictionary_custom_query
            (
                id UInt64,
                value_1 String,
                value_2 String
            )
            PRIMARY KEY id
            LAYOUT(DIRECT())
            SOURCE(MYSQL(
                HOST 'mysql57'
                PORT 3306
                USER 'root'
                PASSWORD 'clickhouse'
                QUERY $doc$SELECT id, value_1, value_2 FROM test.test_table_1 INNER JOIN test.test_table_2 USING (id) WHERE {condition};$doc$))
            """
        )

        result = query(
            "SELECT dictGet('test_dictionary_custom_query', ('value_1', 'value_2'), toUInt64(1))"
        )
        assert result == "('Value_1','Value_2')\n"
    finally:
        # Clean up even when the test fails: the sibling tests reuse these
        # table and dictionary names. IF EXISTS keeps the cleanup from masking
        # the original failure when an object was never created.
        try:
            query("DROP DICTIONARY IF EXISTS test_dictionary_custom_query;")
            execute_mysql_query(
                mysql_connection, "DROP TABLE IF EXISTS test.test_table_1;"
            )
            execute_mysql_query(
                mysql_connection, "DROP TABLE IF EXISTS test.test_table_2;"
            )
        finally:
            mysql_connection.close()
def test_mysql_dictionaries_custom_query_partial_load_complex_key(started_cluster):
    """A COMPLEX_KEY_DIRECT dictionary keyed by ``(id, id_key)`` with a custom QUERY.

    Inserts one row into each MySQL table, creates the dictionary and checks
    that ``dictGet`` for key ``(1, 'Key')`` returns both attribute values.
    """
    mysql_connection = get_mysql_conn(started_cluster)
    query = instance.query

    try:
        execute_mysql_query(
            mysql_connection,
            "CREATE TABLE IF NOT EXISTS test.test_table_1 (id Integer, id_key Text, value_1 Text);",
        )
        execute_mysql_query(
            mysql_connection,
            "CREATE TABLE IF NOT EXISTS test.test_table_2 (id Integer, id_key Text, value_2 Text);",
        )
        execute_mysql_query(
            mysql_connection,
            "INSERT INTO test.test_table_1 VALUES (1, 'Key', 'Value_1');",
        )
        execute_mysql_query(
            mysql_connection,
            "INSERT INTO test.test_table_2 VALUES (1, 'Key', 'Value_2');",
        )

        # `{condition}` is sent to ClickHouse literally (this is not a Python
        # format string).
        query(
            """
            CREATE DICTIONARY test_dictionary_custom_query
            (
                id UInt64,
                id_key String,
                value_1 String,
                value_2 String
            )
            PRIMARY KEY id, id_key
            LAYOUT(COMPLEX_KEY_DIRECT())
            SOURCE(MYSQL(
                HOST 'mysql57'
                PORT 3306
                USER 'root'
                PASSWORD 'clickhouse'
                QUERY $doc$SELECT id, id_key, value_1, value_2 FROM test.test_table_1 INNER JOIN test.test_table_2 USING (id, id_key) WHERE {condition};$doc$))
            """
        )

        result = query(
            "SELECT dictGet('test_dictionary_custom_query', ('value_1', 'value_2'), (toUInt64(1), 'Key'))"
        )
        assert result == "('Value_1','Value_2')\n"
    finally:
        # Clean up even when the test fails: the sibling tests create tables
        # with the same names but a different column set, using IF NOT EXISTS.
        # IF EXISTS keeps the cleanup from masking the original failure when
        # an object was never created.
        try:
            query("DROP DICTIONARY IF EXISTS test_dictionary_custom_query;")
            execute_mysql_query(
                mysql_connection, "DROP TABLE IF EXISTS test.test_table_1;"
            )
            execute_mysql_query(
                mysql_connection, "DROP TABLE IF EXISTS test.test_table_2;"
            )
        finally:
            mysql_connection.close()
def test_predefined_connection_configuration(started_cluster):
    """Dictionaries whose MySQL source is given by a named collection (``NAME ...``).

    Recreates the dictionary ``dict`` with several source definitions and, for
    each, either checks that the lookup of key 100 returns 200 or that the
    lookup fails.
    """
    mysql_connection = get_mysql_conn(started_cluster)
    try:
        execute_mysql_query(mysql_connection, "DROP TABLE IF EXISTS test.test_table")
        execute_mysql_query(
            mysql_connection,
            "CREATE TABLE IF NOT EXISTS test.test_table (id Integer, value Integer);",
        )
        execute_mysql_query(
            mysql_connection, "INSERT INTO test.test_table VALUES (100, 200);"
        )
    finally:
        # The MySQL connection is only needed to prepare the table.
        mysql_connection.close()

    instance.query(
        """
        DROP DICTIONARY IF EXISTS dict;
        CREATE DICTIONARY dict (id UInt32, value UInt32)
        PRIMARY KEY id
        SOURCE(MYSQL(NAME mysql1))
        LIFETIME(MIN 1 MAX 2)
        LAYOUT(HASHED());
        """
    )
    result = instance.query("SELECT dictGetUInt32(dict, 'value', toUInt64(100))")
    assert int(result) == 200

    instance.query(
        """
        DROP DICTIONARY dict;
        CREATE DICTIONARY dict (id UInt32, value UInt32)
        PRIMARY KEY id
        SOURCE(MYSQL(NAME mysql2))
        LIFETIME(MIN 1 MAX 2)
        LAYOUT(HASHED());
        """
    )
    # NOTE(review): the error text is not checked here; this relies on
    # query_and_get_error to flag a query that unexpectedly succeeds - confirm.
    instance.query_and_get_error("SELECT dictGetUInt32(dict, 'value', toUInt64(100))")

    instance.query(
        """
        DROP DICTIONARY dict;
        CREATE DICTIONARY dict (id UInt32, value UInt32)
        PRIMARY KEY id
        SOURCE(MYSQL(NAME unknown_collection))
        LIFETIME(MIN 1 MAX 2)
        LAYOUT(HASHED());
        """
    )
    # NOTE(review): same as above - only the failure itself is relied upon.
    instance.query_and_get_error("SELECT dictGetUInt32(dict, 'value', toUInt64(100))")

    instance.query(
        """
        DROP DICTIONARY dict;
        CREATE DICTIONARY dict (id UInt32, value UInt32)
        PRIMARY KEY id
        SOURCE(MYSQL(NAME mysql3 PORT 3306))
        LIFETIME(MIN 1 MAX 2)
        LAYOUT(HASHED());
        """
    )
    result = instance.query("SELECT dictGetUInt32(dict, 'value', toUInt64(100))")
    assert int(result) == 200

    instance.query(
        """
        DROP DICTIONARY IF EXISTS dict;
        CREATE DICTIONARY dict (id UInt32, value UInt32)
        PRIMARY KEY id
        SOURCE(MYSQL(NAME mysql1 connection_pool_size 0))
        LIFETIME(MIN 1 MAX 2)
        LAYOUT(HASHED());
        """
    )
    result = instance.query_and_get_error(
        "SELECT dictGetUInt32(dict, 'value', toUInt64(100))"
    )
    assert "Connection pool cannot have zero size" in result

    instance.query(
        """
        DROP DICTIONARY IF EXISTS dict;
        CREATE DICTIONARY dict (id UInt32, value UInt32)
        PRIMARY KEY id
        SOURCE(MYSQL(NAME mysql4))
        LIFETIME(MIN 1 MAX 2)
        LAYOUT(HASHED());
        """
    )
    result = instance.query_and_get_error(
        "SELECT dictGetUInt32(dict, 'value', toUInt64(100))"
    )
    assert "Connection pool cannot have zero size" in result

    instance.query(
        """
        DROP DICTIONARY IF EXISTS dict;
        CREATE DICTIONARY dict (id UInt32, value UInt32)
        PRIMARY KEY id
        SOURCE(MYSQL(NAME mysql4 connection_pool_size 1))
        LIFETIME(MIN 1 MAX 2)
        LAYOUT(HASHED());
        """
    )
    result = instance.query("SELECT dictGetUInt32(dict, 'value', toUInt64(100))")
    assert int(result) == 200

    instance.query(
        """
        DROP DICTIONARY IF EXISTS dict;
        CREATE DICTIONARY dict (id UInt32, value UInt32)
        PRIMARY KEY id
        SOURCE(MYSQL(NAME mysql4 connection_pool_size 1 close_connection 1 share_connection 1))
        LIFETIME(MIN 1 MAX 2)
        LAYOUT(HASHED());
        """
    )
    result = instance.query("SELECT dictGetUInt32(dict, 'value', toUInt64(100))")
    assert int(result) == 200
def create_mysql_db(mysql_connection, name):
    """Drop the MySQL database ``name`` if it exists and create it again with utf8.

    Args:
        mysql_connection: connection object whose ``cursor()`` is usable as a
            context manager.
        name: database name; interpolated into the statements unquoted.
    """
    with mysql_connection.cursor() as cursor:
        cursor.execute("DROP DATABASE IF EXISTS {}".format(name))
        cursor.execute("CREATE DATABASE {} DEFAULT CHARACTER SET 'utf8'".format(name))
def prepare_mysql_table(started_cluster, table_name, index):
    """Create a MySQL table, fill it through ClickHouse and expose it as a dictionary table.

    The MySQL table is named ``table_name + str(index)``. 10000 rows are
    inserted via the ``clickhouse_mysql`` database, the row count is checked,
    and a ClickHouse ``dict_table_<name>`` table over dictionary
    ``dict<index>`` is created.

    Args:
        started_cluster: cluster object passed on to ``get_mysql_conn``.
        table_name: prefix of the MySQL table name.
        index: suffix appended to the table name and to the dictionary name.
    """
    full_name = table_name + str(index)
    query = instance.query

    mysql_connection = get_mysql_conn(started_cluster)
    try:
        # Create table
        create_mysql_table(mysql_connection, full_name)

        # Insert rows using CH
        query(
            "INSERT INTO `clickhouse_mysql`.{}(id, value) select number, concat('{} value ', toString(number)) from numbers(10000) ".format(
                full_name, full_name
            )
        )
        assert (
            query("SELECT count() FROM `clickhouse_mysql`.{}".format(full_name)).rstrip()
            == "10000"
        )
    finally:
        # Close the connection even if the insert or the count check fails.
        mysql_connection.close()

    # Create CH Dictionary tables based on MySQL tables
    query(
        create_clickhouse_dictionary_table_template.format(
            full_name, "dict" + str(index)
        )
    )
def get_mysql_conn(started_cluster):
    """Open a PyMySQL connection to the cluster's MySQL server, retrying on failure.

    Makes up to five attempts and sleeps one second after each failed one.

    Args:
        started_cluster: object exposing ``mysql_ip`` and ``mysql_port``.

    Returns:
        The connection object returned by ``pymysql.connect``.

    Raises:
        Exception: if all attempts failed; the message lists every error seen.
    """
    errors = []
    last_error = None
    for _ in range(5):
        try:
            conn = pymysql.connect(
                user="root",
                password="clickhouse",
                host=started_cluster.mysql_ip,
                port=started_cluster.mysql_port,
            )
        except Exception as e:
            # Broad on purpose: any failure to connect is recorded and retried.
            last_error = e
            errors.append(str(e))
            time.sleep(1)
        else:
            logging.debug(
                "MySQL Connection established: %s:%s",
                started_cluster.mysql_ip,
                started_cluster.mysql_port,
            )
            return conn

    raise Exception("Connection not established, {}".format(errors)) from last_error
def execute_mysql_query(connection, query):
    """Execute one statement on ``connection`` and commit it.

    Python warnings raised while the statement runs are suppressed.

    Args:
        connection: connection object providing ``cursor()`` (usable as a
            context manager) and ``commit()``.
        query: SQL text passed to ``cursor.execute``.
    """
    # Lazy %-style arguments: the message is only built if DEBUG is enabled.
    logging.debug("Execute MySQL query:%s", query)
    with warnings.catch_warnings():
        warnings.simplefilter("ignore")
        with connection.cursor() as cursor:
            cursor.execute(query)
        connection.commit()
def create_mysql_table(conn, table_name):
    """Create the MySQL table ``table_name`` from ``create_table_mysql_template``.

    Args:
        conn: connection object whose ``cursor()`` is usable as a context manager.
        table_name: name substituted into the template's placeholder.
    """
    ddl = create_table_mysql_template.format(table_name)
    with conn.cursor() as cur:
        cur.execute(ddl)