mirror of
https://github.com/ClickHouse/ClickHouse.git
synced 2024-11-21 15:12:02 +00:00
fixed bug with ClickHouseDictionarySource & test for all sources added
This commit is contained in:
parent
64a4640e0e
commit
c0051d9cd9
@ -74,6 +74,7 @@ ClickHouseDictionarySource::ClickHouseDictionarySource(
|
||||
/// We should set user info even for the case when the dictionary is loaded in-process (without TCP communication).
|
||||
context.setUser(user, password, Poco::Net::SocketAddress("127.0.0.1", 0), {});
|
||||
/// Processors are not supported here yet.
|
||||
context.setSettings(context_.getSettings());
|
||||
context.setSetting("experimental_use_processors", false);
|
||||
/// Query context is needed because some code in executeQuery function may assume it exists.
|
||||
/// Current example is Context::getSampleBlockCache from InterpreterSelectWithUnionQuery::getSampleBlock.
|
||||
@ -217,6 +218,8 @@ void registerDictionarySourceClickHouse(DictionarySourceFactory & factory)
|
||||
bool /* check_config */) -> DictionarySourcePtr
|
||||
{
|
||||
Context context_local_copy = copyContextAndApplySettings(config_prefix, context, config);
|
||||
|
||||
std::cerr << "initialization: " << context_local_copy.getSettings().max_bytes_to_read << '\n';
|
||||
/// Note that processors are not supported yet (see constructor),
|
||||
/// hence it is not possible to override experimental_use_processors setting
|
||||
return std::make_unique<ClickHouseDictionarySource>(dict_struct, config, config_prefix + ".clickhouse", sample_block, context_local_copy);
|
||||
|
@ -0,0 +1,30 @@
|
||||
<?xml version="1.0"?>
|
||||
<yandex>
|
||||
<logger>
|
||||
<level>trace</level>
|
||||
<log>/var/log/clickhouse-server/clickhouse-server.log</log>
|
||||
<errorlog>/var/log/clickhouse-server/clickhouse-server.err.log</errorlog>
|
||||
<size>1000M</size>
|
||||
<count>10</count>
|
||||
</logger>
|
||||
|
||||
<tcp_port>9000</tcp_port>
|
||||
<listen_host>127.0.0.1</listen_host>
|
||||
|
||||
<openSSL>
|
||||
<client>
|
||||
<cacheSessions>true</cacheSessions>
|
||||
<verificationMode>none</verificationMode>
|
||||
<invalidCertificateHandler>
|
||||
<name>AcceptCertificateHandler</name>
|
||||
</invalidCertificateHandler>
|
||||
</client>
|
||||
</openSSL>
|
||||
|
||||
<max_concurrent_queries>500</max_concurrent_queries>
|
||||
<mark_cache_size>5368709120</mark_cache_size>
|
||||
<path>./clickhouse/</path>
|
||||
<users_config>users.xml</users_config>
|
||||
|
||||
<dictionaries_config>/etc/clickhouse-server/config.d/*.xml</dictionaries_config>
|
||||
</yandex>
|
@ -0,0 +1,48 @@
|
||||
<yandex>
|
||||
<dictionary>
|
||||
<name>test_clickhouse</name>
|
||||
|
||||
<source>
|
||||
<clickhouse>
|
||||
<host>localhost</host>
|
||||
<port>9000</port>
|
||||
<user>default</user>
|
||||
<password></password>
|
||||
<db>default</db>
|
||||
<table>source</table>
|
||||
</clickhouse>
|
||||
|
||||
<settings>
|
||||
<max_result_bytes>1</max_result_bytes>
|
||||
</settings>
|
||||
|
||||
</source>
|
||||
|
||||
<lifetime>600</lifetime>
|
||||
|
||||
<layout>
|
||||
<flat/>
|
||||
</layout>
|
||||
|
||||
<structure>
|
||||
<id>
|
||||
<name>id</name>
|
||||
</id>
|
||||
<attribute>
|
||||
<name>first</name>
|
||||
<type>String</type>
|
||||
<null_value></null_value>
|
||||
</attribute>
|
||||
<attribute>
|
||||
<name>second</name>
|
||||
<type>String</type>
|
||||
<null_value></null_value>
|
||||
</attribute>
|
||||
<attribute>
|
||||
<name>third</name>
|
||||
<type>String</type>
|
||||
<null_value></null_value>
|
||||
</attribute>
|
||||
</structure>
|
||||
</dictionary>
|
||||
</yandex>
|
@ -0,0 +1,45 @@
|
||||
<yandex>
|
||||
<dictionary>
|
||||
<name>test_executable</name>
|
||||
|
||||
<source>
|
||||
<executable>
|
||||
<command>cat /etc/clickhouse-server/config.d/source.csv</command>
|
||||
<format>CSVWithNames</format>
|
||||
</executable>
|
||||
|
||||
<settings>
|
||||
<format_csv_allow_single_quotes>0</format_csv_allow_single_quotes>
|
||||
<format_csv_allow_double_quotes>0</format_csv_allow_double_quotes>
|
||||
</settings>
|
||||
|
||||
</source>
|
||||
|
||||
<lifetime>600</lifetime>
|
||||
|
||||
<layout>
|
||||
<flat/>
|
||||
</layout>
|
||||
|
||||
<structure>
|
||||
<id>
|
||||
<name>id</name>
|
||||
</id>
|
||||
<attribute>
|
||||
<name>first</name>
|
||||
<type>String</type>
|
||||
<null_value></null_value>
|
||||
</attribute>
|
||||
<attribute>
|
||||
<name>second</name>
|
||||
<type>String</type>
|
||||
<null_value></null_value>
|
||||
</attribute>
|
||||
<attribute>
|
||||
<name>third</name>
|
||||
<type>String</type>
|
||||
<null_value></null_value>
|
||||
</attribute>
|
||||
</structure>
|
||||
</dictionary>
|
||||
</yandex>
|
@ -0,0 +1,45 @@
|
||||
<yandex>
|
||||
<dictionary>
|
||||
<name>test_file</name>
|
||||
|
||||
<source>
|
||||
<file>
|
||||
<path>/etc/clickhouse-server/config.d/source.csv</path>
|
||||
<format>CSVWithNames</format>
|
||||
</file>
|
||||
|
||||
<settings>
|
||||
<format_csv_allow_single_quotes>0</format_csv_allow_single_quotes>
|
||||
<format_csv_allow_double_quotes>0</format_csv_allow_double_quotes>
|
||||
</settings>
|
||||
|
||||
</source>
|
||||
|
||||
<lifetime>600</lifetime>
|
||||
|
||||
<layout>
|
||||
<flat/>
|
||||
</layout>
|
||||
|
||||
<structure>
|
||||
<id>
|
||||
<name>id</name>
|
||||
</id>
|
||||
<attribute>
|
||||
<name>first</name>
|
||||
<type>String</type>
|
||||
<null_value></null_value>
|
||||
</attribute>
|
||||
<attribute>
|
||||
<name>second</name>
|
||||
<type>String</type>
|
||||
<null_value></null_value>
|
||||
</attribute>
|
||||
<attribute>
|
||||
<name>third</name>
|
||||
<type>String</type>
|
||||
<null_value></null_value>
|
||||
</attribute>
|
||||
</structure>
|
||||
</dictionary>
|
||||
</yandex>
|
@ -0,0 +1,54 @@
|
||||
<yandex>
|
||||
<dictionary>
|
||||
<name>test_http</name>
|
||||
<source>
|
||||
<http>
|
||||
<url>http://localhost:5555/source.csv</url>
|
||||
<format>CSVWithNames</format>
|
||||
<credentials>
|
||||
<user>foo</user>
|
||||
<password>bar</password>
|
||||
</credentials>
|
||||
<headers>
|
||||
<header>
|
||||
<name>api-key</name>
|
||||
<value>secret</value>
|
||||
</header>
|
||||
</headers>
|
||||
</http>
|
||||
|
||||
<settings>
|
||||
<format_csv_allow_single_quotes>0</format_csv_allow_single_quotes>
|
||||
<format_csv_allow_double_quotes>0</format_csv_allow_double_quotes>
|
||||
</settings>
|
||||
|
||||
</source>
|
||||
|
||||
<lifetime>600</lifetime>
|
||||
|
||||
<layout>
|
||||
<flat/>
|
||||
</layout>
|
||||
|
||||
<structure>
|
||||
<id>
|
||||
<name>id</name>
|
||||
</id>
|
||||
<attribute>
|
||||
<name>first</name>
|
||||
<type>String</type>
|
||||
<null_value></null_value>
|
||||
</attribute>
|
||||
<attribute>
|
||||
<name>second</name>
|
||||
<type>String</type>
|
||||
<null_value></null_value>
|
||||
</attribute>
|
||||
<attribute>
|
||||
<name>third</name>
|
||||
<type>String</type>
|
||||
<null_value></null_value>
|
||||
</attribute>
|
||||
</structure>
|
||||
</dictionary>
|
||||
</yandex>
|
@ -0,0 +1,3 @@
|
||||
id,first,second,third
|
||||
1,'a,"b,c
|
||||
2,'d,"e,f
|
Can't render this file because it contains an unexpected character in line 3 and column 6.
|
@ -0,0 +1,23 @@
|
||||
<?xml version="1.0"?>
|
||||
<yandex>
|
||||
<profiles>
|
||||
<default>
|
||||
</default>
|
||||
</profiles>
|
||||
|
||||
<users>
|
||||
<default>
|
||||
<password></password>
|
||||
<networks incl="networks" replace="replace">
|
||||
<ip>::/0</ip>
|
||||
</networks>
|
||||
<profile>default</profile>
|
||||
<quota>default</quota>
|
||||
</default>
|
||||
</users>
|
||||
|
||||
<quotas>
|
||||
<default>
|
||||
</default>
|
||||
</quotas>
|
||||
</yandex>
|
@ -0,0 +1,86 @@
|
||||
# -*- coding: utf-8 -*-
|
||||
import argparse
|
||||
from BaseHTTPServer import BaseHTTPRequestHandler, HTTPServer
|
||||
import socket
|
||||
import ssl
|
||||
import csv
|
||||
|
||||
|
||||
# Decorator used to see if authentication works for external dictionary who use a HTTP source.
|
||||
def check_auth(fn):
|
||||
def wrapper(req):
|
||||
auth_header = req.headers.get('authorization', None)
|
||||
api_key = req.headers.get('api-key', None)
|
||||
if not auth_header or auth_header != 'Basic Zm9vOmJhcg==' or not api_key or api_key != 'secret':
|
||||
req.send_response(401)
|
||||
else:
|
||||
fn(req)
|
||||
return wrapper
|
||||
|
||||
|
||||
def start_server(server_address, data_path, schema, cert_path, address_family):
|
||||
class TSVHTTPHandler(BaseHTTPRequestHandler):
|
||||
@check_auth
|
||||
def do_GET(self):
|
||||
self.__send_headers()
|
||||
self.__send_data()
|
||||
|
||||
@check_auth
|
||||
def do_POST(self):
|
||||
ids = self.__read_and_decode_post_ids()
|
||||
print "ids=", ids
|
||||
self.__send_headers()
|
||||
self.__send_data(ids)
|
||||
|
||||
def __send_headers(self):
|
||||
self.send_response(200)
|
||||
self.send_header('Content-type', 'text/csv')
|
||||
self.end_headers()
|
||||
|
||||
def __send_data(self, only_ids = None):
|
||||
with open(data_path, 'r') as fl:
|
||||
reader = csv.reader(fl, delimiter='\t')
|
||||
for row in reader:
|
||||
if not only_ids or (row[0] in only_ids):
|
||||
self.wfile.write('\t'.join(row) + '\n')
|
||||
|
||||
def __read_and_decode_post_ids(self):
|
||||
data = self.__read_and_decode_post_data()
|
||||
return filter(None, data.split())
|
||||
|
||||
def __read_and_decode_post_data(self):
|
||||
transfer_encoding = self.headers.get("Transfer-encoding")
|
||||
decoded = ""
|
||||
if transfer_encoding == "chunked":
|
||||
while True:
|
||||
s = self.rfile.readline()
|
||||
chunk_length = int(s, 16)
|
||||
if not chunk_length:
|
||||
break
|
||||
decoded += self.rfile.read(chunk_length)
|
||||
self.rfile.readline()
|
||||
else:
|
||||
content_length = int(self.headers.get("Content-Length", 0))
|
||||
decoded = self.rfile.read(content_length)
|
||||
return decoded
|
||||
|
||||
if address_family == "ipv6":
|
||||
HTTPServer.address_family = socket.AF_INET6
|
||||
httpd = HTTPServer(server_address, TSVHTTPHandler)
|
||||
if schema == "https":
|
||||
httpd.socket = ssl.wrap_socket(httpd.socket, certfile=cert_path, server_side=True)
|
||||
httpd.serve_forever()
|
||||
|
||||
|
||||
if __name__ == "__main__":
|
||||
parser = argparse.ArgumentParser(description="Simple HTTP server returns data from file")
|
||||
parser.add_argument("--host", default="localhost")
|
||||
parser.add_argument("--port", default=5555, type=int)
|
||||
parser.add_argument("--data-path", required=True)
|
||||
parser.add_argument("--schema", choices=("http", "https"), required=True)
|
||||
parser.add_argument("--cert-path", default="./fake_cert.pem")
|
||||
parser.add_argument('--address-family', choices=("ipv4", "ipv6"), default="ipv4")
|
||||
|
||||
args = parser.parse_args()
|
||||
|
||||
start_server((args.host, args.port), args.data_path, args.schema, args.cert_path, args.address_family)
|
62
tests/integration/test_dictionary_custom_settings/test.py
Normal file
62
tests/integration/test_dictionary_custom_settings/test.py
Normal file
@ -0,0 +1,62 @@
|
||||
import os
|
||||
import pytest
|
||||
|
||||
from helpers.cluster import ClickHouseCluster
|
||||
|
||||
SCRIPT_DIR = os.path.dirname(os.path.realpath(__file__))
|
||||
config_dir = os.path.join(SCRIPT_DIR, './configs')
|
||||
DICTIONARY_FILES = [
|
||||
'configs/dictionaries/FileSourceConfig.xml',
|
||||
'configs/dictionaries/ExecutableSourceConfig.xml',
|
||||
'configs/dictionaries/source.csv',
|
||||
'configs/dictionaries/HTTPSourceConfig.xml',
|
||||
'configs/dictionaries/ClickHouseSourceConfig.xml'
|
||||
]
|
||||
|
||||
cluster = ClickHouseCluster(__file__, base_configs_dir=config_dir)
|
||||
instance = cluster.add_instance('node', main_configs=DICTIONARY_FILES, config_dir=config_dir)
|
||||
|
||||
def prepare():
|
||||
node = instance
|
||||
path = "/source.csv"
|
||||
|
||||
script_dir = os.path.dirname(os.path.realpath(__file__))
|
||||
node.copy_file_to_container(os.path.join(script_dir, './http_server.py'), '/http_server.py')
|
||||
node.copy_file_to_container(os.path.join(script_dir, 'configs/dictionaries/source.csv'), './source.csv')
|
||||
node.exec_in_container([
|
||||
"bash",
|
||||
"-c",
|
||||
"python2 /http_server.py --data-path={tbl} --schema=http --host=localhost --port=5555".format(
|
||||
tbl=path)
|
||||
], detach=True)
|
||||
|
||||
|
||||
@pytest.fixture(scope="module")
|
||||
def start_cluster():
|
||||
try:
|
||||
cluster.start()
|
||||
prepare()
|
||||
yield cluster
|
||||
finally:
|
||||
cluster.shutdown()
|
||||
|
||||
def test_work(start_cluster):
|
||||
query = instance.query
|
||||
|
||||
assert query("SELECT dictGetString('test_file', 'first', toUInt64(1))") == "\\\'a\n"
|
||||
assert query("SELECT dictGetString('test_file', 'second', toUInt64(1))") == "\"b\n"
|
||||
assert query("SELECT dictGetString('test_executable', 'first', toUInt64(1))") == "\\\'a\n"
|
||||
assert query("SELECT dictGetString('test_executable', 'second', toUInt64(1))") == "\"b\n"
|
||||
|
||||
caught_exception = ''
|
||||
try:
|
||||
instance.query("CREATE TABLE source (id UInt64, first String, second String, third String) ENGINE=File(CSVWithNames);")
|
||||
instance.query("INSERT INTO default.source VALUES (1, 'aaa', 'bbb', 'cccc'), (2, 'ddd', 'eee', 'fff')")
|
||||
instance.query("SELECT dictGetString('test_clickhouse', 'second', toUInt64(1))")
|
||||
except Exception as e:
|
||||
caught_exception = str(e)
|
||||
|
||||
assert caught_exception.find("Limit for result exceeded") != -1
|
||||
|
||||
assert query("SELECT dictGetString('test_http', 'first', toUInt64(1))") == "\\\'a\n"
|
||||
assert query("SELECT dictGetString('test_http', 'second', toUInt64(1))") == "\"b\n"
|
Loading…
Reference in New Issue
Block a user