2021-03-05 09:38:00 +00:00
# include "SharedLibraryHandler.h"
2021-10-02 07:13:14 +00:00
# include <base/scope_guard.h>
# include <base/bit_cast.h>
# include <base/find_symbols.h>
2021-06-15 19:55:21 +00:00
# include <IO/ReadHelpers.h>
2021-03-05 09:38:00 +00:00
namespace DB
{
2021-03-07 19:53:10 +00:00
namespace ErrorCodes
{
extern const int EXTERNAL_LIBRARY_ERROR ;
extern const int SIZES_OF_COLUMNS_DOESNT_MATCH ;
}
2021-03-06 18:21:40 +00:00
SharedLibraryHandler : : SharedLibraryHandler (
const std : : string & library_path_ ,
2021-03-24 08:41:42 +00:00
const std : : vector < std : : string > & library_settings ,
2021-03-24 09:23:29 +00:00
const Block & sample_block_ ,
2021-03-24 19:32:31 +00:00
const std : : vector < std : : string > & attributes_names_ )
2021-03-06 18:21:40 +00:00
: library_path ( library_path_ )
2021-03-24 08:41:42 +00:00
, sample_block ( sample_block_ )
2021-03-24 19:32:31 +00:00
, attributes_names ( attributes_names_ )
2021-03-06 18:21:40 +00:00
{
2021-03-22 14:39:17 +00:00
library = std : : make_shared < SharedLibrary > ( library_path , RTLD_LAZY ) ;
2021-03-24 07:53:15 +00:00
settings_holder = std : : make_shared < CStringsHolder > ( CStringsHolder ( library_settings ) ) ;
2021-03-06 18:21:40 +00:00
2021-03-17 08:20:14 +00:00
auto lib_new = library - > tryGet < ClickHouseLibrary : : LibraryNewFunc > ( ClickHouseLibrary : : LIBRARY_CREATE_NEW_FUNC_NAME ) ;
2021-03-06 18:21:40 +00:00
if ( lib_new )
lib_data = lib_new ( & settings_holder - > strings , ClickHouseLibrary : : log ) ;
2021-03-17 08:20:14 +00:00
else
throw Exception ( " Method libNew failed " , ErrorCodes : : EXTERNAL_LIBRARY_ERROR ) ;
2021-03-06 18:21:40 +00:00
}
2021-03-05 15:37:43 +00:00
SharedLibraryHandler : : SharedLibraryHandler ( const SharedLibraryHandler & other )
: library_path { other . library_path }
2021-03-24 09:23:29 +00:00
, sample_block { other . sample_block }
, attributes_names { other . attributes_names }
2021-03-05 15:37:43 +00:00
, library { other . library }
, settings_holder { other . settings_holder }
2021-03-05 09:38:00 +00:00
{
2021-03-17 08:20:14 +00:00
auto lib_clone = library - > tryGet < ClickHouseLibrary : : LibraryCloneFunc > ( ClickHouseLibrary : : LIBRARY_CLONE_FUNC_NAME ) ;
if ( lib_clone )
{
2021-03-05 15:37:43 +00:00
lib_data = lib_clone ( other . lib_data ) ;
2021-03-17 08:20:14 +00:00
}
else
{
auto lib_new = library - > tryGet < ClickHouseLibrary : : LibraryNewFunc > ( ClickHouseLibrary : : LIBRARY_CREATE_NEW_FUNC_NAME ) ;
if ( lib_new )
lib_data = lib_new ( & settings_holder - > strings , ClickHouseLibrary : : log ) ;
}
2021-03-05 09:38:00 +00:00
}
SharedLibraryHandler : : ~ SharedLibraryHandler ( )
{
2021-03-17 08:20:14 +00:00
auto lib_delete = library - > tryGet < ClickHouseLibrary : : LibraryDeleteFunc > ( ClickHouseLibrary : : LIBRARY_DELETE_FUNC_NAME ) ;
2021-03-05 09:38:00 +00:00
if ( lib_delete )
lib_delete ( lib_data ) ;
}
2021-03-05 10:43:47 +00:00
bool SharedLibraryHandler : : isModified ( )
{
2021-03-17 08:20:14 +00:00
auto func_is_modified = library - > tryGet < ClickHouseLibrary : : LibraryIsModifiedFunc > ( ClickHouseLibrary : : LIBRARY_IS_MODIFIED_FUNC_NAME ) ;
if ( func_is_modified )
2021-03-05 10:43:47 +00:00
return func_is_modified ( lib_data , & settings_holder - > strings ) ;
return true ;
}
bool SharedLibraryHandler : : supportsSelectiveLoad ( )
{
2021-03-17 08:20:14 +00:00
auto func_supports_selective_load = library - > tryGet < ClickHouseLibrary : : LibrarySupportsSelectiveLoadFunc > ( ClickHouseLibrary : : LIBRARY_SUPPORTS_SELECTIVE_LOAD_FUNC_NAME ) ;
if ( func_supports_selective_load )
2021-03-05 10:43:47 +00:00
return func_supports_selective_load ( lib_data , & settings_holder - > strings ) ;
return true ;
}
2021-03-05 09:38:00 +00:00
2021-03-24 09:23:29 +00:00
BlockInputStreamPtr SharedLibraryHandler : : loadAll ( )
2021-03-05 09:38:00 +00:00
{
2021-03-24 09:23:29 +00:00
auto columns_holder = std : : make_unique < ClickHouseLibrary : : CString [ ] > ( attributes_names . size ( ) ) ;
ClickHouseLibrary : : CStrings columns { static_cast < decltype ( ClickHouseLibrary : : CStrings : : data ) > ( columns_holder . get ( ) ) , attributes_names . size ( ) } ;
for ( size_t i = 0 ; i < attributes_names . size ( ) ; + + i )
columns . data [ i ] = attributes_names [ i ] . c_str ( ) ;
2021-03-05 09:38:00 +00:00
2021-03-17 08:20:14 +00:00
auto load_all_func = library - > get < ClickHouseLibrary : : LibraryLoadAllFunc > ( ClickHouseLibrary : : LIBRARY_LOAD_ALL_FUNC_NAME ) ;
auto data_new_func = library - > get < ClickHouseLibrary : : LibraryDataNewFunc > ( ClickHouseLibrary : : LIBRARY_DATA_NEW_FUNC_NAME ) ;
auto data_delete_func = library - > get < ClickHouseLibrary : : LibraryDataDeleteFunc > ( ClickHouseLibrary : : LIBRARY_DATA_DELETE_FUNC_NAME ) ;
2021-03-05 09:38:00 +00:00
2021-03-17 08:20:14 +00:00
ClickHouseLibrary : : LibraryData data_ptr = data_new_func ( lib_data ) ;
SCOPE_EXIT ( data_delete_func ( lib_data , data_ptr ) ) ;
2021-03-05 09:38:00 +00:00
2021-03-17 08:20:14 +00:00
ClickHouseLibrary : : RawClickHouseLibraryTable data = load_all_func ( data_ptr , & settings_holder - > strings , & columns ) ;
2021-03-24 08:41:42 +00:00
auto block = dataToBlock ( data ) ;
2021-03-05 09:38:00 +00:00
return std : : make_shared < OneBlockInputStream > ( block ) ;
}
2021-03-24 09:23:29 +00:00
BlockInputStreamPtr SharedLibraryHandler : : loadIds ( const std : : vector < uint64_t > & ids )
2021-03-05 09:38:00 +00:00
{
2021-06-15 19:55:21 +00:00
const ClickHouseLibrary : : VectorUInt64 ids_data { bit_cast < decltype ( ClickHouseLibrary : : VectorUInt64 : : data ) > ( ids . data ( ) ) , ids . size ( ) } ;
2021-03-23 15:41:53 +00:00
2021-03-24 09:23:29 +00:00
auto columns_holder = std : : make_unique < ClickHouseLibrary : : CString [ ] > ( attributes_names . size ( ) ) ;
ClickHouseLibrary : : CStrings columns_pass { static_cast < decltype ( ClickHouseLibrary : : CStrings : : data ) > ( columns_holder . get ( ) ) , attributes_names . size ( ) } ;
2021-03-05 09:38:00 +00:00
2021-03-17 08:20:14 +00:00
auto load_ids_func = library - > get < ClickHouseLibrary : : LibraryLoadIdsFunc > ( ClickHouseLibrary : : LIBRARY_LOAD_IDS_FUNC_NAME ) ;
auto data_new_func = library - > get < ClickHouseLibrary : : LibraryDataNewFunc > ( ClickHouseLibrary : : LIBRARY_DATA_NEW_FUNC_NAME ) ;
auto data_delete_func = library - > get < ClickHouseLibrary : : LibraryDataDeleteFunc > ( ClickHouseLibrary : : LIBRARY_DATA_DELETE_FUNC_NAME ) ;
2021-03-05 09:38:00 +00:00
2021-03-17 08:20:14 +00:00
ClickHouseLibrary : : LibraryData data_ptr = data_new_func ( lib_data ) ;
SCOPE_EXIT ( data_delete_func ( lib_data , data_ptr ) ) ;
2021-03-05 09:38:00 +00:00
2021-03-17 08:20:14 +00:00
ClickHouseLibrary : : RawClickHouseLibraryTable data = load_ids_func ( data_ptr , & settings_holder - > strings , & columns_pass , & ids_data ) ;
2021-03-24 08:41:42 +00:00
auto block = dataToBlock ( data ) ;
2021-03-05 09:38:00 +00:00
2021-03-10 13:10:05 +00:00
return std : : make_shared < OneBlockInputStream > ( block ) ;
}
2021-03-24 08:41:42 +00:00
BlockInputStreamPtr SharedLibraryHandler : : loadKeys ( const Columns & key_columns )
2021-03-10 13:10:05 +00:00
{
auto holder = std : : make_unique < ClickHouseLibrary : : Row [ ] > ( key_columns . size ( ) ) ;
std : : vector < std : : unique_ptr < ClickHouseLibrary : : Field [ ] > > column_data_holders ;
for ( size_t i = 0 ; i < key_columns . size ( ) ; + + i )
{
auto cell_holder = std : : make_unique < ClickHouseLibrary : : Field [ ] > ( key_columns [ i ] - > size ( ) ) ;
for ( size_t j = 0 ; j < key_columns [ i ] - > size ( ) ; + + j )
{
auto data_ref = key_columns [ i ] - > getDataAt ( j ) ;
cell_holder [ j ] = ClickHouseLibrary : : Field {
. data = static_cast < const void * > ( data_ref . data ) ,
. size = data_ref . size } ;
}
holder [ i ] = ClickHouseLibrary : : Row {
. data = static_cast < ClickHouseLibrary : : Field * > ( cell_holder . get ( ) ) ,
. size = key_columns [ i ] - > size ( ) } ;
column_data_holders . push_back ( std : : move ( cell_holder ) ) ;
}
ClickHouseLibrary : : Table request_cols {
. data = static_cast < ClickHouseLibrary : : Row * > ( holder . get ( ) ) ,
. size = key_columns . size ( ) } ;
2021-03-17 08:20:14 +00:00
auto load_keys_func = library - > get < ClickHouseLibrary : : LibraryLoadKeysFunc > ( ClickHouseLibrary : : LIBRARY_LOAD_KEYS_FUNC_NAME ) ;
auto data_new_func = library - > get < ClickHouseLibrary : : LibraryDataNewFunc > ( ClickHouseLibrary : : LIBRARY_DATA_NEW_FUNC_NAME ) ;
auto data_delete_func = library - > get < ClickHouseLibrary : : LibraryDataDeleteFunc > ( ClickHouseLibrary : : LIBRARY_DATA_DELETE_FUNC_NAME ) ;
2021-03-10 13:10:05 +00:00
2021-03-17 08:20:14 +00:00
ClickHouseLibrary : : LibraryData data_ptr = data_new_func ( lib_data ) ;
SCOPE_EXIT ( data_delete_func ( lib_data , data_ptr ) ) ;
2021-03-10 13:10:05 +00:00
2021-03-17 08:20:14 +00:00
ClickHouseLibrary : : RawClickHouseLibraryTable data = load_keys_func ( data_ptr , & settings_holder - > strings , & request_cols ) ;
2021-03-24 08:41:42 +00:00
auto block = dataToBlock ( data ) ;
2021-03-10 13:10:05 +00:00
2021-03-05 09:38:00 +00:00
return std : : make_shared < OneBlockInputStream > ( block ) ;
}
2021-03-24 08:41:42 +00:00
Block SharedLibraryHandler : : dataToBlock ( const ClickHouseLibrary : : RawClickHouseLibraryTable data )
2021-03-05 09:38:00 +00:00
{
if ( ! data )
throw Exception ( " LibraryDictionarySource: No data returned " , ErrorCodes : : EXTERNAL_LIBRARY_ERROR ) ;
const auto * columns_received = static_cast < const ClickHouseLibrary : : Table * > ( data ) ;
if ( columns_received - > error_code )
throw Exception (
" LibraryDictionarySource: Returned error: " + std : : to_string ( columns_received - > error_code ) + " " + ( columns_received - > error_string ? columns_received - > error_string : " " ) ,
ErrorCodes : : EXTERNAL_LIBRARY_ERROR ) ;
2021-03-17 08:20:14 +00:00
MutableColumns columns = sample_block . cloneEmptyColumns ( ) ;
2021-03-05 09:38:00 +00:00
for ( size_t col_n = 0 ; col_n < columns_received - > size ; + + col_n )
{
if ( columns . size ( ) ! = columns_received - > data [ col_n ] . size )
throw Exception (
" LibraryDictionarySource: Returned unexpected number of columns: " + std : : to_string ( columns_received - > data [ col_n ] . size ) + " , must be " + std : : to_string ( columns . size ( ) ) ,
ErrorCodes : : SIZES_OF_COLUMNS_DOESNT_MATCH ) ;
for ( size_t row_n = 0 ; row_n < columns_received - > data [ col_n ] . size ; + + row_n )
{
const auto & field = columns_received - > data [ col_n ] . data [ row_n ] ;
if ( ! field . data )
{
/// sample_block contains null_value (from config) inside corresponding column
const auto & col = sample_block . getByPosition ( row_n ) ;
columns [ row_n ] - > insertFrom ( * ( col . column ) , 0 ) ;
}
else
{
const auto & size = field . size ;
columns [ row_n ] - > insertData ( static_cast < const char * > ( field . data ) , size ) ;
}
}
}
return sample_block . cloneWithColumns ( std : : move ( columns ) ) ;
}
}