#if !defined(ARCADIA_BUILD) #include "config_core.h" #endif #if USE_MYSQL #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include "MySQLBlockInputStream.h" namespace DB { namespace ErrorCodes { extern const int NUMBER_OF_COLUMNS_DOESNT_MATCH; extern const int NOT_IMPLEMENTED; } StreamSettings::StreamSettings(const Settings & settings, bool auto_close_, bool fetch_by_name_, size_t max_retry_) : max_read_mysql_row_nums((settings.external_storage_max_read_rows) ? settings.external_storage_max_read_rows : settings.max_block_size) , max_read_mysql_bytes_size(settings.external_storage_max_read_bytes) , auto_close(auto_close_) , fetch_by_name(fetch_by_name_) , default_num_tries_on_connection_loss(max_retry_) { } MySQLBlockInputStream::Connection::Connection( const mysqlxx::PoolWithFailover::Entry & entry_, const std::string & query_str) : entry(entry_) , query{entry->query(query_str)} , result{query.use()} { } /// Used in MaterializedMySQL and in doInvalidateQuery for dictionary source. MySQLBlockInputStream::MySQLBlockInputStream( const mysqlxx::PoolWithFailover::Entry & entry, const std::string & query_str, const Block & sample_block, const StreamSettings & settings_) : log(&Poco::Logger::get("MySQLBlockInputStream")) , connection{std::make_unique(entry, query_str)} , settings{std::make_unique(settings_)} { description.init(sample_block); initPositionMappingFromQueryResultStructure(); } /// For descendant MySQLWithFailoverBlockInputStream MySQLBlockInputStream::MySQLBlockInputStream(const Block &sample_block_, const StreamSettings & settings_) : log(&Poco::Logger::get("MySQLBlockInputStream")) , settings(std::make_unique(settings_)) { description.init(sample_block_); } /// Used by MySQL storage / table function and dictionary source. MySQLWithFailoverBlockInputStream::MySQLWithFailoverBlockInputStream( mysqlxx::PoolWithFailoverPtr pool_, const std::string & query_str_, const Block & sample_block_, const StreamSettings & settings_) : MySQLBlockInputStream(sample_block_, settings_) , pool(pool_) , query_str(query_str_) { } void MySQLWithFailoverBlockInputStream::readPrefix() { size_t count_connect_attempts = 0; /// For recovering from "Lost connection to MySQL server during query" errors while (true) { try { connection = std::make_unique(pool->get(), query_str); break; } catch (const mysqlxx::ConnectionLost & ecl) /// There are two retriable failures: CR_SERVER_GONE_ERROR, CR_SERVER_LOST { LOG_WARNING(log, "Failed connection ({}/{}). Trying to reconnect... (Info: {})", count_connect_attempts, settings->default_num_tries_on_connection_loss, ecl.displayText()); } if (++count_connect_attempts > settings->default_num_tries_on_connection_loss) { LOG_ERROR(log, "Failed to create connection to MySQL. ({}/{})", count_connect_attempts, settings->default_num_tries_on_connection_loss); throw; } } initPositionMappingFromQueryResultStructure(); } namespace { using ValueType = ExternalResultDescription::ValueType; void insertValue(const IDataType & data_type, IColumn & column, const ValueType type, const mysqlxx::Value & value, size_t & read_bytes_size) { switch (type) { case ValueType::vtUInt8: assert_cast(column).insertValue(value.getUInt()); read_bytes_size += 1; break; case ValueType::vtUInt16: assert_cast(column).insertValue(value.getUInt()); read_bytes_size += 2; break; case ValueType::vtUInt32: assert_cast(column).insertValue(value.getUInt()); read_bytes_size += 4; break; case ValueType::vtUInt64: assert_cast(column).insertValue(value.getUInt()); read_bytes_size += 8; break; case ValueType::vtInt8: assert_cast(column).insertValue(value.getInt()); read_bytes_size += 1; break; case ValueType::vtInt16: assert_cast(column).insertValue(value.getInt()); read_bytes_size += 2; break; case ValueType::vtInt32: assert_cast(column).insertValue(value.getInt()); read_bytes_size += 4; break; case ValueType::vtInt64: assert_cast(column).insertValue(value.getInt()); read_bytes_size += 8; break; case ValueType::vtFloat32: assert_cast(column).insertValue(value.getDouble()); read_bytes_size += 4; break; case ValueType::vtFloat64: assert_cast(column).insertValue(value.getDouble()); read_bytes_size += 8; break; case ValueType::vtEnum8: assert_cast(column).insertValue(assert_cast &>(data_type).castToValue(value.data()).get()); read_bytes_size += assert_cast(column).byteSize(); break; case ValueType::vtEnum16: assert_cast(column).insertValue(assert_cast &>(data_type).castToValue(value.data()).get()); read_bytes_size += assert_cast(column).byteSize(); break; case ValueType::vtString: assert_cast(column).insertData(value.data(), value.size()); read_bytes_size += assert_cast(column).byteSize(); break; case ValueType::vtDate: assert_cast(column).insertValue(UInt16(value.getDate().getDayNum())); read_bytes_size += 2; break; case ValueType::vtDateTime: { ReadBufferFromString in(value); time_t time = 0; readDateTimeText(time, in, assert_cast(data_type).getTimeZone()); if (time < 0) time = 0; assert_cast(column).insertValue(time); read_bytes_size += 4; break; } case ValueType::vtUUID: assert_cast(column).insert(parse(value.data(), value.size())); read_bytes_size += assert_cast(column).byteSize(); break; case ValueType::vtDateTime64:[[fallthrough]]; case ValueType::vtDecimal32: [[fallthrough]]; case ValueType::vtDecimal64: [[fallthrough]]; case ValueType::vtDecimal128:[[fallthrough]]; case ValueType::vtDecimal256: { ReadBuffer buffer(const_cast(value.data()), value.size(), 0); data_type.getDefaultSerialization()->deserializeWholeText(column, buffer, FormatSettings{}); read_bytes_size += column.sizeOfValueIfFixed(); break; } case ValueType::vtFixedString: assert_cast(column).insertData(value.data(), value.size()); read_bytes_size += column.sizeOfValueIfFixed(); break; default: throw Exception("Unsupported value type", ErrorCodes::NOT_IMPLEMENTED); } } void insertDefaultValue(IColumn & column, const IColumn & sample_column) { column.insertFrom(sample_column, 0); } } Block MySQLBlockInputStream::readImpl() { auto row = connection->result.fetch(); if (!row) { if (settings->auto_close) connection->entry.disconnect(); return {}; } MutableColumns columns(description.sample_block.columns()); for (const auto i : collections::range(0, columns.size())) columns[i] = description.sample_block.getByPosition(i).column->cloneEmpty(); size_t num_rows = 0; size_t read_bytes_size = 0; while (row) { for (size_t index = 0; index < position_mapping.size(); ++index) { const auto value = row[position_mapping[index]]; const auto & sample = description.sample_block.getByPosition(index); bool is_type_nullable = description.types[index].second; if (!value.isNull()) { if (is_type_nullable) { ColumnNullable & column_nullable = assert_cast(*columns[index]); const auto & data_type = assert_cast(*sample.type); insertValue(*data_type.getNestedType(), column_nullable.getNestedColumn(), description.types[index].first, value, read_bytes_size); column_nullable.getNullMapData().emplace_back(false); } else { insertValue(*sample.type, *columns[index], description.types[index].first, value, read_bytes_size); } } else { insertDefaultValue(*columns[index], *sample.column); if (is_type_nullable) { ColumnNullable & column_nullable = assert_cast(*columns[index]); column_nullable.getNullMapData().back() = true; } } } ++num_rows; if (num_rows == settings->max_read_mysql_row_nums || (settings->max_read_mysql_bytes_size && read_bytes_size >= settings->max_read_mysql_bytes_size)) break; row = connection->result.fetch(); } return description.sample_block.cloneWithColumns(std::move(columns)); } void MySQLBlockInputStream::initPositionMappingFromQueryResultStructure() { position_mapping.resize(description.sample_block.columns()); if (!settings->fetch_by_name) { if (description.sample_block.columns() != connection->result.getNumFields()) throw Exception{"mysqlxx::UseQueryResult contains " + toString(connection->result.getNumFields()) + " columns while " + toString(description.sample_block.columns()) + " expected", ErrorCodes::NUMBER_OF_COLUMNS_DOESNT_MATCH}; for (const auto idx : collections::range(0, connection->result.getNumFields())) position_mapping[idx] = idx; } else { const auto & sample_names = description.sample_block.getNames(); std::unordered_set missing_names(sample_names.begin(), sample_names.end()); size_t fields_size = connection->result.getNumFields(); for (const size_t & idx : collections::range(0, fields_size)) { const auto & field_name = connection->result.getFieldName(idx); if (description.sample_block.has(field_name)) { const auto & position = description.sample_block.getPositionByName(field_name); position_mapping[position] = idx; missing_names.erase(field_name); } } if (!missing_names.empty()) { WriteBufferFromOwnString exception_message; for (auto iter = missing_names.begin(); iter != missing_names.end(); ++iter) { if (iter != missing_names.begin()) exception_message << ", "; exception_message << *iter; } throw Exception("mysqlxx::UseQueryResult must be contain the" + exception_message.str() + " columns.", ErrorCodes::NUMBER_OF_COLUMNS_DOESNT_MATCH); } } } } #endif