ClickHouse/programs/odbc-bridge/ODBCBlockInputStream.cpp

171 lines
5.9 KiB
C++
Raw Normal View History

#include "ODBCBlockInputStream.h"
#include <vector>
2021-03-22 11:40:29 +00:00
#include <IO/ReadBufferFromString.h>
#include <DataTypes/DataTypeNullable.h>
2021-11-22 12:21:15 +00:00
#include <DataTypes/DataTypeDateTime64.h>
#include <Columns/ColumnNullable.h>
#include <Columns/ColumnString.h>
#include <Columns/ColumnsNumber.h>
#include <Common/assert_cast.h>
2018-09-05 16:20:12 +00:00
#include <IO/ReadHelpers.h>
2018-06-05 19:46:49 +00:00
#include <IO/WriteHelpers.h>
2022-04-27 15:05:45 +00:00
#include <Common/logger_useful.h>
2016-12-08 02:49:04 +00:00
namespace DB
{
namespace ErrorCodes
{
    /// Declared here, defined elsewhere. Used by ODBCSource::insertValue when it is asked
    /// to insert a value type it has no case for.
    extern const int UNKNOWN_TYPE;
}
2021-10-11 16:11:50 +00:00
ODBCSource::ODBCSource(
2021-06-07 18:09:16 +00:00
nanodbc::ConnectionHolderPtr connection_holder, const std::string & query_str, const Block & sample_block, const UInt64 max_block_size_)
2021-10-11 16:11:50 +00:00
: ISource(sample_block)
, log(&Poco::Logger::get("ODBCSource"))
2019-08-03 11:02:40 +00:00
, max_block_size{max_block_size_}
2021-03-22 11:40:29 +00:00
, query(query_str)
2016-12-08 02:49:04 +00:00
{
description.init(sample_block);
2021-06-07 18:09:16 +00:00
result = execute<nanodbc::result>(connection_holder,
[&](nanodbc::connection & connection) { return execute(connection, query); });
2016-12-08 02:49:04 +00:00
}
2021-10-11 16:11:50 +00:00
/// Fetches rows from `result` and packs them into a chunk.
///
/// Rows are read until either the result set is exhausted or `max_block_size` rows have been
/// collected. Because the row counter is compared after it is incremented, a `max_block_size`
/// of 0 never matches and the whole remaining result set is read into one chunk.
///
/// @return An empty chunk once the source has been marked finished; otherwise a chunk holding the
///         rows read by this call. If the result set runs out before any row is read, the returned
///         chunk has zero rows and the following call returns an empty chunk.
Chunk ODBCSource::generate()
{
    if (is_finished)
        return {};

    MutableColumns columns(description.sample_block.cloneEmptyColumns());
    size_t num_rows = 0;

    while (true)
    {
        if (!result.next())
        {
            is_finished = true;
            break;
        }

        /// The number of result columns is the same for every column of the row, so ask for it
        /// once per row instead of on every iteration of the column loop.
        const int num_columns = result.columns();

        for (int idx = 0; idx < num_columns; ++idx)
        {
            const auto & sample = description.sample_block.getByPosition(idx);

            if (!result.is_null(idx))
            {
                /// `description.types[idx]` is a pair: (value type, is-nullable flag).
                const bool is_nullable = description.types[idx].second;

                if (is_nullable)
                {
                    /// Write the value into the nested column and record "not null" in the null map.
                    ColumnNullable & column_nullable = assert_cast<ColumnNullable &>(*columns[idx]);
                    const auto & data_type = assert_cast<const DataTypeNullable &>(*sample.type);
                    insertValue(column_nullable.getNestedColumn(), data_type.getNestedType(), description.types[idx].first, result, idx);
                    column_nullable.getNullMapData().emplace_back(0);
                }
                else
                {
                    insertValue(*columns[idx], sample.type, description.types[idx].first, result, idx);
                }
            }
            else
            {
                /// SQL NULL: fall back to the default taken from the sample column.
                insertDefaultValue(*columns[idx], *sample.column);
            }
        }

        if (++num_rows == max_block_size)
            break;
    }

    return Chunk(std::move(columns), num_rows);
}
2021-03-22 11:40:29 +00:00
2021-10-11 16:11:50 +00:00
/// Reads the value of column `idx` from the current row of `row` and appends it to `column`.
///
/// @param column     Destination column; cast to the concrete column class matching `type`.
/// @param data_type  Data type of `column`; consulted for DateTime/DateTime64 (time zone, scale)
///                   and for Decimal text deserialization.
/// @param type       Value type that selects how the ODBC value is fetched and converted.
/// @param row        ODBC result positioned on the row to read from.
/// @param idx        Zero-based index of the column inside `row`.
///
/// @throws Exception with ErrorCodes::UNKNOWN_TYPE when `type` has no case below.
void ODBCSource::insertValue(
        IColumn & column, const DataTypePtr data_type, const ValueType type, nanodbc::result & row, size_t idx)
{
    switch (type)
    {
        case ValueType::vtUInt8:
            /// Fetched through a 16-bit type (presumably because nanodbc offers no 8-bit getter -
            /// TODO confirm) and narrowed explicitly; the stored value is the same as with the
            /// implicit conversion.
            assert_cast<ColumnUInt8 &>(column).insertValue(static_cast<UInt8>(row.get<uint16_t>(idx)));
            break;
        case ValueType::vtUInt16:
            assert_cast<ColumnUInt16 &>(column).insertValue(row.get<uint16_t>(idx));
            break;
        case ValueType::vtUInt32:
            assert_cast<ColumnUInt32 &>(column).insertValue(row.get<uint32_t>(idx));
            break;
        case ValueType::vtUInt64:
            assert_cast<ColumnUInt64 &>(column).insertValue(row.get<uint64_t>(idx));
            break;
        case ValueType::vtInt8:
            /// Same approach as vtUInt8: read as 16-bit, narrow explicitly.
            assert_cast<ColumnInt8 &>(column).insertValue(static_cast<Int8>(row.get<int16_t>(idx)));
            break;
        case ValueType::vtInt16:
            assert_cast<ColumnInt16 &>(column).insertValue(row.get<int16_t>(idx));
            break;
        case ValueType::vtInt32:
            assert_cast<ColumnInt32 &>(column).insertValue(row.get<int32_t>(idx));
            break;
        case ValueType::vtInt64:
            assert_cast<ColumnInt64 &>(column).insertValue(row.get<int64_t>(idx));
            break;
        case ValueType::vtFloat32:
            assert_cast<ColumnFloat32 &>(column).insertValue(row.get<float>(idx));
            break;
        case ValueType::vtFloat64:
            assert_cast<ColumnFloat64 &>(column).insertValue(row.get<double>(idx));
            break;
        /// All string-like value types are fetched as text and stored in a ColumnString.
        case ValueType::vtFixedString: [[fallthrough]];
        case ValueType::vtEnum8: [[fallthrough]];
        case ValueType::vtEnum16: [[fallthrough]];
        case ValueType::vtString:
            assert_cast<ColumnString &>(column).insert(row.get<std::string>(idx));
            break;
        case ValueType::vtUUID:
        {
            /// NOTE(review): a parsed UUID is inserted into a column cast to ColumnUInt128 -
            /// confirm this is the column class actually used for UUID in this codebase.
            auto value = row.get<std::string>(idx);
            assert_cast<ColumnUInt128 &>(column).insert(parse<UUID>(value.data(), value.size()));
            break;
        }
        case ValueType::vtDate:
            /// The date arrives as text; it is stored as the day number obtained from LocalDate.
            assert_cast<ColumnUInt16 &>(column).insertValue(UInt16{LocalDate{row.get<std::string>(idx)}.getDayNum()});
            break;
        case ValueType::vtDateTime:
        {
            auto value = row.get<std::string>(idx);
            ReadBufferFromString in(value);
            time_t time = 0;
            readDateTimeText(time, in, assert_cast<const DataTypeDateTime *>(data_type.get())->getTimeZone());
            /// Negative timestamps are clamped to 0 before the conversion to UInt32.
            if (time < 0)
                time = 0;
            assert_cast<ColumnUInt32 &>(column).insertValue(static_cast<UInt32>(time));
            break;
        }
        case ValueType::vtDateTime64:
        {
            auto value = row.get<std::string>(idx);
            ReadBufferFromString in(value);
            DateTime64 time = 0;
            const auto * datetime_type = assert_cast<const DataTypeDateTime64 *>(data_type.get());
            readDateTime64Text(time, datetime_type->getScale(), in, datetime_type->getTimeZone());
            assert_cast<DataTypeDateTime64::ColumnType &>(column).insertValue(time);
            break;
        }
        /// Decimals of every width are parsed from text by the data type's default serialization.
        case ValueType::vtDecimal32: [[fallthrough]];
        case ValueType::vtDecimal64: [[fallthrough]];
        case ValueType::vtDecimal128: [[fallthrough]];
        case ValueType::vtDecimal256:
        {
            auto value = row.get<std::string>(idx);
            ReadBufferFromString istr(value);
            data_type->getDefaultSerialization()->deserializeWholeText(column, istr, FormatSettings{});
            break;
        }
        default:
            throw Exception(ErrorCodes::UNKNOWN_TYPE, "Unsupported value type");
    }
}
2016-12-08 02:49:04 +00:00
}