#include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include namespace DB { namespace ErrorCodes { extern const int BAD_ARGUMENTS; } ExternalTableDataPtr BaseExternalTable::getData(const Context & context) { initReadBuffer(); initSampleBlock(); auto input = context.getInputFormat(format, *read_buffer, sample_block, DEFAULT_BLOCK_SIZE); auto stream = std::make_shared(input); auto data = std::make_unique(); data->table_name = name; data->pipe = std::make_unique(std::make_shared(std::move(stream))); return data; } void BaseExternalTable::clean() { name.clear(); file.clear(); format.clear(); structure.clear(); sample_block.clear(); read_buffer.reset(); } /// Function for debugging information output void BaseExternalTable::write() { std::cerr << "file " << file << std::endl; std::cerr << "name " << name << std::endl; std::cerr << "format " << format << std::endl; std::cerr << "structure: \n"; for (const auto & elem : structure) std::cerr << '\t' << elem.first << ' ' << elem.second << std::endl; } void BaseExternalTable::parseStructureFromStructureField(const std::string & argument) { std::vector vals; splitInto<' ', ','>(vals, argument, true); if (vals.size() % 2 != 0) throw Exception("Odd number of attributes in section structure: " + std::to_string(vals.size()), ErrorCodes::BAD_ARGUMENTS); for (size_t i = 0; i < vals.size(); i += 2) structure.emplace_back(vals[i], vals[i + 1]); } void BaseExternalTable::parseStructureFromTypesField(const std::string & argument) { std::vector vals; splitInto<' ', ','>(vals, argument, true); for (size_t i = 0; i < vals.size(); ++i) structure.emplace_back("_" + toString(i + 1), vals[i]); } void BaseExternalTable::initSampleBlock() { const DataTypeFactory & data_type_factory = DataTypeFactory::instance(); for (const auto & elem : structure) { ColumnWithTypeAndName column; column.name = elem.first; column.type = data_type_factory.get(elem.second); column.column = column.type->createColumn(); sample_block.insert(std::move(column)); } } void ExternalTable::initReadBuffer() { if (file == "-") read_buffer = std::make_unique(STDIN_FILENO); else read_buffer = std::make_unique(file); } ExternalTable::ExternalTable(const boost::program_options::variables_map & external_options) { if (external_options.count("file")) file = external_options["file"].as(); else throw Exception("--file field have not been provided for external table", ErrorCodes::BAD_ARGUMENTS); if (external_options.count("name")) name = external_options["name"].as(); else throw Exception("--name field have not been provided for external table", ErrorCodes::BAD_ARGUMENTS); if (external_options.count("format")) format = external_options["format"].as(); else throw Exception("--format field have not been provided for external table", ErrorCodes::BAD_ARGUMENTS); if (external_options.count("structure")) parseStructureFromStructureField(external_options["structure"].as()); else if (external_options.count("types")) parseStructureFromTypesField(external_options["types"].as()); else throw Exception("Neither --structure nor --types have not been provided for external table", ErrorCodes::BAD_ARGUMENTS); } void ExternalTablesHandler::handlePart(const Poco::Net::MessageHeader & header, std::istream & stream) { const Settings & settings = context.getSettingsRef(); /// The buffer is initialized here, not in the virtual function initReadBuffer read_buffer_impl = std::make_unique(stream); if (settings.http_max_multipart_form_data_size) read_buffer = std::make_unique( *read_buffer_impl, settings.http_max_multipart_form_data_size, true, "the maximum size of multipart/form-data. This limit can be tuned by 'http_max_multipart_form_data_size' setting"); else read_buffer = std::move(read_buffer_impl); /// Retrieve a collection of parameters from MessageHeader Poco::Net::NameValueCollection content; std::string label; Poco::Net::MessageHeader::splitParameters(header.get("Content-Disposition"), label, content); /// Get parameters name = content.get("name", "_data"); format = params.get(name + "_format", "TabSeparated"); if (params.has(name + "_structure")) parseStructureFromStructureField(params.get(name + "_structure")); else if (params.has(name + "_types")) parseStructureFromTypesField(params.get(name + "_types")); else throw Exception("Neither structure nor types have not been provided for external table " + name + ". Use fields " + name + "_structure or " + name + "_types to do so.", ErrorCodes::BAD_ARGUMENTS); ExternalTableDataPtr data = getData(context); /// Create table NamesAndTypesList columns = sample_block.getNamesAndTypesList(); auto temporary_table = TemporaryTableHolder(context, ColumnsDescription{columns}, {}); auto storage = temporary_table.getTable(); context.addExternalTable(data->table_name, std::move(temporary_table)); BlockOutputStreamPtr output = storage->write(ASTPtr(), storage->getInMemoryMetadataPtr(), context); /// Write data data->pipe->resize(1); auto sink = std::make_shared(std::move(output)); connect(*data->pipe->getOutputPort(0), sink->getPort()); auto processors = Pipe::detachProcessors(std::move(*data->pipe)); processors.push_back(std::move(sink)); auto executor = std::make_shared(processors); executor->execute(/*num_threads = */ 1); /// We are ready to receive the next file, for this we clear all the information received clean(); } }