2024-05-03 14:48:50 +00:00
|
|
|
#include <Common/proxyConfigurationToPocoProxyConfig.h>
|
|
|
|
|
|
|
|
|
2024-06-04 18:04:14 +00:00
|
|
|
#include <Common/StringUtils.h>
|
2024-05-10 20:20:36 +00:00
|
|
|
#include <base/find_symbols.h>
|
2024-05-03 14:48:50 +00:00
|
|
|
|
|
|
|
#pragma clang diagnostic push
|
|
|
|
#pragma clang diagnostic ignored "-Wzero-as-null-pointer-constant"
|
|
|
|
#pragma clang diagnostic ignored "-Wgnu-anonymous-struct"
|
|
|
|
#pragma clang diagnostic ignored "-Wnested-anon-types"
|
|
|
|
#pragma clang diagnostic ignored "-Wunused-parameter"
|
|
|
|
#pragma clang diagnostic ignored "-Wshadow-field-in-constructor"
|
|
|
|
#pragma clang diagnostic ignored "-Wdtor-name"
|
|
|
|
#include <re2/re2.h>
|
|
|
|
#pragma clang diagnostic pop
|
|
|
|
|
|
|
|
namespace DB
|
|
|
|
{
|
|
|
|
|
2024-05-06 13:38:10 +00:00
|
|
|
namespace
|
|
|
|
{
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Copy `curl` behavior instead of `wget` as it seems to be more flexible.
|
|
|
|
* `curl` strips leading dot and accepts url gitlab.com as a match for no_proxy .gitlab.com,
|
|
|
|
* while `wget` does an exact match.
|
|
|
|
* */
|
|
|
|
std::string buildPocoRegexpEntryWithoutLeadingDot(const std::string & host)
|
|
|
|
{
|
|
|
|
std::string_view view_without_leading_dot = host;
|
|
|
|
if (host[0] == '.')
|
|
|
|
{
|
|
|
|
view_without_leading_dot = std::string_view {host.begin() + 1u, host.end()};
|
|
|
|
}
|
|
|
|
|
|
|
|
return RE2::QuoteMeta(view_without_leading_dot);
|
|
|
|
}
|
|
|
|
|
2024-06-05 12:52:42 +00:00
|
|
|
}
|
|
|
|
|
2024-05-03 14:48:50 +00:00
|
|
|
/*
|
|
|
|
* Even though there is not an RFC that defines NO_PROXY, it is usually a comma-separated list of domains.
|
|
|
|
* Different tools implement their own versions of `NO_PROXY` support. Some support CIDR blocks, some support wildcard etc.
|
|
|
|
* Opting for a simple implementation that covers most use cases:
|
|
|
|
* * Support only single wildcard * (match anything)
|
2024-05-06 19:53:36 +00:00
|
|
|
* * Match subdomains
|
|
|
|
* * Strip leading dots
|
2024-05-03 14:48:50 +00:00
|
|
|
* * No regex
|
|
|
|
* * No CIDR blocks
|
|
|
|
* * No fancy stuff about loopback IPs
|
|
|
|
* https://about.gitlab.com/blog/2021/01/27/we-need-to-talk-no-proxy/
|
|
|
|
* Open for discussions
|
|
|
|
* */
|
2024-05-10 20:20:36 +00:00
|
|
|
std::string buildPocoNonProxyHosts(const std::string & no_proxy_hosts_string)
|
2024-05-03 14:48:50 +00:00
|
|
|
{
|
2024-05-06 13:38:10 +00:00
|
|
|
static constexpr auto OR_SEPARATOR = "|";
|
|
|
|
static constexpr auto MATCH_ANYTHING = R"((.*?))";
|
|
|
|
static constexpr auto MATCH_SUBDOMAINS_REGEX = R"((?:.*\.)?)";
|
|
|
|
|
2024-05-10 20:20:36 +00:00
|
|
|
bool match_any_host = no_proxy_hosts_string.size() == 1 && no_proxy_hosts_string[0] == '*';
|
2024-05-03 14:48:50 +00:00
|
|
|
|
|
|
|
if (match_any_host)
|
|
|
|
{
|
2024-05-06 13:38:10 +00:00
|
|
|
return MATCH_ANYTHING;
|
2024-05-03 14:48:50 +00:00
|
|
|
}
|
|
|
|
|
2024-05-10 20:20:36 +00:00
|
|
|
std::vector<std::string> no_proxy_hosts;
|
|
|
|
splitInto<','>(no_proxy_hosts, no_proxy_hosts_string);
|
2024-05-03 14:48:50 +00:00
|
|
|
|
|
|
|
bool first = true;
|
|
|
|
std::string result;
|
|
|
|
|
2024-05-10 20:20:36 +00:00
|
|
|
for (auto & host : no_proxy_hosts)
|
2024-05-03 14:48:50 +00:00
|
|
|
{
|
|
|
|
trim(host);
|
|
|
|
|
2024-05-06 19:53:36 +00:00
|
|
|
if (host.empty())
|
2024-05-03 14:48:50 +00:00
|
|
|
{
|
2024-05-06 19:53:36 +00:00
|
|
|
continue;
|
|
|
|
}
|
2024-05-03 14:48:50 +00:00
|
|
|
|
2024-05-06 19:53:36 +00:00
|
|
|
if (!first)
|
|
|
|
{
|
|
|
|
result.append(OR_SEPARATOR);
|
|
|
|
}
|
2024-05-06 13:38:10 +00:00
|
|
|
|
2024-05-06 19:53:36 +00:00
|
|
|
auto escaped_host_without_leading_dot = buildPocoRegexpEntryWithoutLeadingDot(host);
|
2024-05-06 13:38:10 +00:00
|
|
|
|
2024-05-06 19:53:36 +00:00
|
|
|
result.append(MATCH_SUBDOMAINS_REGEX);
|
|
|
|
result.append(escaped_host_without_leading_dot);
|
|
|
|
|
|
|
|
first = false;
|
2024-05-03 14:48:50 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
return result;
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Converts a `DB::ProxyConfiguration` into the proxy configuration structure used by
/// `Poco::Net::HTTPClientSession`.
///
/// Both protocol fields are converted to their string form with `ProxyConfiguration::protocolToString`.
/// `no_proxy_hosts` is copied into `nonProxyHosts` as is; no pattern is built here.
Poco::Net::HTTPClientSession::ProxyConfig proxyConfigurationToPocoProxyConfig(const DB::ProxyConfiguration & proxy_configuration)
{
    Poco::Net::HTTPClientSession::ProxyConfig converted;

    /// Where the proxy lives and which hosts should not go through it.
    converted.host = proxy_configuration.host;
    converted.port = proxy_configuration.port;
    converted.nonProxyHosts = proxy_configuration.no_proxy_hosts;

    /// How to talk to the proxy.
    converted.tunnel = proxy_configuration.tunneling;
    converted.protocol = DB::ProxyConfiguration::protocolToString(proxy_configuration.protocol);
    converted.originalRequestProtocol = DB::ProxyConfiguration::protocolToString(proxy_configuration.original_request_protocol);

    return converted;
}
|
|
|
|
|
|
|
|
}
|