提高批量请求的野兽内存使用率
boost beast memory usage for bulk requests
我运行这个
boost-beast-client-async-ssl 示例,没关系。但是,如果我同时创建 10000 个会话,我的程序内存使用量会增长到 400 MB,而且永远不会下降。我会在没有 ssl(简单的 http)的情况下进行测试,并且没有长大的记忆。
问:openssl 有什么问题?
有我的 main 函数。
//up boost-beast-client-async-ssl session code.
struct io_context_runner
{
boost::asio::io_context * ioc;
void operator()()const
{
try{
boost::asio::io_context::work w(*ioc);
ioc->run();
}catch(std::exception& e){
fprintf(stderr, "e: %s\n", e.what());
}
}
};
int main(int argc, char* argv[] ){
try
{
int total_run = 1;
if (argc > 1) total_run = atoi(argv[1]);
const char* const host = "104.236.162.70" ;// IP of isocpp.org
const char* const port = "443"; //
const char* const target= "/" ; //
std::string const body = ""; //
int version = 11;
// The io_context is required for all I/O
boost::asio::io_context ioc;
// The SSL context is required, and holds certificates
ssl::context ctx{ssl::context::sslv23_client};
// This holds the root certificate used for verification
load_root_certificates(ctx);
typedef std::shared_ptr< async_http_ssl::session > pointer;
for(int i = 0; i < total_run; ++i){
pointer s = std::make_shared< async_http_ssl::session >(ioc , ctx ) ;
usleep( 1000000 / total_run ) ;
s->run( host, port, target, version ) ;
}
// Launch the asynchronous operation
//std::make_shared<session>(ioc, ctx)->run(host, port, target, version);
// Run the I/O service. The call will return when
// the get operation is complete.
std::thread t{ io_context_runner{ &ioc } } ;
t.join();
// If we get here then the connection is closed gracefully
}
catch(std::exception const& e)
{
std::cerr << "Error: " << e.what() << std::endl;
return EXIT_FAILURE;
}
return EXIT_SUCCESS ;
}
编辑:ubuntu 14.04,boost 1.66,g++ 4.9.4。 OpenSSL 1.0.1f 2014 年 1 月 6 日。
EDIT2:根据 question malloc_trim 释放( return 回到 OS )大量未使用的内存。如果 boost asio 本身支持 malloc_trim 用于 unix 系统上的 ssl 连接,那将是最好的!
您改编该示例的方式存在几个问题:
- 工作线程使用
work
实例锁定 io_service,因此它永远不会完成
- 你
usleep
在生成异步任务之前的某个时间,但你 永远不会 运行 任何任务 在循环完成之前... 这意味着所有延迟都在开始 any 工作之前完成。
这是我的建议:
- 运行启动异步任务前的服务
- 有 1 个
work
实例锁定服务,以防服务在发布下一个 http 请求之前变得空闲
- 不要在工作线程内锁定
work
生活在 Coliru
#include "example/common/root_certificates.hpp"
#include <boost/beast.hpp>
#include <boost/asio.hpp>
using tcp = boost::asio::ip::tcp; // from <boost/asio/ip/tcp.hpp>
namespace ssl = boost::asio::ssl; // from <boost/asio/ssl.hpp>
namespace http = boost::beast::http; // from <boost/beast/http.hpp>
//------------------------------------------------------------------------------
// Report a failure
void
fail(boost::system::error_code ec, char const* what)
{
std::cerr << what << ": " << ec.message() << "\n";
}
// Performs an HTTP GET and prints the response
class session : public std::enable_shared_from_this<session>
{
tcp::resolver resolver_;
ssl::stream<tcp::socket> stream_;
boost::beast::flat_buffer buffer_; // (Must persist between reads)
http::request<http::empty_body> req_;
http::response<http::string_body> res_;
public:
// Resolver and stream require an io_context
explicit
session(boost::asio::io_context& ioc, ssl::context& ctx)
: resolver_(ioc)
, stream_(ioc, ctx)
{
}
// Start the asynchronous operation
void
run(
char const* host,
char const* port,
char const* target,
int version)
{
// Set SNI Hostname (many hosts need this to handshake successfully)
if(! SSL_set_tlsext_host_name(stream_.native_handle(), host))
{
boost::system::error_code ec{static_cast<int>(::ERR_get_error()), boost::asio::error::get_ssl_category()};
std::cerr << ec.message() << "\n";
return;
}
// Set up an HTTP GET request message
req_.version(version);
req_.method(http::verb::get);
req_.target(target);
req_.set(http::field::host, host);
req_.set(http::field::user_agent, BOOST_BEAST_VERSION_STRING);
// Look up the domain name
resolver_.async_resolve(
host,
port,
std::bind(
&session::on_resolve,
shared_from_this(),
std::placeholders::_1,
std::placeholders::_2));
}
void
on_resolve(
boost::system::error_code ec,
tcp::resolver::results_type results)
{
if(ec)
return fail(ec, "resolve");
// Make the connection on the IP address we get from a lookup
boost::asio::async_connect(
stream_.next_layer(),
results.begin(),
results.end(),
std::bind(
&session::on_connect,
shared_from_this(),
std::placeholders::_1));
}
void
on_connect(boost::system::error_code ec)
{
if(ec)
return fail(ec, "connect");
// Perform the SSL handshake
stream_.async_handshake(
ssl::stream_base::client,
std::bind(
&session::on_handshake,
shared_from_this(),
std::placeholders::_1));
}
void
on_handshake(boost::system::error_code ec)
{
if(ec)
return fail(ec, "handshake");
// Send the HTTP request to the remote host
http::async_write(stream_, req_,
std::bind(
&session::on_write,
shared_from_this(),
std::placeholders::_1,
std::placeholders::_2));
}
void
on_write(
boost::system::error_code ec,
std::size_t bytes_transferred)
{
boost::ignore_unused(bytes_transferred);
if(ec)
return fail(ec, "write");
// Receive the HTTP response
http::async_read(stream_, buffer_, res_,
std::bind(
&session::on_read,
shared_from_this(),
std::placeholders::_1,
std::placeholders::_2));
}
void
on_read(
boost::system::error_code ec,
std::size_t bytes_transferred)
{
boost::ignore_unused(bytes_transferred);
if(ec)
return fail(ec, "read");
// Write the message to standard out
//std::cout << res_ << std::endl;
// Gracefully close the stream
stream_.async_shutdown(
std::bind(
&session::on_shutdown,
shared_from_this(),
std::placeholders::_1));
}
void
on_shutdown(boost::system::error_code ec)
{
if(ec == boost::asio::error::eof)
{
// Rationale:
//
ec.assign(0, ec.category());
}
if(ec)
return fail(ec, "shutdown");
// If we get here then the connection is closed gracefully
}
};
//up boost-beast-client-async-ssl session code.
struct io_context_runner
{
boost::asio::io_context& ioc;
void operator()()const
{
try{
ioc.run();
}catch(std::exception& e){
fprintf(stderr, "e: %s\n", e.what());
}
}
};
namespace async_http_ssl {
using ::session;
}
#include <thread>
int main(int argc, char *argv[]) {
// The io_context is required for all I/O
boost::asio::io_context ioc;
std::thread t;
try {
// Run the I/O service. The call will return when all work is complete
boost::asio::io_context::work w(ioc);
t = std::thread { io_context_runner{ioc} };
int total_run = 1;
if (argc > 1)
total_run = atoi(argv[1]);
#if 0
auto host = "104.236.162.70"; // IP of isocpp.org
auto port = "443"; //
auto target = "/"; //
#else
auto host = "127.0.0.1";
auto port = "443";
auto target = "/BBB/http_client_async_ssl.cpp";
#endif
std::string const body = ""; //
int version = 11;
// The SSL context is required, and holds certificates
ssl::context ctx{ssl::context::sslv23_client};
// This holds the root certificate used for verification
load_root_certificates(ctx);
typedef std::shared_ptr<async_http_ssl::session> pointer;
for (int i = 0; i < total_run; ++i) {
pointer s = std::make_shared<async_http_ssl::session>(ioc, ctx);
usleep(1000000 / total_run);
s->run(host, port, target, version);
}
} catch (std::exception const &e) {
std::cerr << "Error: " << e.what() << std::endl;
return EXIT_FAILURE;
}
if (t.joinable())
t.join();
// If we get here then the connections have been closed gracefully
}
在我的系统上,使用 1 个连接进行内存分析:
有 100 个连接:
有 1000 个连接:
分析
这是什么意思?发送更多请求时,Beast 似乎仍在逐渐使用更多内存,对吗?
嗯,不。问题是您开始请求的速度快于完成请求的速度。因此,内存负载增加主要是因为许多 session
个实例在给定时间存在。完成后,他们将自动释放资源(由于使用 shared_ptr<session>
)。
按顺序发出请求
为了说明问题,这里有一个修改版本,它接受 on_completion_
会话处理程序:
std::function<void()> on_complete_;
// Resolver and stream require an io_context
template <typename Handler>
explicit
session(boost::asio::io_context& ioc, ssl::context& ctx, Handler&& handler)
: resolver_(ioc)
, stream_(ioc, ctx)
, on_complete_(std::forward<Handler>(handler))
{
}
~session() {
if (on_complete_) on_complete_();
}
现在您可以将主程序逻辑重写为异步操作 chain:
struct Tester {
boost::asio::io_context ioc;
boost::optional<boost::asio::io_context::work> work{ioc};
std::thread t { io_context_runner{ioc} };
ssl::context ctx{ssl::context::sslv23_client};
Tester() {
load_root_certificates(ctx);
}
void run(int remaining = 1) {
if (remaining <= 0)
return;
auto s = std::make_shared<session>(ioc, ctx, [=] { run(remaining - 1); });
s->run("127.0.0.1", "443", "/BBB/http_client_async_ssl.cpp", 11);
}
~Tester() {
work.reset();
if (t.joinable()) t.join();
}
};
int main(int argc, char *argv[]) {
Tester tester;
tester.run(argc>1? atoi(argv[1]):1);
}
使用这个程序 (Full Code On Coliru),我们得到更稳定的结果:
1 个请求:
100 个请求:
1000 次请求:
正在恢复吞吐量
嗯,这有点太保守了,发送 许多 请求可能会变得非常慢。 一些并发怎么样?简单:
int main(int argc, char *argv[]) {
int const total = argc>1? atoi(argv[1]) : 1;
int const concurrent = argc>2? atoi(argv[2]) : 1;
{
std::vector<Tester> chains(concurrent);
for (auto& chain : chains)
chain.run(total / concurrent);
}
std::cout << "All done\n";
}
就是这样!现在,我们可以有 concurrent
个单独的执行链来服务于 ~total 请求。查看 运行 时间的差异:
$ time ./sotest 1000
All done
real 0m53.295s
user 0m13.124s
sys 0m0.232s
$ time ./sotest 1000 10
All done
real 0m8.808s
user 0m8.884s
sys 0m1.096s
随着内存使用情况继续保持健康:
我运行这个 boost-beast-client-async-ssl 示例,没关系。但是,如果我同时创建 10000 个会话,我的程序内存使用量会增长到 400 MB,而且永远不会下降。我会在没有 ssl(简单的 http)的情况下进行测试,并且没有长大的记忆。
问:openssl 有什么问题?
有我的 main 函数。
//up boost-beast-client-async-ssl session code.
struct io_context_runner
{
boost::asio::io_context * ioc;
void operator()()const
{
try{
boost::asio::io_context::work w(*ioc);
ioc->run();
}catch(std::exception& e){
fprintf(stderr, "e: %s\n", e.what());
}
}
};
int main(int argc, char* argv[] ){
try
{
int total_run = 1;
if (argc > 1) total_run = atoi(argv[1]);
const char* const host = "104.236.162.70" ;// IP of isocpp.org
const char* const port = "443"; //
const char* const target= "/" ; //
std::string const body = ""; //
int version = 11;
// The io_context is required for all I/O
boost::asio::io_context ioc;
// The SSL context is required, and holds certificates
ssl::context ctx{ssl::context::sslv23_client};
// This holds the root certificate used for verification
load_root_certificates(ctx);
typedef std::shared_ptr< async_http_ssl::session > pointer;
for(int i = 0; i < total_run; ++i){
pointer s = std::make_shared< async_http_ssl::session >(ioc , ctx ) ;
usleep( 1000000 / total_run ) ;
s->run( host, port, target, version ) ;
}
// Launch the asynchronous operation
//std::make_shared<session>(ioc, ctx)->run(host, port, target, version);
// Run the I/O service. The call will return when
// the get operation is complete.
std::thread t{ io_context_runner{ &ioc } } ;
t.join();
// If we get here then the connection is closed gracefully
}
catch(std::exception const& e)
{
std::cerr << "Error: " << e.what() << std::endl;
return EXIT_FAILURE;
}
return EXIT_SUCCESS ;
}
编辑:ubuntu 14.04,boost 1.66,g++ 4.9.4。 OpenSSL 1.0.1f 2014 年 1 月 6 日。
EDIT2:根据
您改编该示例的方式存在几个问题:
- 工作线程使用
work
实例锁定 io_service,因此它永远不会完成 - 你
usleep
在生成异步任务之前的某个时间,但你 永远不会 运行 任何任务 在循环完成之前... 这意味着所有延迟都在开始 any 工作之前完成。
这是我的建议:
- 运行启动异步任务前的服务
- 有 1 个
work
实例锁定服务,以防服务在发布下一个 http 请求之前变得空闲 - 不要在工作线程内锁定
work
生活在 Coliru
#include "example/common/root_certificates.hpp"
#include <boost/beast.hpp>
#include <boost/asio.hpp>
using tcp = boost::asio::ip::tcp; // from <boost/asio/ip/tcp.hpp>
namespace ssl = boost::asio::ssl; // from <boost/asio/ssl.hpp>
namespace http = boost::beast::http; // from <boost/beast/http.hpp>
//------------------------------------------------------------------------------
// Report a failure
void
fail(boost::system::error_code ec, char const* what)
{
std::cerr << what << ": " << ec.message() << "\n";
}
// Performs an HTTP GET and prints the response
class session : public std::enable_shared_from_this<session>
{
tcp::resolver resolver_;
ssl::stream<tcp::socket> stream_;
boost::beast::flat_buffer buffer_; // (Must persist between reads)
http::request<http::empty_body> req_;
http::response<http::string_body> res_;
public:
// Resolver and stream require an io_context
explicit
session(boost::asio::io_context& ioc, ssl::context& ctx)
: resolver_(ioc)
, stream_(ioc, ctx)
{
}
// Start the asynchronous operation
void
run(
char const* host,
char const* port,
char const* target,
int version)
{
// Set SNI Hostname (many hosts need this to handshake successfully)
if(! SSL_set_tlsext_host_name(stream_.native_handle(), host))
{
boost::system::error_code ec{static_cast<int>(::ERR_get_error()), boost::asio::error::get_ssl_category()};
std::cerr << ec.message() << "\n";
return;
}
// Set up an HTTP GET request message
req_.version(version);
req_.method(http::verb::get);
req_.target(target);
req_.set(http::field::host, host);
req_.set(http::field::user_agent, BOOST_BEAST_VERSION_STRING);
// Look up the domain name
resolver_.async_resolve(
host,
port,
std::bind(
&session::on_resolve,
shared_from_this(),
std::placeholders::_1,
std::placeholders::_2));
}
void
on_resolve(
boost::system::error_code ec,
tcp::resolver::results_type results)
{
if(ec)
return fail(ec, "resolve");
// Make the connection on the IP address we get from a lookup
boost::asio::async_connect(
stream_.next_layer(),
results.begin(),
results.end(),
std::bind(
&session::on_connect,
shared_from_this(),
std::placeholders::_1));
}
void
on_connect(boost::system::error_code ec)
{
if(ec)
return fail(ec, "connect");
// Perform the SSL handshake
stream_.async_handshake(
ssl::stream_base::client,
std::bind(
&session::on_handshake,
shared_from_this(),
std::placeholders::_1));
}
void
on_handshake(boost::system::error_code ec)
{
if(ec)
return fail(ec, "handshake");
// Send the HTTP request to the remote host
http::async_write(stream_, req_,
std::bind(
&session::on_write,
shared_from_this(),
std::placeholders::_1,
std::placeholders::_2));
}
void
on_write(
boost::system::error_code ec,
std::size_t bytes_transferred)
{
boost::ignore_unused(bytes_transferred);
if(ec)
return fail(ec, "write");
// Receive the HTTP response
http::async_read(stream_, buffer_, res_,
std::bind(
&session::on_read,
shared_from_this(),
std::placeholders::_1,
std::placeholders::_2));
}
void
on_read(
boost::system::error_code ec,
std::size_t bytes_transferred)
{
boost::ignore_unused(bytes_transferred);
if(ec)
return fail(ec, "read");
// Write the message to standard out
//std::cout << res_ << std::endl;
// Gracefully close the stream
stream_.async_shutdown(
std::bind(
&session::on_shutdown,
shared_from_this(),
std::placeholders::_1));
}
void
on_shutdown(boost::system::error_code ec)
{
if(ec == boost::asio::error::eof)
{
// Rationale:
//
ec.assign(0, ec.category());
}
if(ec)
return fail(ec, "shutdown");
// If we get here then the connection is closed gracefully
}
};
//up boost-beast-client-async-ssl session code.
struct io_context_runner
{
boost::asio::io_context& ioc;
void operator()()const
{
try{
ioc.run();
}catch(std::exception& e){
fprintf(stderr, "e: %s\n", e.what());
}
}
};
namespace async_http_ssl {
using ::session;
}
#include <thread>
int main(int argc, char *argv[]) {
// The io_context is required for all I/O
boost::asio::io_context ioc;
std::thread t;
try {
// Run the I/O service. The call will return when all work is complete
boost::asio::io_context::work w(ioc);
t = std::thread { io_context_runner{ioc} };
int total_run = 1;
if (argc > 1)
total_run = atoi(argv[1]);
#if 0
auto host = "104.236.162.70"; // IP of isocpp.org
auto port = "443"; //
auto target = "/"; //
#else
auto host = "127.0.0.1";
auto port = "443";
auto target = "/BBB/http_client_async_ssl.cpp";
#endif
std::string const body = ""; //
int version = 11;
// The SSL context is required, and holds certificates
ssl::context ctx{ssl::context::sslv23_client};
// This holds the root certificate used for verification
load_root_certificates(ctx);
typedef std::shared_ptr<async_http_ssl::session> pointer;
for (int i = 0; i < total_run; ++i) {
pointer s = std::make_shared<async_http_ssl::session>(ioc, ctx);
usleep(1000000 / total_run);
s->run(host, port, target, version);
}
} catch (std::exception const &e) {
std::cerr << "Error: " << e.what() << std::endl;
return EXIT_FAILURE;
}
if (t.joinable())
t.join();
// If we get here then the connections have been closed gracefully
}
在我的系统上,使用 1 个连接进行内存分析:
有 100 个连接:
有 1000 个连接:
分析
这是什么意思?发送更多请求时,Beast 似乎仍在逐渐使用更多内存,对吗?
嗯,不。问题是您开始请求的速度快于完成请求的速度。因此,内存负载增加主要是因为许多 session
个实例在给定时间存在。完成后,他们将自动释放资源(由于使用 shared_ptr<session>
)。
按顺序发出请求
为了说明问题,这里有一个修改版本,它接受 on_completion_
会话处理程序:
std::function<void()> on_complete_;
// Resolver and stream require an io_context
template <typename Handler>
explicit
session(boost::asio::io_context& ioc, ssl::context& ctx, Handler&& handler)
: resolver_(ioc)
, stream_(ioc, ctx)
, on_complete_(std::forward<Handler>(handler))
{
}
~session() {
if (on_complete_) on_complete_();
}
现在您可以将主程序逻辑重写为异步操作 chain:
struct Tester {
boost::asio::io_context ioc;
boost::optional<boost::asio::io_context::work> work{ioc};
std::thread t { io_context_runner{ioc} };
ssl::context ctx{ssl::context::sslv23_client};
Tester() {
load_root_certificates(ctx);
}
void run(int remaining = 1) {
if (remaining <= 0)
return;
auto s = std::make_shared<session>(ioc, ctx, [=] { run(remaining - 1); });
s->run("127.0.0.1", "443", "/BBB/http_client_async_ssl.cpp", 11);
}
~Tester() {
work.reset();
if (t.joinable()) t.join();
}
};
int main(int argc, char *argv[]) {
Tester tester;
tester.run(argc>1? atoi(argv[1]):1);
}
使用这个程序 (Full Code On Coliru),我们得到更稳定的结果:
1 个请求:
100 个请求:
1000 次请求:
正在恢复吞吐量
嗯,这有点太保守了,发送 许多 请求可能会变得非常慢。 一些并发怎么样?简单:
int main(int argc, char *argv[]) {
int const total = argc>1? atoi(argv[1]) : 1;
int const concurrent = argc>2? atoi(argv[2]) : 1;
{
std::vector<Tester> chains(concurrent);
for (auto& chain : chains)
chain.run(total / concurrent);
}
std::cout << "All done\n";
}
就是这样!现在,我们可以有 concurrent
个单独的执行链来服务于 ~total 请求。查看 运行 时间的差异:
$ time ./sotest 1000
All done
real 0m53.295s
user 0m13.124s
sys 0m0.232s
$ time ./sotest 1000 10
All done
real 0m8.808s
user 0m8.884s
sys 0m1.096s
随着内存使用情况继续保持健康: