如何以字符串形式访问boost :: asio :: streambuf输入?

时间:2016-12-21 02:36:00

标签: c++ boost boost-asio

我正在编写一个非常简单的HTTP服务器,基于:http://www.boost.org/doc/libs/1_62_0/doc/html/boost_asio/example/cpp11/echo/async_tcp_echo_server.cpp

我尝试过很多技术从boost :: asio :: streambuf中提取数据,以便解析HTTP头。 streambuf对象似乎没有正确管理它的内存(或者,更可能的是,我误用了它)&我最终得到了一个段错误。

从代码中可以看出,建议的herehere工作方法都不起作用。我怀疑这是因为我使用boost::asio::async_read_until()来读取所有标题,而不是像大多数其他编码器一样只读一个标题。

任何建议/指示都将不胜感激。

/*
    g++ -D TRY1 -ggdb3 -I $e/boost-1.62/include /tmp/streambuf.bug.cc $e/boost-1.62/lib/libboost_system.a -D TRY1

    or

    g++ -D TRY2 -ggdb3 -I $e/boost-1.62/include /tmp/streambuf.bug.cc $e/boost-1.62/lib/libboost_system.a -D TRY2

    or

    g++ -D TRY3 -ggdb3 -I $e/boost-1.62/include /tmp/streambuf.bug.cc $e/boost-1.62/lib/libboost_system.a -D TRY3
*/

#include <cstdlib>
#include <iostream>
#include <memory>
#include <utility>
#include <boost/asio.hpp>
#include <boost/bind.hpp>

using boost::asio::ip::tcp;

class session : public std::enable_shared_from_this<session>
{
    public:
        session(tcp::socket socket) : socket_(std::move(socket)), dbg(true) {
            assert(headers.empty());
            memset(padding, 0, 10000);
            std::cout << "buffer size: " << buffer.max_size() << '\n';
        }

        void start() { readHeaders(); }

    private:
        void readHeaders() {
            if (dbg)
                std::cout << "readHeaders() start\n";
            //auto self(shared_from_this());

            boost::asio::async_read_until(socket_, buffer, "\r\n\r\n", [this](const boost::system::error_code &ec, std::size_t length) {
                if (dbg)
                    std::cout << "Read " << length << " bytes of headers in async_read_until()\n";
                if (ec)
                    throw std::runtime_error("Error code in readHeaders()");


#ifdef TRY1
                std::istream stream(&buffer);
                std::string str;
                assert(!corrupted("A1"));
                while (std::getline(stream, str)) { // seg fault! (on 3rd invocation)
                    assert(!corrupted("A2"));
                    std::cout << "str=" << str << '\n';
                    assert(!corrupted("A3"));
                }
#endif


#if 0
                std::string str;
                boost::asio::buffer_copy(boost::asio::buffer(str), buffer); // ugh, won't compile
#endif


#if 0
                std::vector<unsigned char> v(buffer.size());
                boost::asio::buffer_copy(boost::asio::buffer(v), buffer); // ugh, won't compile
                const std::string str(v.begin(), v.end());
#endif


#ifdef TRY2
                std::string str;
                auto data = buffer.data();
                assert(!corrupted("B1"));
                for (auto it = data.begin(); it != data.end(); ++it) {
                    const auto buf = *it;
                    std::cout << "buf_size=" << boost::asio::buffer_size(buf) << '\n';
                    assert(!corrupted("B2"));
                    const char *tmp = boost::asio::buffer_cast<const char *>(buf);
                    assert(!corrupted("B3"));
                    str.append(tmp); // BUG!!
                    assert(!corrupted("B4")); // fails
                }
#endif


#ifdef TRY3
                auto data = buffer.data();
                auto end = data.end();
                std::string str;
                assert(!corrupted("C1"));
                for (auto it = data.begin(); it != end; ++it) {
                    assert(!corrupted("C2"));
                    std::vector<unsigned char> v(boost::asio::buffer_size(*it));
                    assert(!corrupted("C3"));
                    boost::asio::buffer_copy(boost::asio::buffer(v), *it); // BUG!!
                    assert(!corrupted("C4")); // fails
                    str.append(v.begin(), v.end());
                    assert(!corrupted("C5"));
                }
#endif

#ifdef TRY4
                assert(!corrupted("D1"));
                const std::string str(boost::asio::buffers_begin(buffer.data()), boost::asio::buffers_end(buffer.data())); // BUG!!
                assert(!corrupted("D2")); // fails
#endif

#ifdef TRY5
                assert(!corrupted("E1"));
                const std::string str((std::istreambuf_iterator<char>(&buffer)), std::istreambuf_iterator<char>()); // seg faults!
                assert(!corrupted("E2"));
#endif

#ifdef TRY6
                boost::asio::streambuf::const_buffers_type bufs = buffer.data();
                assert(!corrupted("F1"));
                std::string str(boost::asio::buffers_begin(bufs), boost::asio::buffers_begin(bufs) + buffer.size()); // BUG!!
                assert(!corrupted("F2")); // fails
#endif

                assert(!corrupted("Z1"));
                std::cout << "str=" << str << "end of data\n";
                std::istringstream input(str);
                std::string line;
                while (std::getline(input, line)) {
                    assert(!corrupted("Z2"));
                    if (line.size() == 1)
                        continue; // blank line
                    if (line.substr(0, 3) == "GET")
                        continue; // TODO: handle properly
                    const auto idx = line.find(':');
                    assert(idx != std::string::npos);
                    const std::string key(line.begin(), line.begin() + idx);
                    const std::string val(line.begin() + idx + 2, line.end());
                    // std::cout << "key=" << key << " val=" << val << '\n';
                    assert(!corrupted("Z3"));
                    headers[key] = val;
                    assert(!corrupted("Z4"));
                }
                assert(!corrupted("Z5"));
                for (auto it3 : headers) {
                    std::cout << it3.first << '=' << it3.second << '\n';
                }

                const auto it2 = headers.find("Content Length");
                contentLength = (it2 == headers.end() ? 0 : atoi(it2->second.c_str()));
                if (contentLength > 0) {
                    const boost::system::error_code ec; // (boost::system::errc::success);
                    readBody(ec);
                }
            });
            if (dbg)
                std::cout << "readHeaders() end\n";
        }

        void readBody (const boost::system::error_code &ec) {
            if (dbg)
                std::cout << "readBody()\n";
            if (ec)
                throw std::runtime_error("Error code in readBody()");

            boost::asio::streambuf::const_buffers_type bufs = buffer.data();
            body.append(boost::asio::buffers_begin(bufs), boost::asio::buffers_begin(bufs) + buffer.size());

            if (dbg)
                std::cout << "body.size=" << body.size() << " content length=" << contentLength << '\n';

            boost::asio::async_read(socket_,
                                    buffer,
                                    boost::asio::transfer_at_least(1),
                                    boost::bind(&session::readBody, this, boost::asio::placeholders::error));
        }

        bool corrupted (const std::string s) const {
            bool b = false;
            if (strlen(padding) > 0) {
                std::cout << "buffer overflow detected @ " << s << "! padding is: " << padding << '\n';
                std::cout.flush();
                b = true;
            }
            if (headers.size() > 1000) {
                std::cout << headers.size() << " headers!!\n";
                b = true;
            }
            return b;
        }

        tcp::socket socket_;
        boost::asio::streambuf buffer;
        char padding[10000]; // $buffer appears not to manage it's memory properly. Add some padding to detect overflows.
        std::map<std::string, std::string> headers;
        uint contentLength;
        std::string body;
        const bool dbg;
};

class server
{
    public:
        server(boost::asio::io_service& io_service, short port) : acceptor_(io_service, tcp::endpoint(tcp::v4(), port)), socket_(io_service) {
            do_accept();
        }

    private:
        void do_accept() {
            acceptor_.async_accept(socket_, [this](boost::system::error_code ec) {
                if (!ec) {
                    std::cout << "Connection accepted\n";
                    std::make_shared<session>(std::move(socket_))->start();
                }
                do_accept();
            });
        }

        tcp::acceptor acceptor_;
        tcp::socket socket_;
};

int main(int argc, char* argv[])
{
    try {
        if (argc != 2) {
            std::cerr << "Usage: async_tcp_echo_server <port>\n";
            return 1;
        }

        boost::asio::io_service io_service;
        server s(io_service, std::atoi(argv[1]));

        io_service.run();
    } catch (std::exception& e) {
        std::cerr << "Exception: " << e.what() << "\n";
    }

    return 0;
}

我在Linux上使用boost v1.62,gcc v6.1(Ubuntu 12.04)。

3 个答案:

答案 0 :(得分:3)

  • 您可以阅读streambuf

    • 手动(参见文档)
    • 使用std::istream

      boost::asio::streambuf buf;
      std::istream is(&buf);
      
      // usual extraction:
      int i;
      if (is >> i) {
          // use `i`
      }         
      
      // or usual line-wise extraction:
      std::string line;
      while (std::getline(is, line)) {
          // do something with `line`
      }
      
  • 替代使用boost::asio::buffer_*函数(buffer_begin()buffer_end()buffer_copy) - How copy or reuse boost::asio::streambuf?

答案 1 :(得分:1)

boost::asio::streambufCopy a streambuf's contents to a string问题都回复了将boost::asio::streambuf source; ... std::string target{buffers_begin(source.data()), buffers_end(source.data())}; 的内容复制为字符串:

b

观察到的问题是未定义行为的结果。该程序无法满足How copy or reuse boost::asio::streambufstreambuf参数的生命周期要求,因为streambuf在调用完成处理程序之前被销毁:

  

[...] streambuf的所有权由调用者保留,调用者必须保证它在调用处理程序之前一直有效。

在这种情况下,sessionsession的数据成员,session个对象由共享指针管理。管理std::make_shared<session>(std::move(socket_))->start(); 的唯一共享指针在以下表达式中创建和销毁:

start()

async_read_until()内,启动start()操作。但是,在返回表单session后,buffer的{​​{1}}会在调用async_read_until()完成处理程序之前销毁,违反了生命周期要求

官方Asio示例使用的惯用解决方案是在完成处理程序的lambda捕获中捕获shared_from_this()的结果。这可以保证session的生命周期至少与完成处理程序一样长。

auto self(shared_from_this());
async_read_until(socket_, buffer_, ...,
  [this, self](boost::system::error_code& ec, std::size_t length)
  {
    // `self` keeps the `session` alive for the lifetime of the
    // handler.  If more async operations are initiated from within
    // this handler, then the completion handlers should capture
    // `self` as well.
    ...
  });

答案 2 :(得分:0)

你的问题的确切答案给了他们。下面是我目前用于解析标题的一些伪代码。

// This is where to store headers.
_STL::map<_STL::string, _STL::string> m_headers;

// buffer is of type asio::streambuf and contains response from asio::async_read_until
_STL::istream response_stream_headers(&buffer);

// Some helper variables.
_STL::string header, header_name, header_value;

while (true) {
  _STL::getline(response_stream_headers, header, '\r');

  // Remove \n symbol from the stream.
  response_stream_headers.get();

  if (header == "") {
    // We reached end of headers, there might be still some more data!!
    break;
  }

  // Parse header to key->value
  size_t separator_pos = header.find(':');
  if (separator_pos != _STL::string::npos) {
    header_name = header.substr(0, separator_pos);

    if (separator_pos < header.length() - 1) {
      header_value = header.substr(separator_pos + 1);
    }
    else {
      header_value = "";
    }

    boost::trim_left(header_value);
    m_headers[name] = value;
  }
}

// Parsing is done, but some of the request response could have been reed by 
// asio::async_read_until, so whe read response_stream_headers untill end.
// You should use body_response_start as the begining of your response.
std::string body_response_start(std::istreambuf_iterator<char>(response_stream_headers), {});