2008-01-12 10:36:03 +01:00
|
|
|
/*
|
|
|
|
|
2016-01-18 00:57:46 +01:00
|
|
|
Copyright (c) 2008-2016, Arvid Norberg
|
2008-01-12 10:36:03 +01:00
|
|
|
All rights reserved.
|
|
|
|
|
|
|
|
Redistribution and use in source and binary forms, with or without
|
|
|
|
modification, are permitted provided that the following conditions
|
|
|
|
are met:
|
|
|
|
|
|
|
|
* Redistributions of source code must retain the above copyright
|
|
|
|
notice, this list of conditions and the following disclaimer.
|
|
|
|
* Redistributions in binary form must reproduce the above copyright
|
|
|
|
notice, this list of conditions and the following disclaimer in
|
|
|
|
the documentation and/or other materials provided with the distribution.
|
|
|
|
* Neither the name of the author nor the names of its
|
|
|
|
contributors may be used to endorse or promote products derived
|
|
|
|
from this software without specific prior written permission.
|
|
|
|
|
|
|
|
THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
|
|
|
|
AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
|
|
|
|
IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
|
|
|
|
ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
|
|
|
|
LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
|
|
|
|
CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
|
|
|
|
SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
|
|
|
|
INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
|
|
|
|
CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
|
|
|
|
ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
|
|
|
|
POSSIBILITY OF SUCH DAMAGE.
|
|
|
|
|
|
|
|
*/
|
|
|
|
|
|
|
|
#ifndef TORRENT_HTTP_PARSER_HPP_INCLUDED
|
|
|
|
#define TORRENT_HTTP_PARSER_HPP_INCLUDED
|
|
|
|
|
|
|
|
#include <map>
|
|
|
|
#include <string>
|
|
|
|
#include <utility>
|
2011-01-06 05:08:57 +01:00
|
|
|
#include <vector>
|
2016-06-18 20:01:38 +02:00
|
|
|
#include <cstdint>
|
2016-06-20 17:32:06 +02:00
|
|
|
#include <tuple>
|
2008-01-12 10:36:03 +01:00
|
|
|
|
|
|
|
#include "libtorrent/config.hpp"
|
2017-08-28 11:37:53 +02:00
|
|
|
#include "libtorrent/span.hpp"
|
2017-11-09 23:43:26 +01:00
|
|
|
#include "libtorrent/string_view.hpp"
|
2017-11-16 00:25:46 +01:00
|
|
|
#include "libtorrent/time.hpp" // for seconds32
|
|
|
|
#include "libtorrent/optional.hpp"
|
2008-01-12 10:36:03 +01:00
|
|
|
|
2017-04-12 19:00:57 +02:00
|
|
|
namespace libtorrent {
|
|
|
|
|
2010-09-21 08:34:13 +02:00
|
|
|
// return true if the status code is 200, 206, or in the 300-400 range
|
2015-03-16 05:38:28 +01:00
|
|
|
// http_status is the numeric HTTP status code to classify.
// NOTE(review): presumably the value reported by
// http_parser::status_code() -- confirm against callers.
TORRENT_EXTRA_EXPORT bool is_ok_status(int http_status);
|
2010-09-21 08:34:13 +02:00
|
|
|
|
|
|
|
// return true if the status code is a redirect
|
2015-03-16 05:38:28 +01:00
|
|
|
// http_status is the numeric HTTP status code to classify.
// NOTE(review): the exact set of codes treated as redirects is defined
// by the implementation, which is not visible in this header.
TORRENT_EXTRA_EXPORT bool is_redirect(int http_status);
|
2010-09-21 08:34:13 +02:00
|
|
|
|
2014-09-01 10:59:12 +02:00
|
|
|
// takes the referring URL and a redirect location, both by value, and
// returns a string.
// NOTE(review): presumably the result is `location` resolved against
// `referrer` (e.g. for relative redirects) -- confirm against the
// implementation.
TORRENT_EXTRA_EXPORT std::string resolve_redirect_location(std::string referrer, std::string location);
|
|
|
|
|
2012-03-20 04:53:07 +01:00
|
|
|
class TORRENT_EXTRA_EXPORT http_parser
|
2008-01-12 10:36:03 +01:00
|
|
|
{
|
|
|
|
public:
|
2011-03-24 17:46:26 +01:00
|
|
|
enum flags_t { dont_parse_chunks = 1 };
|
2016-10-08 20:07:11 +02:00
|
|
|
explicit http_parser(int flags = 0);
|
2012-03-19 07:06:52 +01:00
|
|
|
~http_parser();
|
2017-11-09 23:43:26 +01:00
|
|
|
std::string const& header(string_view key) const;
|
2017-11-16 00:25:46 +01:00
|
|
|
boost::optional<seconds32> header_duration(string_view key) const;
|
2008-01-12 10:36:03 +01:00
|
|
|
std::string const& protocol() const { return m_protocol; }
|
|
|
|
int status_code() const { return m_status_code; }
|
|
|
|
std::string const& method() const { return m_method; }
|
|
|
|
std::string const& path() const { return m_path; }
|
|
|
|
std::string const& message() const { return m_server_message; }
|
2016-07-26 08:15:31 +02:00
|
|
|
span<char const> get_body() const;
|
2008-01-12 10:36:03 +01:00
|
|
|
bool header_finished() const { return m_state == read_body; }
|
|
|
|
bool finished() const { return m_finished; }
|
2016-07-24 09:52:20 +02:00
|
|
|
std::tuple<int, int> incoming(span<char const> recv_buffer
|
2008-01-12 10:36:03 +01:00
|
|
|
, bool& error);
|
|
|
|
int body_start() const { return m_body_start_pos; }
|
2016-06-18 20:01:38 +02:00
|
|
|
std::int64_t content_length() const { return m_content_length; }
|
|
|
|
std::pair<std::int64_t, std::int64_t> content_range() const
|
2009-04-12 19:52:25 +02:00
|
|
|
{ return std::make_pair(m_range_start, m_range_end); }
|
2008-01-12 10:36:03 +01:00
|
|
|
|
2010-10-27 08:39:18 +02:00
|
|
|
// returns true if this response is using chunked encoding.
|
|
|
|
// in this case the body is split up into chunks. You need
|
|
|
|
// to call parse_chunk_header() for each chunk, starting with
|
|
|
|
// the start of the body.
|
|
|
|
bool chunked_encoding() const { return m_chunked_encoding; }
|
|
|
|
|
2012-05-16 07:32:12 +02:00
|
|
|
// removes the chunk headers from the supplied buffer. The buffer
|
|
|
|
// must be the stream received from the http server this parser
|
|
|
|
// instanced parsed. It will use the internal chunk list to determine
|
|
|
|
// where the chunks are in the buffer. It returns the new length of
|
|
|
|
// the buffer
|
2017-09-04 00:13:08 +02:00
|
|
|
span<char> collapse_chunk_headers(span<char> buffer) const;
|
2012-05-16 07:32:12 +02:00
|
|
|
|
2010-10-27 08:39:18 +02:00
|
|
|
// returns false if the buffer doesn't contain a complete
|
|
|
|
// chunk header. In this case, call the function again with
|
|
|
|
// a bigger buffer once more bytes have been received.
|
|
|
|
// chunk_size is filled in with the number of bytes in the
|
|
|
|
// chunk that follows. 0 means the response terminated. In
|
|
|
|
// this case there might be additional headers in the parser
|
|
|
|
// object.
|
|
|
|
// header_size is filled in with the number of bytes the header
|
|
|
|
// itself was. Skip this number of bytes to get to the actual
|
|
|
|
// chunk data.
|
|
|
|
// if the function returns false, the chunk size and header
|
|
|
|
// size may still have been modified, but their values are
|
|
|
|
// undefined
|
2016-07-24 09:52:20 +02:00
|
|
|
bool parse_chunk_header(span<char const> buf
|
2016-06-18 20:01:38 +02:00
|
|
|
, std::int64_t* chunk_size, int* header_size);
|
2010-10-27 08:39:18 +02:00
|
|
|
|
|
|
|
// reset the whole state and start over
|
2008-01-12 10:36:03 +01:00
|
|
|
void reset();
|
|
|
|
|
2013-10-20 04:40:43 +02:00
|
|
|
bool connection_close() const { return m_connection_close; }
|
|
|
|
|
2011-02-16 08:41:44 +01:00
|
|
|
std::multimap<std::string, std::string> const& headers() const { return m_header; }
|
2016-10-14 22:12:02 +02:00
|
|
|
std::vector<std::pair<std::int64_t, std::int64_t>> const& chunks() const { return m_chunked_ranges; }
|
2015-08-18 13:55:50 +02:00
|
|
|
|
2008-01-12 10:36:03 +01:00
|
|
|
private:
|
2016-07-24 09:52:20 +02:00
|
|
|
std::int64_t m_recv_pos = 0;
|
2008-01-12 10:36:03 +01:00
|
|
|
std::string m_method;
|
|
|
|
std::string m_path;
|
|
|
|
std::string m_protocol;
|
|
|
|
std::string m_server_message;
|
|
|
|
|
2016-07-24 09:52:20 +02:00
|
|
|
std::int64_t m_content_length = -1;
|
|
|
|
std::int64_t m_range_start = -1;
|
|
|
|
std::int64_t m_range_end = -1;
|
2008-01-12 10:36:03 +01:00
|
|
|
|
2011-02-16 08:41:44 +01:00
|
|
|
std::multimap<std::string, std::string> m_header;
|
2016-07-24 09:52:20 +02:00
|
|
|
span<char const> m_recv_buffer;
|
2011-01-06 05:08:57 +01:00
|
|
|
// contains offsets of the first and one-past-end of
|
|
|
|
// each chunked range in the response
|
2016-10-25 23:27:48 +02:00
|
|
|
std::vector<std::pair<std::int64_t, std::int64_t>> m_chunked_ranges;
|
2011-01-06 05:08:57 +01:00
|
|
|
|
|
|
|
// while reading a chunk, this is the offset where the
|
|
|
|
// current chunk will end (it refers to the first character
|
|
|
|
// in the chunk tail header or the next chunk header)
|
2016-07-24 09:52:20 +02:00
|
|
|
std::int64_t m_cur_chunk_end = -1;
|
2011-01-06 05:08:57 +01:00
|
|
|
|
2016-07-24 09:52:20 +02:00
|
|
|
int m_status_code = -1;
|
2014-07-06 21:18:00 +02:00
|
|
|
|
2011-01-06 05:08:57 +01:00
|
|
|
// the sum of all chunk headers read so far
|
2016-07-24 09:52:20 +02:00
|
|
|
int m_chunk_header_size = 0;
|
2011-01-06 05:08:57 +01:00
|
|
|
|
2016-07-24 09:52:20 +02:00
|
|
|
int m_partial_chunk_header = 0;
|
2011-03-24 17:46:26 +01:00
|
|
|
|
|
|
|
// controls some behaviors of the parser
|
|
|
|
int m_flags;
|
2014-07-06 21:18:00 +02:00
|
|
|
|
2016-07-24 09:52:20 +02:00
|
|
|
int m_body_start_pos = 0;
|
2014-07-06 21:18:00 +02:00
|
|
|
|
2016-07-24 09:52:20 +02:00
|
|
|
enum { read_status, read_header, read_body, error_state } m_state = read_status;
|
2014-07-06 21:18:00 +02:00
|
|
|
|
|
|
|
// this is true if the server is HTTP/1.0 or
|
|
|
|
// if it sent "connection: close"
|
2016-07-24 09:52:20 +02:00
|
|
|
bool m_connection_close = false;
|
|
|
|
bool m_chunked_encoding = false;
|
|
|
|
bool m_finished = false;
|
2008-01-12 10:36:03 +01:00
|
|
|
};
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
#endif // TORRENT_HTTP_PARSER_HPP_INCLUDED
|