536 lines
17 KiB
C++
536 lines
17 KiB
C++
|
/*
|
||
|
|
||
|
Copyright (c) 2010-2013, Arvid Norberg
|
||
|
All rights reserved.
|
||
|
|
||
|
Redistribution and use in source and binary forms, with or without
|
||
|
modification, are permitted provided that the following conditions
|
||
|
are met:
|
||
|
|
||
|
* Redistributions of source code must retain the above copyright
|
||
|
notice, this list of conditions and the following disclaimer.
|
||
|
* Redistributions in binary form must reproduce the above copyright
|
||
|
notice, this list of conditions and the following disclaimer in
|
||
|
the documentation and/or other materials provided with the distribution.
|
||
|
* Neither the name of the author nor the names of its
|
||
|
contributors may be used to endorse or promote products derived
|
||
|
from this software without specific prior written permission.
|
||
|
|
||
|
THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
|
||
|
AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
|
||
|
IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
|
||
|
ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
|
||
|
LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
|
||
|
CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
|
||
|
SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
|
||
|
INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
|
||
|
CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
|
||
|
ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
|
||
|
POSSIBILITY OF SUCH DAMAGE.
|
||
|
|
||
|
*/
|
||
|
|
||
|
#ifndef TORRENT_BLOCK_CACHE
|
||
|
#define TORRENT_BLOCK_CACHE
|
||
|
|
||
|
#include <boost/unordered_set.hpp>
|
||
|
#include <boost/cstdint.hpp>
|
||
|
#include <boost/shared_ptr.hpp>
|
||
|
#include <boost/shared_array.hpp>
|
||
|
#include <list>
|
||
|
#include <vector>
|
||
|
|
||
|
#include "libtorrent/time.hpp"
|
||
|
#include "libtorrent/error_code.hpp"
|
||
|
#include "libtorrent/io_service_fwd.hpp"
|
||
|
#include "libtorrent/hasher.hpp"
|
||
|
#include "libtorrent/sliding_average.hpp"
|
||
|
#include "libtorrent/time.hpp"
|
||
|
#include "libtorrent/tailqueue.hpp"
|
||
|
#include "libtorrent/linked_list.hpp"
|
||
|
#include "libtorrent/disk_buffer_pool.hpp"
|
||
|
#include "libtorrent/file.hpp" // for iovec_t
|
||
|
|
||
|
#if TORRENT_USE_ASSERTS
|
||
|
#include "libtorrent/disk_io_job.hpp"
|
||
|
#endif
|
||
|
|
||
|
namespace libtorrent
|
||
|
{
|
||
|
struct disk_io_job;
|
||
|
class piece_manager;
|
||
|
struct disk_buffer_pool;
|
||
|
struct cache_status;
|
||
|
struct block_cache_reference;
|
||
|
struct counters;
|
||
|
namespace aux { struct session_settings; }
|
||
|
struct alert_dispatcher;
|
||
|
#if TORRENT_USE_ASSERTS
|
||
|
class file_storage;
|
||
|
#endif
|
||
|
|
||
|
#if TORRENT_USE_ASSERTS
|
||
|
struct piece_log_t
|
||
|
{
|
||
|
piece_log_t(int j, int b= -1): job(j), block(b) {}
|
||
|
int job;
|
||
|
int block;
|
||
|
|
||
|
// these are "jobs" thar cause piece_refcount
|
||
|
// to be incremented
|
||
|
enum artificial_jobs
|
||
|
{
|
||
|
flushing = disk_io_job::num_job_ids, // 20
|
||
|
flush_expired,
|
||
|
try_flush_write_blocks,
|
||
|
try_flush_write_blocks2,
|
||
|
flush_range,
|
||
|
clear_outstanding_jobs,
|
||
|
set_outstanding_jobs,
|
||
|
|
||
|
last_job
|
||
|
};
|
||
|
|
||
|
static char const* job_names[7];
|
||
|
};
|
||
|
|
||
|
char const* job_name(int j);
|
||
|
|
||
|
void print_piece_log(std::vector<piece_log_t> const& piece_log);
|
||
|
|
||
|
#endif
|
||
|
|
||
|
struct TORRENT_EXTRA_EXPORT partial_hash
|
||
|
{
|
||
|
partial_hash(): offset(0) {}
|
||
|
// the number of bytes in the piece that has been hashed
|
||
|
int offset;
|
||
|
// the sha-1 context
|
||
|
hasher h;
|
||
|
};
|
||
|
|
||
|
struct cached_block_entry
|
||
|
{
|
||
|
cached_block_entry()
|
||
|
: buf(0)
|
||
|
, refcount(0)
|
||
|
, dirty(false)
|
||
|
, hitcount(0)
|
||
|
, pending(false)
|
||
|
{
|
||
|
#if TORRENT_USE_ASSERTS
|
||
|
hashing_count = 0;
|
||
|
reading_count = 0;
|
||
|
flushing_count = 0;
|
||
|
#endif
|
||
|
}
|
||
|
|
||
|
char* buf;
|
||
|
|
||
|
enum { max_refcount = (1 << 15) -1 };
|
||
|
|
||
|
// the number of references to this buffer. These references
|
||
|
// might be in outstanding asyncronous requests or in peer
|
||
|
// connection send buffers. We can't free the buffer until
|
||
|
// all references are gone and refcount reaches 0. The buf
|
||
|
// pointer in this struct doesn't count as a reference and
|
||
|
// is always the last to be cleared
|
||
|
boost::uint16_t refcount:15;
|
||
|
|
||
|
// if this is true, this block needs to be written to
|
||
|
// disk before it's freed. Typically all blocks in a piece
|
||
|
// would either be dirty (write coalesce cache) or not dirty
|
||
|
// (read-ahead cache). Once blocks are written to disk, the
|
||
|
// dirty flag is cleared and effectively turns the block
|
||
|
// into a read cache block
|
||
|
boost::uint16_t dirty:1;
|
||
|
|
||
|
// the number of times this block has been copied out of
|
||
|
// the cache, serving a request.
|
||
|
boost::uint16_t hitcount:15;
|
||
|
|
||
|
// pending means that this buffer has not yet been filled in
|
||
|
// with valid data. There's an outstanding read job for this.
|
||
|
// If the dirty flag is set, it means there's an outstanding
|
||
|
// write job to write this block.
|
||
|
boost::uint16_t pending:1;
|
||
|
|
||
|
#if TORRENT_USE_ASSERTS
|
||
|
// this many of the references are held by hashing operations
|
||
|
int hashing_count;
|
||
|
// this block is being used in this many peer's send buffers currently
|
||
|
int reading_count;
|
||
|
// the number of references held by flushing operations
|
||
|
int flushing_count;
|
||
|
#endif
|
||
|
};
|
||
|
|
||
|
// list_node is here to be able to link this cache entry
|
||
|
// into one of the LRU lists
|
||
|
struct TORRENT_EXTRA_EXPORT cached_piece_entry : list_node
|
||
|
{
|
||
|
cached_piece_entry();
|
||
|
~cached_piece_entry();
|
||
|
|
||
|
bool ok_to_evict(bool ignore_hash = false) const
|
||
|
{
|
||
|
return refcount == 0
|
||
|
&& piece_refcount == 0
|
||
|
&& num_blocks == 0
|
||
|
&& !hashing
|
||
|
&& read_jobs.size() == 0
|
||
|
&& (ignore_hash || !hash || hash->offset == 0);
|
||
|
}
|
||
|
|
||
|
// storage this piece belongs to
|
||
|
boost::shared_ptr<piece_manager> storage;
|
||
|
|
||
|
// write jobs hanging off of this piece
|
||
|
tailqueue jobs;
|
||
|
|
||
|
// read jobs waiting for the read job currently outstanding
|
||
|
// on this piece to complete. These are executed at that point.
|
||
|
tailqueue read_jobs;
|
||
|
|
||
|
int get_piece() const { return piece; }
|
||
|
void* get_storage() const { return storage.get(); }
|
||
|
|
||
|
bool operator==(cached_piece_entry const& rhs) const
|
||
|
{ return storage.get() == rhs.storage.get() && piece == rhs.piece; }
|
||
|
|
||
|
// if this is set, we'll be calculating the hash
|
||
|
// for this piece. This member stores the interim
|
||
|
// state while we're calulcating the hash.
|
||
|
partial_hash* hash;
|
||
|
|
||
|
// set to a unique identifier of a peer that last
|
||
|
// requested from this piece.
|
||
|
void* last_requester;
|
||
|
|
||
|
// the pointers to the block data. If this is a ghost
|
||
|
// cache entry, there won't be any data here
|
||
|
// TODO: 3 could this be a scoped_array instead? does cached_piece_entry really need to be copyable?
|
||
|
// cached_piece_entry does need to be copyable since it's part of a container, but it's possible
|
||
|
// it could be a raw pointer or boost::unique_ptr perhaps
|
||
|
boost::shared_array<cached_block_entry> blocks;
|
||
|
|
||
|
// the last time a block was written to this piece
|
||
|
// plus the minimum amount of time the block is guaranteed
|
||
|
// to stay in the cache
|
||
|
//TODO: make this 32 bits and to count seconds since the block cache was created
|
||
|
ptime expire;
|
||
|
|
||
|
boost::uint64_t piece:22;
|
||
|
|
||
|
// the number of dirty blocks in this piece
|
||
|
boost::uint64_t num_dirty:14;
|
||
|
|
||
|
// the number of blocks in the cache for this piece
|
||
|
boost::uint64_t num_blocks:14;
|
||
|
|
||
|
// the total number of blocks in this piece (and the number
|
||
|
// of elements in the blocks array)
|
||
|
boost::uint64_t blocks_in_piece:14;
|
||
|
|
||
|
// ---- 64 bit boundary ----
|
||
|
|
||
|
// while we have an outstanding async hash operation
|
||
|
// working on this piece, 'hashing' is set to 1
|
||
|
// When the operation returns, this is set to 0.
|
||
|
boost::uint32_t hashing:1;
|
||
|
|
||
|
// if we've completed at least one hash job on this
|
||
|
// piece, and returned it. This is set to one
|
||
|
boost::uint32_t hashing_done:1;
|
||
|
|
||
|
// if this is true, whenever refcount hits 0,
|
||
|
// this piece should be deleted
|
||
|
boost::uint32_t marked_for_deletion:1;
|
||
|
|
||
|
// this is set to true once we flush blocks past
|
||
|
// the hash cursor. Once this happens, there's
|
||
|
// no point in keeping cache blocks around for
|
||
|
// it in avoid_readback mode
|
||
|
boost::uint32_t need_readback:1;
|
||
|
|
||
|
// indicates which LRU list this piece is chained into
|
||
|
enum cache_state_t
|
||
|
{
|
||
|
// this is the LRU list for pieces with dirty blocks
|
||
|
write_lru,
|
||
|
|
||
|
// this is the LRU list for volatile pieces. i.e.
|
||
|
// pieces with very low cache priority. These are
|
||
|
// always the first ones to be evicted.
|
||
|
volatile_read_lru,
|
||
|
|
||
|
// this is the LRU list for read blocks that have
|
||
|
// been requested once
|
||
|
read_lru1,
|
||
|
|
||
|
// the is the LRU list for read blocks that have
|
||
|
// been requested once recently, but then was evicted.
|
||
|
// if these are requested again, they will be moved
|
||
|
// to list 2, the frequently requested pieces
|
||
|
read_lru1_ghost,
|
||
|
|
||
|
// this is the LRU of frequently used pieces. Any
|
||
|
// piece that has been requested by a second peer
|
||
|
// while pulled in to list 1 by a different peer
|
||
|
// is moved into this list
|
||
|
read_lru2,
|
||
|
|
||
|
// this is the LRU of frequently used pieces but
|
||
|
// that has been recently evicted. If a piece in
|
||
|
// this list is requested, it's moved back into list 2.
|
||
|
read_lru2_ghost,
|
||
|
num_lrus
|
||
|
};
|
||
|
|
||
|
boost::uint32_t cache_state:3;
|
||
|
|
||
|
// this is the number of threads that are currently holding
|
||
|
// a reference to this piece. A piece may not be removed from
|
||
|
// the cache while this is > 0
|
||
|
boost::uint32_t piece_refcount:7;
|
||
|
|
||
|
// if this is set to one, it means there is an outstanding
|
||
|
// flush_hashed job for this piece, and there's no need to
|
||
|
// issue another one.
|
||
|
boost::uint32_t outstanding_flush:1;
|
||
|
|
||
|
// as long as there is a read operation outstanding on this
|
||
|
// piece, this is set to 1. Otherwise 0.
|
||
|
// the purpose is to make sure not two threads are reading
|
||
|
// the same blocks at the same time. If a new read job is
|
||
|
// added when this is 1, that new job should be hung on the
|
||
|
// read job queue (read_jobs).
|
||
|
boost::uint32_t outstanding_read:1;
|
||
|
|
||
|
// the number of blocks that have >= 1 refcount
|
||
|
boost::uint32_t pinned:16;
|
||
|
|
||
|
// ---- 32 bit boundary ---
|
||
|
|
||
|
// the sum of all refcounts in all blocks
|
||
|
boost::uint32_t refcount;
|
||
|
|
||
|
#if TORRENT_USE_ASSERTS
|
||
|
// the number of times this piece has finished hashing
|
||
|
int hash_passes;
|
||
|
|
||
|
// this is a debug facility to keep a log
|
||
|
// of which operations have been run on this piece
|
||
|
std::vector<piece_log_t> piece_log;
|
||
|
|
||
|
bool in_storage;
|
||
|
bool in_use;
|
||
|
#endif
|
||
|
};
|
||
|
|
||
|
inline std::size_t hash_value(cached_piece_entry const& p)
|
||
|
{
|
||
|
return std::size_t(p.storage.get()) + p.piece;
|
||
|
}
|
||
|
|
||
|
struct TORRENT_EXTRA_EXPORT block_cache : disk_buffer_pool
|
||
|
{
|
||
|
block_cache(int block_size, io_service& ios
|
||
|
, boost::function<void()> const& trigger_trim
|
||
|
, alert_dispatcher* alert_disp);
|
||
|
|
||
|
private:
|
||
|
|
||
|
typedef boost::unordered_set<cached_piece_entry> cache_t;
|
||
|
|
||
|
public:
|
||
|
|
||
|
typedef cache_t::iterator iterator;
|
||
|
typedef cache_t::const_iterator const_iterator;
|
||
|
|
||
|
// returns the number of blocks this job would cause to be read in
|
||
|
int pad_job(disk_io_job const* j, int blocks_in_piece
|
||
|
, int read_ahead) const;
|
||
|
|
||
|
int allocate_iovec(file::iovec_t* iov, int iov_len);
|
||
|
void free_iovec(file::iovec_t* iov, int iov_len);
|
||
|
|
||
|
void reclaim_block(block_cache_reference const& ref);
|
||
|
|
||
|
// returns a range of all pieces. This migh be a very
|
||
|
// long list, use carefully
|
||
|
std::pair<iterator, iterator> all_pieces() const;
|
||
|
int num_pieces() const { return m_pieces.size(); }
|
||
|
|
||
|
list_iterator write_lru_pieces() const
|
||
|
{ return m_lru[cached_piece_entry::write_lru].iterate(); }
|
||
|
|
||
|
int num_write_lru_pieces() const { return m_lru[cached_piece_entry::write_lru].size(); }
|
||
|
|
||
|
// mark this piece for deletion. If there are no outstanding
|
||
|
// requests to this piece, it's removed immediately, and the
|
||
|
// passed in iterator will be invalidated
|
||
|
void mark_for_deletion(cached_piece_entry* p);
|
||
|
|
||
|
// similar to mark_for_deletion, except for actually marking the
|
||
|
// piece for deletion. If the piece was actually deleted,
|
||
|
// the function returns true
|
||
|
bool evict_piece(cached_piece_entry* p, tailqueue& jobs);
|
||
|
|
||
|
// if this piece is in L1 or L2 proper, move it to
|
||
|
// its respective ghost list
|
||
|
void move_to_ghost(cached_piece_entry* p);
|
||
|
|
||
|
// returns the number of bytes read on success (cache hit)
|
||
|
// -1 on cache miss
|
||
|
int try_read(disk_io_job* j, bool count_stats = true, bool expect_no_fail = false);
|
||
|
|
||
|
// called when we're reading and we found the piece we're
|
||
|
// reading from in the hash table (not necessarily that we
|
||
|
// hit the block we needed)
|
||
|
void cache_hit(cached_piece_entry* p, void* requester, bool volatile_read);
|
||
|
|
||
|
// free block from piece entry
|
||
|
void free_block(cached_piece_entry* pe, int block);
|
||
|
|
||
|
// erase a piece (typically from the ghost list). Reclaim all
|
||
|
// its blocks and unlink it and free it.
|
||
|
void erase_piece(cached_piece_entry* p);
|
||
|
|
||
|
// bump the piece 'p' to the back of the LRU list it's
|
||
|
// in (back == MRU)
|
||
|
// this is only used for the write cache
|
||
|
void bump_lru(cached_piece_entry* p);
|
||
|
|
||
|
// move p into the correct lru queue
|
||
|
void update_cache_state(cached_piece_entry* p);
|
||
|
|
||
|
// if the piece is marked for deletion and has a refcount
|
||
|
// of 0, this function will post any sync jobs and
|
||
|
// delete the piece from the cache
|
||
|
bool maybe_free_piece(cached_piece_entry* p);
|
||
|
|
||
|
// either returns the piece in the cache, or allocates
|
||
|
// a new empty piece and returns it.
|
||
|
// cache_state is one of cache_state_t enum
|
||
|
cached_piece_entry* allocate_piece(disk_io_job const* j, int cache_state);
|
||
|
|
||
|
// looks for this piece in the cache. If it's there, returns a pointer
|
||
|
// to it, otherwise 0.
|
||
|
cached_piece_entry* find_piece(block_cache_reference const& ref);
|
||
|
cached_piece_entry* find_piece(disk_io_job const* j);
|
||
|
cached_piece_entry* find_piece(piece_manager* st, int piece);
|
||
|
|
||
|
// clear free all buffers marked as dirty with
|
||
|
// refcount of 0.
|
||
|
void abort_dirty(cached_piece_entry* p);
|
||
|
|
||
|
// used to convert dirty blocks into non-dirty ones
|
||
|
// i.e. from being part of the write cache to being part
|
||
|
// of the read cache. it's used when flushing blocks to disk
|
||
|
void blocks_flushed(cached_piece_entry* pe, int const* flushed, int num_flushed);
|
||
|
|
||
|
// adds a block to the cache, marks it as dirty and
|
||
|
// associates the job with it. When the block is
|
||
|
// flushed, the callback is posted
|
||
|
cached_piece_entry* add_dirty_block(disk_io_job* j);
|
||
|
|
||
|
enum { blocks_inc_refcount = 1 };
|
||
|
void insert_blocks(cached_piece_entry* pe, int block, file::iovec_t *iov
|
||
|
, int iov_len, disk_io_job* j, int flags = 0);
|
||
|
|
||
|
#if TORRENT_USE_INVARIANT_CHECKS
|
||
|
void check_invariant() const;
|
||
|
#endif
|
||
|
|
||
|
// try to remove num number of read cache blocks from the cache
|
||
|
// pick the least recently used ones first
|
||
|
// return the number of blocks that was requested to be evicted
|
||
|
// that couldn't be
|
||
|
int try_evict_blocks(int num, cached_piece_entry* ignore = 0);
|
||
|
|
||
|
// if there are any dirty blocks
|
||
|
void clear(tailqueue& jobs);
|
||
|
|
||
|
void update_stats_counters(counters& c) const;
|
||
|
void get_stats(cache_status* ret) const;
|
||
|
void set_settings(aux::session_settings const& sett);
|
||
|
|
||
|
enum reason_t { ref_hashing = 0, ref_reading = 1, ref_flushing = 2 };
|
||
|
bool inc_block_refcount(cached_piece_entry* pe, int block, int reason);
|
||
|
void dec_block_refcount(cached_piece_entry* pe, int block, int reason);
|
||
|
|
||
|
int pinned_blocks() const { return m_pinned_blocks; }
|
||
|
|
||
|
#if TORRENT_USE_ASSERTS
|
||
|
void mark_deleted(file_storage const& fs);
|
||
|
#endif
|
||
|
|
||
|
private:
|
||
|
|
||
|
// returns number of bytes read on success, -1 on cache miss
|
||
|
// (just because the piece is in the cache, doesn't mean all
|
||
|
// the blocks are there)
|
||
|
int copy_from_piece(cached_piece_entry* p, disk_io_job* j, bool expect_no_fail = false);
|
||
|
|
||
|
void free_piece(cached_piece_entry* p);
|
||
|
int drain_piece_bufs(cached_piece_entry& p, std::vector<char*>& buf);
|
||
|
|
||
|
// block container
|
||
|
cache_t m_pieces;
|
||
|
|
||
|
// linked list of all elements in m_pieces, in usage order
|
||
|
// the most recently used are in the tail. iterating from head
|
||
|
// to tail gives the least recently used entries first
|
||
|
// the read-list is for read blocks and the write-list is for
|
||
|
// dirty blocks that needs flushing before being evicted
|
||
|
// [0] = write-LRU
|
||
|
// [1] = read-LRU1
|
||
|
// [2] = read-LRU1-ghost
|
||
|
// [3] = read-LRU2
|
||
|
// [4] = read-LRU2-ghost
|
||
|
linked_list m_lru[cached_piece_entry::num_lrus];
|
||
|
|
||
|
// this is used to determine whether to evict blocks from
|
||
|
// L1 or L2.
|
||
|
enum cache_op_t
|
||
|
{
|
||
|
cache_miss,
|
||
|
ghost_hit_lru1,
|
||
|
ghost_hit_lru2
|
||
|
};
|
||
|
int m_last_cache_op;
|
||
|
|
||
|
// the number of pieces to keep in the ARC ghost lists
|
||
|
// this is determined by being a fraction of the cache size
|
||
|
int m_ghost_size;
|
||
|
|
||
|
// the number of blocks in the cache
|
||
|
// that are in the read cache
|
||
|
boost::uint32_t m_read_cache_size;
|
||
|
// the number of blocks in the cache
|
||
|
// that are in the write cache
|
||
|
boost::uint32_t m_write_cache_size;
|
||
|
|
||
|
// the number of blocks that are currently sitting
|
||
|
// in peer's send buffers. If two peers are sending
|
||
|
// the same block, it counts as 2, even though there're
|
||
|
// no buffer duplication
|
||
|
boost::uint32_t m_send_buffer_blocks;
|
||
|
|
||
|
boost::uint32_t m_blocks_read_hit;
|
||
|
|
||
|
// the number of blocks with a refcount > 0, i.e.
|
||
|
// they may not be evicted
|
||
|
int m_pinned_blocks;
|
||
|
|
||
|
#if TORRENT_USE_ASSERTS
|
||
|
std::vector<std::pair<std::string, void const*> > m_deleted_storages;
|
||
|
#endif
|
||
|
};
|
||
|
|
||
|
}
|
||
|
|
||
|
#endif // TORRENT_BLOCK_CACHE
|
||
|
|