openethereum/sync/src/light_sync/mod.rs

461 lines
13 KiB
Rust
Raw Normal View History

2016-12-13 21:09:43 +01:00
// Copyright 2015, 2016 Parity Technologies (UK) Ltd.
// This file is part of Parity.
// Parity is free software: you can redistribute it and/or modify
// it under the terms of the GNU General Public License as published by
// the Free Software Foundation, either version 3 of the License, or
// (at your option) any later version.
// Parity is distributed in the hope that it will be useful,
// but WITHOUT ANY WARRANTY; without even the implied warranty of
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
// GNU General Public License for more details.
// You should have received a copy of the GNU General Public License
// along with Parity. If not, see <http://www.gnu.org/licenses/>.
//! Light client synchronization.
//!
//! This will synchronize the header chain using LES messages.
//! Dataflow is largely one-directional as headers are pushed into
//! the light client queue for import. Where possible, they are batched
//! in groups.
//!
//! This is written assuming that the client and sync service are running
2016-12-14 23:26:15 +01:00
//! in the same binary; unlike a full node which might communicate via IPC.
2016-12-13 21:09:43 +01:00
use std::collections::HashMap;
2016-12-15 21:51:08 +01:00
use std::mem;
2016-12-13 21:09:43 +01:00
use std::sync::Arc;
2016-12-14 23:26:15 +01:00
use light::client::LightChainClient;
2016-12-15 21:51:08 +01:00
use light::net::{
Announcement, Handler, BasicContext, EventContext,
2016-12-16 14:53:36 +01:00
Capabilities, ReqId, Status,
2016-12-15 21:51:08 +01:00
};
2016-12-13 21:09:43 +01:00
use light::request;
use network::PeerId;
use util::{Bytes, U256, H256, Mutex, RwLock};
use rand::{Rng, OsRng};
2016-12-13 21:09:43 +01:00
use self::sync_round::{AbortReason, SyncRound, ResponseContext};
2016-12-15 21:51:08 +01:00
2016-12-14 23:26:15 +01:00
mod response;
mod sync_round;
2016-12-13 21:09:43 +01:00
/// Peer chain info.
///
/// A snapshot of the chain head a peer has reported, taken either from its
/// handshake status or from its most recent announcement.
#[derive(Clone)]
struct ChainInfo {
    // total difficulty reported for the peer's head.
    head_td: U256,
    // hash of the peer's head block.
    head_hash: H256,
    // number of the peer's head block.
    head_num: u64,
}
2016-12-14 23:26:15 +01:00
struct Peer {
status: ChainInfo,
2016-12-13 21:09:43 +01:00
}
2016-12-14 23:26:15 +01:00
impl Peer {
2016-12-16 15:26:39 +01:00
// Create a new peer.
2016-12-14 23:26:15 +01:00
fn new(chain_info: ChainInfo) -> Self {
Peer {
2016-12-16 15:26:39 +01:00
status: chain_info,
2016-12-13 21:09:43 +01:00
}
}
}
2016-12-16 14:53:36 +01:00
// search for a common ancestor with the best chain.
//
// Each variant is one step of the search; `process_response` and
// `dispatch_request` consume a value and return the follow-up step.
enum AncestorSearch {
    // queued to search for blocks starting from here.
    Queued(u64),
    // awaiting response for this request: the request id, the block number
    // the request started from, and the request itself.
    Awaiting(ReqId, u64, request::Headers),
    // prehistoric block found. TODO: start to roll back CHTs.
    Prehistoric,
    // common block found (number and hash).
    FoundCommon(u64, H256),
    // common ancestor is the genesis.
    Genesis,
}
impl AncestorSearch {
fn begin(best_num: u64) -> Self {
match best_num {
0 => AncestorSearch::Genesis,
2016-12-16 15:26:39 +01:00
_ => AncestorSearch::Queued(best_num),
2016-12-16 14:53:36 +01:00
}
}
2016-12-16 15:26:39 +01:00
fn process_response<L>(self, ctx: &ResponseContext, client: &L) -> AncestorSearch
2016-12-16 14:53:36 +01:00
where L: LightChainClient
{
let first_num = client.chain_info().first_block_number.unwrap_or(0);
match self {
AncestorSearch::Awaiting(id, start, req) => {
if &id == ctx.req_id() {
match response::decode_and_verify(ctx.data(), &req) {
Ok(headers) => {
for header in &headers {
if client.is_known(&header.hash()) {
debug!(target: "sync", "Found common ancestor with best chain");
return AncestorSearch::FoundCommon(header.number(), header.hash());
}
if header.number() <= first_num {
debug!(target: "sync", "Prehistoric common ancestor with best chain.");
return AncestorSearch::Prehistoric;
}
}
AncestorSearch::Queued(start - headers.len() as u64)
}
Err(e) => {
trace!(target: "sync", "Bad headers response from {}: {}", ctx.responder(), e);
ctx.punish_responder();
AncestorSearch::Queued(start)
}
}
} else {
AncestorSearch::Awaiting(id, start, req)
}
}
other => other,
}
}
2016-12-16 15:26:39 +01:00
fn dispatch_request<F>(self, mut dispatcher: F) -> AncestorSearch
where F: FnMut(request::Headers) -> Option<ReqId>
{
const BATCH_SIZE: usize = 64;
match self {
AncestorSearch::Queued(start) => {
let req = request::Headers {
start: start.into(),
max: ::std::cmp::min(start as usize, BATCH_SIZE),
skip: 0,
reverse: true,
};
match dispatcher(req.clone()) {
Some(req_id) => AncestorSearch::Awaiting(req_id, start, req),
None => AncestorSearch::Queued(start),
}
}
other => other,
}
}
2016-12-15 21:51:08 +01:00
}
// synchronization state machine.
//
// Held behind the `state` mutex of `LightSync`; handlers take the current
// value out, transform it and put the result back.
enum SyncState {
    // Idle (waiting for peers)
    Idle,
    // searching for common ancestor with best chain.
    // queue should be cleared at this phase.
    AncestorSearch(AncestorSearch),
    // Doing sync rounds.
    Rounds(SyncRound),
}
// Everything the sync state machine needs to know about one headers response.
struct ResponseCtx<'a> {
    // the peer which sent the response.
    peer: PeerId,
    // id of the request being answered.
    req_id: ReqId,
    // network context, used to punish the responder.
    ctx: &'a BasicContext,
    // the raw response payload.
    data: &'a [Bytes],
}
impl<'a> ResponseContext for ResponseCtx<'a> {
    // The peer that produced this response.
    fn responder(&self) -> PeerId {
        self.peer
    }

    // Id of the request this response answers.
    fn req_id(&self) -> &ReqId {
        &self.req_id
    }

    // Raw payload of the response.
    fn data(&self) -> &[Bytes] {
        self.data
    }

    // Punish the responder by disabling it through the network context.
    fn punish_responder(&self) {
        self.ctx.disable_peer(self.peer)
    }
}
2016-12-13 21:09:43 +01:00
/// Light client synchronization manager. See module docs for more details.
2016-12-14 23:26:15 +01:00
pub struct LightSync<L: LightChainClient> {
2016-12-13 21:09:43 +01:00
best_seen: Mutex<Option<(H256, U256)>>, // best seen block on the network.
peers: RwLock<HashMap<PeerId, Mutex<Peer>>>, // peers which are relevant to synchronization.
2016-12-14 23:26:15 +01:00
client: Arc<L>,
2016-12-16 15:26:39 +01:00
rng: Mutex<OsRng>,
2016-12-15 21:51:08 +01:00
state: Mutex<SyncState>,
2016-12-13 21:09:43 +01:00
}
2016-12-14 23:26:15 +01:00
impl<L: LightChainClient> Handler for LightSync<L> {
2016-12-13 21:09:43 +01:00
fn on_connect(&self, ctx: &EventContext, status: &Status, capabilities: &Capabilities) {
let our_best = self.client.chain_info().best_block_number;
if !capabilities.serve_headers || status.head_num <= our_best {
2016-12-15 21:51:08 +01:00
trace!(target: "sync", "Disconnecting irrelevant peer: {}", ctx.peer());
ctx.disconnect_peer(ctx.peer());
2016-12-13 21:09:43 +01:00
return;
}
let chain_info = ChainInfo {
head_td: status.head_td,
head_hash: status.head_hash,
head_num: status.head_num,
};
2016-12-16 22:09:29 +01:00
{
let mut best = self.best_seen.lock();
if best.as_ref().map_or(true, |b| status.head_td > b.1) {
*best = Some((status.head_hash, status.head_td));
}
2016-12-15 21:51:08 +01:00
}
2016-12-14 23:26:15 +01:00
self.peers.write().insert(ctx.peer(), Mutex::new(Peer::new(chain_info)));
2016-12-15 21:51:08 +01:00
self.maintain_sync(ctx.as_basic());
}
2016-12-15 21:51:08 +01:00
fn on_disconnect(&self, ctx: &EventContext, unfulfilled: &[ReqId]) {
2016-12-14 23:26:15 +01:00
let peer_id = ctx.peer();
2016-12-15 21:51:08 +01:00
let peer = match self.peers.write().remove(&peer_id).map(|p| p.into_inner()) {
Some(peer) => peer,
None => return,
};
2016-12-16 22:09:29 +01:00
trace!(target: "sync", "peer {} disconnecting", peer_id);
2016-12-15 21:51:08 +01:00
let new_best = {
let mut best = self.best_seen.lock();
let peer_best = (peer.status.head_hash, peer.status.head_td);
if best.as_ref().map_or(false, |b| b == &peer_best) {
// search for next-best block.
let next_best: Option<(H256, U256)> = self.peers.read().values()
.map(|p| p.lock())
.map(|p| (p.status.head_hash, p.status.head_td))
.fold(None, |acc, x| match acc {
Some(acc) => if x.1 > acc.1 { Some(x) } else { Some(acc) },
None => Some(x),
});
*best = next_best;
}
best.clone()
};
if new_best.is_none() {
debug!(target: "sync", "No peers remain. Reverting to idle");
*self.state.lock() = SyncState::Idle;
} else {
let mut state = self.state.lock();
*state = match mem::replace(&mut *state, SyncState::Idle) {
SyncState::Idle => SyncState::Idle,
SyncState::AncestorSearch(search) => SyncState::AncestorSearch(search),
SyncState::Rounds(round) => SyncState::Rounds(round.requests_abandoned(unfulfilled)),
};
}
self.maintain_sync(ctx.as_basic());
}
fn on_announcement(&self, ctx: &EventContext, announcement: &Announcement) {
2016-12-15 21:51:08 +01:00
let last_td = {
let peers = self.peers.read();
2016-12-16 22:09:29 +01:00
match peers.get(&ctx.peer()) {
2016-12-15 21:51:08 +01:00
None => return,
Some(peer) => {
let mut peer = peer.lock();
let last_td = peer.status.head_td;
peer.status = ChainInfo {
head_td: announcement.head_td,
head_hash: announcement.head_hash,
head_num: announcement.head_num,
};
last_td
}
}
};
trace!(target: "sync", "Announcement from peer {}: new chain head {:?}, reorg depth {}",
ctx.peer(), (announcement.head_hash, announcement.head_num), announcement.reorg_depth);
2016-12-15 21:51:08 +01:00
2016-12-16 23:53:36 +01:00
if last_td > announcement.head_td {
2016-12-15 21:51:08 +01:00
trace!(target: "sync", "Peer {} moved backwards.", ctx.peer());
self.peers.write().remove(&ctx.peer());
ctx.disconnect_peer(ctx.peer());
}
2016-12-16 22:09:29 +01:00
{
let mut best = self.best_seen.lock();
if best.as_ref().map_or(true, |b| announcement.head_td > b.1) {
*best = Some((announcement.head_hash, announcement.head_td));
}
2016-12-15 21:51:08 +01:00
}
self.maintain_sync(ctx.as_basic());
}
fn on_block_headers(&self, ctx: &EventContext, req_id: ReqId, headers: &[Bytes]) {
if !self.peers.read().contains_key(&ctx.peer()) {
return
2016-12-15 21:51:08 +01:00
}
{
let mut state = self.state.lock();
2016-12-16 14:53:36 +01:00
let ctx = ResponseCtx {
peer: ctx.peer(),
req_id: req_id,
ctx: ctx.as_basic(),
data: headers,
};
2016-12-15 21:51:08 +01:00
*state = match mem::replace(&mut *state, SyncState::Idle) {
SyncState::Idle => SyncState::Idle,
2016-12-16 14:53:36 +01:00
SyncState::AncestorSearch(search) =>
SyncState::AncestorSearch(search.process_response(&ctx, &*self.client)),
SyncState::Rounds(round) => SyncState::Rounds(round.process_response(&ctx)),
2016-12-15 21:51:08 +01:00
};
}
self.maintain_sync(ctx.as_basic());
}
fn tick(&self, ctx: &BasicContext) {
self.maintain_sync(ctx);
}
}
// private helpers
impl<L: LightChainClient> LightSync<L> {
// Begins a search for the common ancestor and our best block.
// does not lock state, instead has a mutable reference to it passed.
2016-12-16 14:53:36 +01:00
fn begin_search(&self, state: &mut SyncState) {
self.client.clear_queue();
2016-12-16 14:53:36 +01:00
let chain_info = self.client.chain_info();
if let None = *self.best_seen.lock() {
// no peers.
*state = SyncState::Idle;
return;
}
2016-12-16 22:09:29 +01:00
trace!(target: "sync", "Beginning search for common ancestor");
2016-12-16 14:53:36 +01:00
*state = SyncState::AncestorSearch(AncestorSearch::begin(chain_info.best_block_number));
}
2016-12-15 21:51:08 +01:00
fn maintain_sync(&self, ctx: &BasicContext) {
const DRAIN_AMOUNT: usize = 128;
2016-12-16 22:09:29 +01:00
debug!(target: "sync", "Maintaining sync.");
let mut state = self.state.lock();
// drain any pending blocks into the queue.
{
let mut sink = Vec::with_capacity(DRAIN_AMOUNT);
2016-12-15 21:51:08 +01:00
'a:
loop {
let queue_info = self.client.queue_info();
if queue_info.is_full() { break }
*state = match mem::replace(&mut *state, SyncState::Idle) {
SyncState::Rounds(round)
=> SyncState::Rounds(round.drain(&mut sink, Some(DRAIN_AMOUNT))),
other => other,
};
if sink.is_empty() { break }
for header in sink.drain(..) {
if let Err(e) = self.client.queue_header(header) {
debug!(target: "sync", "Found bad header ({:?}). Reset to search state.", e);
self.begin_search(&mut state);
break 'a;
}
}
}
}
2016-12-16 14:53:36 +01:00
// handle state transitions.
{
match mem::replace(&mut *state, SyncState::Idle) {
SyncState::Rounds(SyncRound::Abort(reason)) => {
match reason {
AbortReason::BadScaffold(bad_peers) => {
debug!(target: "sync", "Disabling peers responsible for bad scaffold");
for peer in bad_peers {
ctx.disable_peer(peer);
}
}
AbortReason::NoResponses => {}
}
debug!(target: "sync", "Beginning search after aborted sync round");
self.begin_search(&mut state);
}
2016-12-16 14:53:36 +01:00
SyncState::AncestorSearch(AncestorSearch::FoundCommon(num, hash)) => {
// TODO: compare to best block and switch to another downloading
// method when close.
*state = SyncState::Rounds(SyncRound::begin(num, hash));
}
SyncState::AncestorSearch(AncestorSearch::Genesis) => {
// Same here.
let g_hash = self.client.chain_info().genesis_hash;
*state = SyncState::Rounds(SyncRound::begin(0, g_hash));
}
SyncState::Idle => self.begin_search(&mut state),
other => *state = other, // restore displaced state.
}
}
// allow dispatching of requests.
2016-12-16 14:53:36 +01:00
// TODO: maybe wait until the amount of cumulative requests remaining is high enough
// to avoid pumping the failure rate.
{
2016-12-16 15:26:39 +01:00
let peers = self.peers.read();
let mut peer_ids: Vec<_> = peers.keys().cloned().collect();
let mut rng = self.rng.lock();
// naive request dispatcher: just give to any peer which says it will
// give us responses.
let dispatcher = move |req: request::Headers| {
rng.shuffle(&mut peer_ids);
for peer in &peer_ids {
if ctx.max_requests(*peer, request::Kind::Headers) >= req.max {
match ctx.request_from(*peer, request::Request::Headers(req.clone())) {
2016-12-16 23:21:17 +01:00
Ok(id) => {
return Some(id)
}
2016-12-16 15:26:39 +01:00
Err(e) =>
trace!(target: "sync", "Error requesting headers from viable peer: {}", e),
}
}
}
None
};
*state = match mem::replace(&mut *state, SyncState::Idle) {
2016-12-16 15:26:39 +01:00
SyncState::Rounds(round) =>
SyncState::Rounds(round.dispatch_requests(dispatcher)),
SyncState::AncestorSearch(search) =>
SyncState::AncestorSearch(search.dispatch_request(dispatcher)),
other => other,
};
}
2016-12-13 21:09:43 +01:00
}
}
// public API
2016-12-14 23:26:15 +01:00
impl<L: LightChainClient> LightSync<L> {
2016-12-13 21:09:43 +01:00
/// Create a new instance of `LightSync`.
///
/// This won't do anything until registered as a handler
/// so it can act on events.
pub fn new(client: Arc<L>) -> Result<Self, ::std::io::Error> {
Ok(LightSync {
2016-12-13 21:09:43 +01:00
best_seen: Mutex::new(None),
peers: RwLock::new(HashMap::new()),
2016-12-13 21:09:43 +01:00
client: client,
2016-12-16 15:26:39 +01:00
rng: Mutex::new(try!(OsRng::new())),
2016-12-15 21:51:08 +01:00
state: Mutex::new(SyncState::Idle),
})
2016-12-13 21:09:43 +01:00
}
}