2017-01-25 18:51:41 +01:00
|
|
|
// Copyright 2015-2017 Parity Technologies (UK) Ltd.
|
2016-08-05 17:00:46 +02:00
|
|
|
// This file is part of Parity.
|
|
|
|
|
|
|
|
// Parity is free software: you can redistribute it and/or modify
|
|
|
|
// it under the terms of the GNU General Public License as published by
|
|
|
|
// the Free Software Foundation, either version 3 of the License, or
|
|
|
|
// (at your option) any later version.
|
|
|
|
|
|
|
|
// Parity is distributed in the hope that it will be useful,
|
|
|
|
// but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
// GNU General Public License for more details.
|
|
|
|
|
|
|
|
// You should have received a copy of the GNU General Public License
|
|
|
|
// along with Parity. If not, see <http://www.gnu.org/licenses/>.
|
|
|
|
|
|
|
|
//! Snapshot network service implementation.
|
|
|
|
|
2017-04-19 20:31:53 +02:00
|
|
|
use std::collections::HashSet;
|
2016-08-05 17:00:46 +02:00
|
|
|
use std::io::ErrorKind;
|
|
|
|
use std::fs;
|
2016-09-07 15:27:28 +02:00
|
|
|
use std::path::PathBuf;
|
2016-08-05 17:00:46 +02:00
|
|
|
use std::sync::Arc;
|
2016-09-07 15:27:14 +02:00
|
|
|
use std::sync::atomic::{AtomicBool, AtomicUsize, Ordering};
|
2016-08-05 17:00:46 +02:00
|
|
|
|
2017-04-19 20:31:53 +02:00
|
|
|
use super::{ManifestData, StateRebuilder, Rebuilder, RestorationStatus, SnapshotService};
|
2016-08-25 22:20:44 +02:00
|
|
|
use super::io::{SnapshotReader, LooseReader, SnapshotWriter, LooseWriter};
|
2016-08-05 17:00:46 +02:00
|
|
|
|
|
|
|
use blockchain::BlockChain;
|
2016-09-21 12:56:13 +02:00
|
|
|
use client::{BlockChainClient, Client};
|
2016-08-05 17:00:46 +02:00
|
|
|
use engines::Engine;
|
|
|
|
use error::Error;
|
2016-12-09 23:01:43 +01:00
|
|
|
use ids::BlockId;
|
2016-08-05 17:00:46 +02:00
|
|
|
use service::ClientIoMessage;
|
|
|
|
|
|
|
|
use io::IoChannel;
|
|
|
|
|
2016-09-11 14:05:59 +02:00
|
|
|
use util::{Bytes, H256, Mutex, RwLock, RwLockReadGuard, UtilError};
|
2016-08-05 17:00:46 +02:00
|
|
|
use util::journaldb::Algorithm;
|
|
|
|
use util::kvdb::{Database, DatabaseConfig};
|
|
|
|
use util::snappy;
|
|
|
|
|
2016-09-02 19:00:20 +02:00
|
|
|
/// Cleanup helper for error paths: holds a directory path and, unless
/// disarmed first, recursively removes that directory when dropped.
///
/// Field `0` is the "armed" flag, field `1` the guarded path.
struct Guard(bool, PathBuf);

impl Guard {
	/// Create an armed guard for `path`.
	fn new(path: PathBuf) -> Self {
		Guard(true, path)
	}

	/// Consume the guard, leaving the guarded directory in place.
	fn disarm(mut self) {
		// `self` is dropped right after this assignment; `drop` then sees
		// the cleared flag and skips the removal.
		self.0 = false;
	}
}

impl Drop for Guard {
	fn drop(&mut self) {
		let Guard(armed, ref path) = *self;
		if armed {
			// best-effort cleanup: a failed removal is deliberately ignored.
			let _ = fs::remove_dir_all(path);
		}
	}
}
|
|
|
|
|
2016-09-06 15:31:13 +02:00
|
|
|
/// External database restoration handler
|
2016-09-06 15:41:56 +02:00
|
|
|
pub trait DatabaseRestore: Send + Sync {
|
2016-09-06 15:31:13 +02:00
|
|
|
/// Restart with a new backend. Takes ownership of passed database and moves it to a new location.
|
|
|
|
fn restore_db(&self, new_db: &str) -> Result<(), Error>;
|
2016-08-05 17:00:46 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
/// State restoration manager.
|
|
|
|
struct Restoration {
|
2016-08-25 22:20:44 +02:00
|
|
|
manifest: ManifestData,
|
2016-08-05 17:00:46 +02:00
|
|
|
state_chunks_left: HashSet<H256>,
|
|
|
|
block_chunks_left: HashSet<H256>,
|
|
|
|
state: StateRebuilder,
|
2017-04-19 20:31:53 +02:00
|
|
|
secondary: Box<Rebuilder>,
|
2016-09-11 14:05:59 +02:00
|
|
|
writer: Option<LooseWriter>,
|
2016-08-05 17:00:46 +02:00
|
|
|
snappy_buffer: Bytes,
|
|
|
|
final_state_root: H256,
|
2016-09-02 19:00:20 +02:00
|
|
|
guard: Guard,
|
2016-10-25 18:40:01 +02:00
|
|
|
db: Arc<Database>,
|
2016-08-05 17:00:46 +02:00
|
|
|
}
|
|
|
|
|
2016-08-25 22:20:44 +02:00
|
|
|
struct RestorationParams<'a> {
|
|
|
|
manifest: ManifestData, // manifest to base restoration on.
|
|
|
|
pruning: Algorithm, // pruning algorithm for the database.
|
|
|
|
db_path: PathBuf, // database path
|
2016-09-11 14:05:59 +02:00
|
|
|
db_config: &'a DatabaseConfig, // configuration for the database.
|
|
|
|
writer: Option<LooseWriter>, // writer for recovered snapshot.
|
2016-08-25 22:20:44 +02:00
|
|
|
genesis: &'a [u8], // genesis block of the chain.
|
2016-09-02 19:00:20 +02:00
|
|
|
guard: Guard, // guard for the restoration directory.
|
2017-04-19 20:31:53 +02:00
|
|
|
engine: &'a Engine,
|
2016-08-25 22:20:44 +02:00
|
|
|
}
|
|
|
|
|
2016-08-05 17:00:46 +02:00
|
|
|
impl Restoration {
|
2016-08-25 22:20:44 +02:00
|
|
|
// make a new restoration using the given parameters.
|
|
|
|
fn new(params: RestorationParams) -> Result<Self, Error> {
|
|
|
|
let manifest = params.manifest;
|
|
|
|
|
|
|
|
let state_chunks = manifest.state_hashes.iter().cloned().collect();
|
|
|
|
let block_chunks = manifest.block_hashes.iter().cloned().collect();
|
|
|
|
|
2016-12-27 12:53:56 +01:00
|
|
|
let raw_db = Arc::new(Database::open(params.db_config, &*params.db_path.to_string_lossy())
|
|
|
|
.map_err(UtilError::SimpleString)?);
|
2016-08-05 17:00:46 +02:00
|
|
|
|
2017-01-23 15:27:11 +01:00
|
|
|
let chain = BlockChain::new(Default::default(), params.genesis, raw_db.clone());
|
2017-04-19 20:31:53 +02:00
|
|
|
let components = params.engine.snapshot_components()
|
|
|
|
.ok_or_else(|| ::snapshot::Error::SnapshotsUnsupported)?;
|
|
|
|
|
|
|
|
let secondary = components.rebuilder(chain, raw_db.clone(), &manifest)?;
|
2016-08-05 17:00:46 +02:00
|
|
|
|
2016-08-25 22:20:44 +02:00
|
|
|
let root = manifest.state_root.clone();
|
2017-05-17 12:41:33 +02:00
|
|
|
|
2016-08-05 17:00:46 +02:00
|
|
|
Ok(Restoration {
|
2016-08-25 22:20:44 +02:00
|
|
|
manifest: manifest,
|
|
|
|
state_chunks_left: state_chunks,
|
|
|
|
block_chunks_left: block_chunks,
|
2016-10-25 18:40:01 +02:00
|
|
|
state: StateRebuilder::new(raw_db.clone(), params.pruning),
|
2017-04-19 20:31:53 +02:00
|
|
|
secondary: secondary,
|
2016-08-25 22:20:44 +02:00
|
|
|
writer: params.writer,
|
2016-08-05 17:00:46 +02:00
|
|
|
snappy_buffer: Vec::new(),
|
2016-08-25 22:20:44 +02:00
|
|
|
final_state_root: root,
|
2016-09-02 19:00:20 +02:00
|
|
|
guard: params.guard,
|
2016-10-25 18:40:01 +02:00
|
|
|
db: raw_db,
|
2016-08-05 17:00:46 +02:00
|
|
|
})
|
|
|
|
}
|
|
|
|
|
2016-11-13 13:52:53 +01:00
|
|
|
// feeds a state chunk, aborts early if `flag` becomes false.
|
|
|
|
fn feed_state(&mut self, hash: H256, chunk: &[u8], flag: &AtomicBool) -> Result<(), Error> {
|
2016-08-05 17:00:46 +02:00
|
|
|
if self.state_chunks_left.remove(&hash) {
|
2016-12-27 12:53:56 +01:00
|
|
|
let len = snappy::decompress_into(chunk, &mut self.snappy_buffer)?;
|
2016-08-05 17:00:46 +02:00
|
|
|
|
2016-12-27 12:53:56 +01:00
|
|
|
self.state.feed(&self.snappy_buffer[..len], flag)?;
|
2016-09-11 14:05:59 +02:00
|
|
|
|
|
|
|
if let Some(ref mut writer) = self.writer.as_mut() {
|
2016-12-27 12:53:56 +01:00
|
|
|
writer.write_state_chunk(hash, chunk)?;
|
2016-09-11 14:05:59 +02:00
|
|
|
}
|
2016-08-05 17:00:46 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
Ok(())
|
|
|
|
}
|
|
|
|
|
|
|
|
// feeds a block chunk
|
2016-11-13 13:52:53 +01:00
|
|
|
fn feed_blocks(&mut self, hash: H256, chunk: &[u8], engine: &Engine, flag: &AtomicBool) -> Result<(), Error> {
|
2016-08-05 17:00:46 +02:00
|
|
|
if self.block_chunks_left.remove(&hash) {
|
2016-12-27 12:53:56 +01:00
|
|
|
let len = snappy::decompress_into(chunk, &mut self.snappy_buffer)?;
|
2016-08-25 22:20:44 +02:00
|
|
|
|
2017-04-19 20:31:53 +02:00
|
|
|
self.secondary.feed(&self.snappy_buffer[..len], engine, flag)?;
|
2016-09-11 14:05:59 +02:00
|
|
|
if let Some(ref mut writer) = self.writer.as_mut() {
|
2016-12-27 12:53:56 +01:00
|
|
|
writer.write_block_chunk(hash, chunk)?;
|
2016-09-11 14:05:59 +02:00
|
|
|
}
|
2016-08-25 22:20:44 +02:00
|
|
|
}
|
2016-08-05 17:00:46 +02:00
|
|
|
|
2016-08-25 22:20:44 +02:00
|
|
|
Ok(())
|
|
|
|
}
|
|
|
|
|
|
|
|
// finish up restoration.
|
2017-05-17 12:41:33 +02:00
|
|
|
fn finalize(mut self, engine: &Engine) -> Result<(), Error> {
|
2016-08-25 22:20:44 +02:00
|
|
|
use util::trie::TrieError;
|
|
|
|
|
|
|
|
if !self.is_done() { return Ok(()) }
|
|
|
|
|
|
|
|
// verify final state root.
|
|
|
|
let root = self.state.state_root();
|
|
|
|
if root != self.final_state_root {
|
|
|
|
warn!("Final restored state has wrong state root: expected {:?}, got {:?}", root, self.final_state_root);
|
|
|
|
return Err(TrieError::InvalidStateRoot(root).into());
|
2016-08-05 17:00:46 +02:00
|
|
|
}
|
|
|
|
|
2016-08-25 22:20:44 +02:00
|
|
|
// check for missing code.
|
2017-05-17 12:41:33 +02:00
|
|
|
let db = self.state.finalize(self.manifest.block_number, self.manifest.block_hash)?;
|
|
|
|
let db = ::state_db::StateDB::new(db, 0);
|
2016-08-25 22:20:44 +02:00
|
|
|
|
2016-10-28 16:10:30 +02:00
|
|
|
// connect out-of-order chunks and verify chain integrity.
|
2017-05-17 12:41:33 +02:00
|
|
|
self.secondary.finalize(db, engine)?;
|
2016-08-25 22:20:44 +02:00
|
|
|
|
2016-09-11 14:05:59 +02:00
|
|
|
if let Some(writer) = self.writer {
|
2016-12-27 12:53:56 +01:00
|
|
|
writer.finish(self.manifest)?;
|
2016-09-11 14:05:59 +02:00
|
|
|
}
|
2016-08-25 22:20:44 +02:00
|
|
|
|
2016-09-02 19:00:20 +02:00
|
|
|
self.guard.disarm();
|
2016-08-05 17:00:46 +02:00
|
|
|
Ok(())
|
|
|
|
}
|
|
|
|
|
|
|
|
// is everything done?
|
|
|
|
fn is_done(&self) -> bool {
|
|
|
|
self.block_chunks_left.is_empty() && self.state_chunks_left.is_empty()
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Type alias for client io channel.
|
|
|
|
pub type Channel = IoChannel<ClientIoMessage>;
|
|
|
|
|
2016-09-07 15:27:28 +02:00
|
|
|
/// Snapshot service parameters.
|
|
|
|
pub struct ServiceParams {
|
|
|
|
/// The consensus engine this is built on.
|
|
|
|
pub engine: Arc<Engine>,
|
|
|
|
/// The chain's genesis block.
|
|
|
|
pub genesis_block: Bytes,
|
|
|
|
/// Database configuration options.
|
|
|
|
pub db_config: DatabaseConfig,
|
|
|
|
/// State pruning algorithm.
|
|
|
|
pub pruning: Algorithm,
|
|
|
|
/// Async IO channel for sending messages.
|
|
|
|
pub channel: Channel,
|
|
|
|
/// The directory to put snapshots in.
|
|
|
|
/// Usually "<chain hash>/snapshot"
|
|
|
|
pub snapshot_root: PathBuf,
|
|
|
|
/// A handle for database restoration.
|
|
|
|
pub db_restore: Arc<DatabaseRestore>,
|
|
|
|
}
|
|
|
|
|
|
|
|
/// `SnapshotService` implementation.
|
|
|
|
/// This controls taking snapshots and restoring from them.
|
2016-08-05 17:00:46 +02:00
|
|
|
pub struct Service {
|
|
|
|
restoration: Mutex<Option<Restoration>>,
|
2016-09-07 15:27:28 +02:00
|
|
|
snapshot_root: PathBuf,
|
|
|
|
db_config: DatabaseConfig,
|
2016-10-30 09:56:34 +01:00
|
|
|
io_channel: Mutex<Channel>,
|
2016-08-05 17:00:46 +02:00
|
|
|
pruning: Algorithm,
|
|
|
|
status: Mutex<RestorationStatus>,
|
2016-08-25 22:20:44 +02:00
|
|
|
reader: RwLock<Option<LooseReader>>,
|
2016-08-05 23:33:55 +02:00
|
|
|
engine: Arc<Engine>,
|
|
|
|
genesis_block: Bytes,
|
2016-08-05 17:00:46 +02:00
|
|
|
state_chunks: AtomicUsize,
|
|
|
|
block_chunks: AtomicUsize,
|
2016-09-06 15:31:13 +02:00
|
|
|
db_restore: Arc<DatabaseRestore>,
|
2016-09-06 17:44:11 +02:00
|
|
|
progress: super::Progress,
|
2016-09-07 15:27:14 +02:00
|
|
|
taking_snapshot: AtomicBool,
|
2016-11-13 13:52:53 +01:00
|
|
|
restoring_snapshot: AtomicBool,
|
2016-08-05 17:00:46 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
impl Service {
|
2016-09-07 15:27:28 +02:00
|
|
|
/// Create a new snapshot service from the given parameters.
|
|
|
|
pub fn new(params: ServiceParams) -> Result<Self, Error> {
|
|
|
|
let mut service = Service {
|
2016-08-05 17:00:46 +02:00
|
|
|
restoration: Mutex::new(None),
|
2016-09-07 15:27:28 +02:00
|
|
|
snapshot_root: params.snapshot_root,
|
|
|
|
db_config: params.db_config,
|
2016-10-30 09:56:34 +01:00
|
|
|
io_channel: Mutex::new(params.channel),
|
2016-09-07 15:27:28 +02:00
|
|
|
pruning: params.pruning,
|
2016-08-05 17:00:46 +02:00
|
|
|
status: Mutex::new(RestorationStatus::Inactive),
|
2016-09-07 15:27:28 +02:00
|
|
|
reader: RwLock::new(None),
|
|
|
|
engine: params.engine,
|
|
|
|
genesis_block: params.genesis_block,
|
2016-08-05 17:00:46 +02:00
|
|
|
state_chunks: AtomicUsize::new(0),
|
|
|
|
block_chunks: AtomicUsize::new(0),
|
2016-09-07 15:27:28 +02:00
|
|
|
db_restore: params.db_restore,
|
2016-09-06 17:44:11 +02:00
|
|
|
progress: Default::default(),
|
2016-09-07 15:27:14 +02:00
|
|
|
taking_snapshot: AtomicBool::new(false),
|
2016-11-13 13:52:53 +01:00
|
|
|
restoring_snapshot: AtomicBool::new(false),
|
2016-08-05 17:00:46 +02:00
|
|
|
};
|
|
|
|
|
2016-08-25 22:20:44 +02:00
|
|
|
// create the root snapshot dir if it doesn't exist.
|
2016-09-07 15:27:28 +02:00
|
|
|
if let Err(e) = fs::create_dir_all(&service.snapshot_root) {
|
2016-08-10 16:29:40 +02:00
|
|
|
if e.kind() != ErrorKind::AlreadyExists {
|
|
|
|
return Err(e.into())
|
2016-08-05 17:00:46 +02:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// delete the temporary restoration dir if it does exist.
|
2016-08-10 16:29:40 +02:00
|
|
|
if let Err(e) = fs::remove_dir_all(service.restoration_dir()) {
|
|
|
|
if e.kind() != ErrorKind::NotFound {
|
|
|
|
return Err(e.into())
|
2016-08-05 17:00:46 +02:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-09-05 14:25:56 +02:00
|
|
|
// delete the temporary snapshot dir if it does exist.
|
|
|
|
if let Err(e) = fs::remove_dir_all(service.temp_snapshot_dir()) {
|
2016-09-05 14:28:28 +02:00
|
|
|
if e.kind() != ErrorKind::NotFound {
|
2016-09-05 14:25:56 +02:00
|
|
|
return Err(e.into())
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-09-07 15:27:28 +02:00
|
|
|
let reader = LooseReader::new(service.snapshot_dir()).ok();
|
|
|
|
*service.reader.get_mut() = reader;
|
2016-08-05 17:00:46 +02:00
|
|
|
|
2016-09-07 15:27:28 +02:00
|
|
|
Ok(service)
|
2016-08-05 17:00:46 +02:00
|
|
|
}
|
|
|
|
|
2016-08-25 22:20:44 +02:00
|
|
|
// get the current snapshot dir.
|
|
|
|
fn snapshot_dir(&self) -> PathBuf {
|
2016-09-07 15:27:28 +02:00
|
|
|
let mut dir = self.snapshot_root.clone();
|
2016-08-25 22:20:44 +02:00
|
|
|
dir.push("current");
|
|
|
|
dir
|
|
|
|
}
|
|
|
|
|
2016-09-02 16:15:25 +02:00
|
|
|
// get the temporary snapshot dir.
|
|
|
|
fn temp_snapshot_dir(&self) -> PathBuf {
|
2016-09-07 15:27:28 +02:00
|
|
|
let mut dir = self.snapshot_root.clone();
|
2016-09-02 16:15:25 +02:00
|
|
|
dir.push("in_progress");
|
|
|
|
dir
|
|
|
|
}
|
|
|
|
|
2016-08-05 17:00:46 +02:00
|
|
|
// get the restoration directory.
|
|
|
|
fn restoration_dir(&self) -> PathBuf {
|
2016-09-07 15:27:28 +02:00
|
|
|
let mut dir = self.snapshot_root.clone();
|
2016-08-05 17:00:46 +02:00
|
|
|
dir.push("restoration");
|
|
|
|
dir
|
|
|
|
}
|
|
|
|
|
|
|
|
// restoration db path.
|
|
|
|
fn restoration_db(&self) -> PathBuf {
|
|
|
|
let mut dir = self.restoration_dir();
|
|
|
|
dir.push("db");
|
|
|
|
dir
|
|
|
|
}
|
|
|
|
|
2016-08-25 22:20:44 +02:00
|
|
|
// temporary snapshot recovery path.
|
|
|
|
fn temp_recovery_dir(&self) -> PathBuf {
|
|
|
|
let mut dir = self.restoration_dir();
|
|
|
|
dir.push("temp");
|
|
|
|
dir
|
|
|
|
}
|
|
|
|
|
2016-08-05 17:00:46 +02:00
|
|
|
// replace one the client's database with our own.
|
|
|
|
fn replace_client_db(&self) -> Result<(), Error> {
|
|
|
|
let our_db = self.restoration_db();
|
|
|
|
|
2016-12-27 12:53:56 +01:00
|
|
|
self.db_restore.restore_db(&*our_db.to_string_lossy())?;
|
2016-09-06 15:31:13 +02:00
|
|
|
Ok(())
|
2016-08-05 17:00:46 +02:00
|
|
|
}
|
|
|
|
|
2016-09-11 14:05:59 +02:00
|
|
|
/// Get a reference to the snapshot reader.
|
|
|
|
pub fn reader(&self) -> RwLockReadGuard<Option<LooseReader>> {
|
|
|
|
self.reader.read()
|
|
|
|
}
|
|
|
|
|
2016-09-06 17:44:11 +02:00
|
|
|
/// Tick the snapshot service. This will log any active snapshot
|
|
|
|
/// being taken.
|
|
|
|
pub fn tick(&self) {
|
2016-09-07 15:27:14 +02:00
|
|
|
if self.progress.done() || !self.taking_snapshot.load(Ordering::SeqCst) { return }
|
2016-09-06 17:44:11 +02:00
|
|
|
|
|
|
|
let p = &self.progress;
|
|
|
|
info!("Snapshot: {} accounts {} blocks {} bytes", p.accounts(), p.blocks(), p.size());
|
|
|
|
}
|
|
|
|
|
2016-09-02 16:15:25 +02:00
|
|
|
/// Take a snapshot at the block with the given number.
|
|
|
|
/// calling this while a restoration is in progress or vice versa
|
|
|
|
/// will lead to a race condition where the first one to finish will
|
|
|
|
/// have their produced snapshot overwritten.
|
|
|
|
pub fn take_snapshot(&self, client: &Client, num: u64) -> Result<(), Error> {
|
2016-09-07 15:27:14 +02:00
|
|
|
if self.taking_snapshot.compare_and_swap(false, true, Ordering::SeqCst) {
|
|
|
|
info!("Skipping snapshot at #{} as another one is currently in-progress.", num);
|
|
|
|
return Ok(());
|
|
|
|
}
|
|
|
|
|
2016-09-02 16:15:25 +02:00
|
|
|
info!("Taking snapshot at #{}", num);
|
2016-09-06 17:44:11 +02:00
|
|
|
self.progress.reset();
|
2016-09-02 16:15:25 +02:00
|
|
|
|
|
|
|
let temp_dir = self.temp_snapshot_dir();
|
|
|
|
let snapshot_dir = self.snapshot_dir();
|
|
|
|
|
|
|
|
let _ = fs::remove_dir_all(&temp_dir);
|
2016-09-02 19:00:20 +02:00
|
|
|
|
2016-12-27 12:53:56 +01:00
|
|
|
let writer = LooseWriter::new(temp_dir.clone())?;
|
2016-09-02 16:15:25 +02:00
|
|
|
|
2016-09-02 19:00:20 +02:00
|
|
|
let guard = Guard::new(temp_dir.clone());
|
2016-12-09 23:01:43 +01:00
|
|
|
let res = client.take_snapshot(writer, BlockId::Number(num), &self.progress);
|
2016-09-07 15:27:14 +02:00
|
|
|
|
|
|
|
self.taking_snapshot.store(false, Ordering::SeqCst);
|
2016-09-21 12:56:13 +02:00
|
|
|
if let Err(e) = res {
|
2016-10-14 14:44:56 +02:00
|
|
|
if client.chain_info().best_block_number >= num + client.pruning_history() {
|
2016-09-21 12:56:13 +02:00
|
|
|
// "Cancelled" is mincing words a bit -- what really happened
|
|
|
|
// is that the state we were snapshotting got pruned out
|
|
|
|
// before we could finish.
|
2016-10-28 16:10:30 +02:00
|
|
|
info!("Periodic snapshot failed: block state pruned.\
|
|
|
|
Run with a longer `--pruning-history` or with `--no-periodic-snapshot`");
|
2016-09-21 12:56:13 +02:00
|
|
|
return Ok(())
|
|
|
|
} else {
|
|
|
|
return Err(e);
|
|
|
|
}
|
|
|
|
}
|
2016-09-06 17:44:11 +02:00
|
|
|
|
|
|
|
info!("Finished taking snapshot at #{}", num);
|
|
|
|
|
2016-09-02 16:15:25 +02:00
|
|
|
let mut reader = self.reader.write();
|
|
|
|
|
|
|
|
// destroy the old snapshot reader.
|
|
|
|
*reader = None;
|
|
|
|
|
2016-09-13 10:33:03 +02:00
|
|
|
if snapshot_dir.exists() {
|
2016-12-27 12:53:56 +01:00
|
|
|
fs::remove_dir_all(&snapshot_dir)?;
|
2016-09-13 10:33:03 +02:00
|
|
|
}
|
|
|
|
|
2016-12-27 12:53:56 +01:00
|
|
|
fs::rename(temp_dir, &snapshot_dir)?;
|
2016-09-02 16:15:25 +02:00
|
|
|
|
2016-12-27 12:53:56 +01:00
|
|
|
*reader = Some(LooseReader::new(snapshot_dir)?);
|
2016-09-02 16:15:25 +02:00
|
|
|
|
2016-09-02 19:00:20 +02:00
|
|
|
guard.disarm();
|
2016-09-02 16:15:25 +02:00
|
|
|
Ok(())
|
|
|
|
}
|
|
|
|
|
2016-08-25 22:20:44 +02:00
|
|
|
/// Initialize the restoration synchronously.
|
2016-09-11 14:05:59 +02:00
|
|
|
/// The recover flag indicates whether to recover the restored snapshot.
|
|
|
|
pub fn init_restore(&self, manifest: ManifestData, recover: bool) -> Result<(), Error> {
|
2016-08-25 22:20:44 +02:00
|
|
|
let rest_dir = self.restoration_dir();
|
|
|
|
|
|
|
|
let mut res = self.restoration.lock();
|
|
|
|
|
2016-09-11 14:05:59 +02:00
|
|
|
self.state_chunks.store(0, Ordering::SeqCst);
|
|
|
|
self.block_chunks.store(0, Ordering::SeqCst);
|
|
|
|
|
2016-08-25 22:20:44 +02:00
|
|
|
// tear down existing restoration.
|
|
|
|
*res = None;
|
|
|
|
|
|
|
|
// delete and restore the restoration dir.
|
|
|
|
if let Err(e) = fs::remove_dir_all(&rest_dir) {
|
|
|
|
match e.kind() {
|
|
|
|
ErrorKind::NotFound => {},
|
|
|
|
_ => return Err(e.into()),
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-12-27 12:53:56 +01:00
|
|
|
fs::create_dir_all(&rest_dir)?;
|
2016-08-25 22:20:44 +02:00
|
|
|
|
|
|
|
// make new restoration.
|
2016-09-11 14:05:59 +02:00
|
|
|
let writer = match recover {
|
2016-12-27 12:53:56 +01:00
|
|
|
true => Some(LooseWriter::new(self.temp_recovery_dir())?),
|
2016-09-11 14:05:59 +02:00
|
|
|
false => None
|
|
|
|
};
|
2016-08-25 22:20:44 +02:00
|
|
|
|
|
|
|
let params = RestorationParams {
|
|
|
|
manifest: manifest,
|
|
|
|
pruning: self.pruning,
|
|
|
|
db_path: self.restoration_db(),
|
2016-09-07 15:27:28 +02:00
|
|
|
db_config: &self.db_config,
|
2016-08-25 22:20:44 +02:00
|
|
|
writer: writer,
|
|
|
|
genesis: &self.genesis_block,
|
2016-09-02 19:00:20 +02:00
|
|
|
guard: Guard::new(rest_dir),
|
2017-04-19 20:31:53 +02:00
|
|
|
engine: &*self.engine,
|
2016-08-25 22:20:44 +02:00
|
|
|
};
|
|
|
|
|
2016-10-18 18:16:00 +02:00
|
|
|
let state_chunks = params.manifest.state_hashes.len();
|
|
|
|
let block_chunks = params.manifest.block_hashes.len();
|
|
|
|
|
2016-12-27 12:53:56 +01:00
|
|
|
*res = Some(Restoration::new(params)?);
|
2016-08-25 22:20:44 +02:00
|
|
|
|
2016-09-06 15:31:13 +02:00
|
|
|
*self.status.lock() = RestorationStatus::Ongoing {
|
2016-10-18 18:16:00 +02:00
|
|
|
state_chunks: state_chunks as u32,
|
|
|
|
block_chunks: block_chunks as u32,
|
2016-09-11 14:05:59 +02:00
|
|
|
state_chunks_done: self.state_chunks.load(Ordering::SeqCst) as u32,
|
|
|
|
block_chunks_done: self.block_chunks.load(Ordering::SeqCst) as u32,
|
2016-09-06 15:31:13 +02:00
|
|
|
};
|
2016-11-13 13:52:53 +01:00
|
|
|
|
|
|
|
self.restoring_snapshot.store(true, Ordering::SeqCst);
|
2016-08-25 22:20:44 +02:00
|
|
|
Ok(())
|
|
|
|
}
|
|
|
|
|
2016-08-05 17:00:46 +02:00
|
|
|
// finalize the restoration. this accepts an already-locked
|
|
|
|
// restoration as an argument -- so acquiring it again _will_
|
|
|
|
// lead to deadlock.
|
|
|
|
fn finalize_restoration(&self, rest: &mut Option<Restoration>) -> Result<(), Error> {
|
|
|
|
trace!(target: "snapshot", "finalizing restoration");
|
|
|
|
|
2016-09-11 14:05:59 +02:00
|
|
|
let recover = rest.as_ref().map_or(false, |rest| rest.writer.is_some());
|
2016-08-05 17:00:46 +02:00
|
|
|
|
2016-08-25 22:20:44 +02:00
|
|
|
// destroy the restoration before replacing databases and snapshot.
|
2017-05-17 12:41:33 +02:00
|
|
|
rest.take()
|
|
|
|
.map(|r| r.finalize(&*self.engine))
|
|
|
|
.unwrap_or(Ok(()))?;
|
|
|
|
|
2016-12-27 12:53:56 +01:00
|
|
|
self.replace_client_db()?;
|
2016-08-05 17:00:46 +02:00
|
|
|
|
2016-09-11 14:05:59 +02:00
|
|
|
if recover {
|
|
|
|
let mut reader = self.reader.write();
|
|
|
|
*reader = None; // destroy the old reader if it existed.
|
2016-08-25 22:20:44 +02:00
|
|
|
|
2016-09-11 14:05:59 +02:00
|
|
|
let snapshot_dir = self.snapshot_dir();
|
2016-08-25 22:20:44 +02:00
|
|
|
|
2016-09-13 10:33:03 +02:00
|
|
|
if snapshot_dir.exists() {
|
|
|
|
trace!(target: "snapshot", "removing old snapshot dir at {}", snapshot_dir.to_string_lossy());
|
2016-12-27 12:53:56 +01:00
|
|
|
fs::remove_dir_all(&snapshot_dir)?;
|
2016-08-25 22:20:44 +02:00
|
|
|
}
|
|
|
|
|
2016-09-11 14:05:59 +02:00
|
|
|
trace!(target: "snapshot", "copying restored snapshot files over");
|
2016-12-27 12:53:56 +01:00
|
|
|
fs::rename(self.temp_recovery_dir(), &snapshot_dir)?;
|
2016-08-05 17:00:46 +02:00
|
|
|
|
2016-12-27 12:53:56 +01:00
|
|
|
*reader = Some(LooseReader::new(snapshot_dir)?);
|
2016-09-11 14:05:59 +02:00
|
|
|
}
|
2016-08-25 22:20:44 +02:00
|
|
|
|
2016-09-11 14:05:59 +02:00
|
|
|
let _ = fs::remove_dir_all(self.restoration_dir());
|
2016-08-25 22:20:44 +02:00
|
|
|
*self.status.lock() = RestorationStatus::Inactive;
|
|
|
|
|
2016-08-05 17:00:46 +02:00
|
|
|
Ok(())
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Feed a chunk of either kind. no-op if no restoration or status is wrong.
|
|
|
|
fn feed_chunk(&self, hash: H256, chunk: &[u8], is_state: bool) -> Result<(), Error> {
|
2016-08-25 22:20:44 +02:00
|
|
|
// TODO: be able to process block chunks and state chunks at same time?
|
2016-10-25 18:40:01 +02:00
|
|
|
let (result, db) = {
|
|
|
|
let mut restoration = self.restoration.lock();
|
|
|
|
|
|
|
|
match self.status() {
|
|
|
|
RestorationStatus::Inactive | RestorationStatus::Failed => return Ok(()),
|
|
|
|
RestorationStatus::Ongoing { .. } => {
|
|
|
|
let (res, db) = {
|
|
|
|
let rest = match *restoration {
|
|
|
|
Some(ref mut r) => r,
|
|
|
|
None => return Ok(()),
|
2016-08-05 17:00:46 +02:00
|
|
|
};
|
|
|
|
|
2016-10-25 18:40:01 +02:00
|
|
|
(match is_state {
|
2016-11-13 13:52:53 +01:00
|
|
|
true => rest.feed_state(hash, chunk, &self.restoring_snapshot),
|
|
|
|
false => rest.feed_blocks(hash, chunk, &*self.engine, &self.restoring_snapshot),
|
2016-10-25 18:40:01 +02:00
|
|
|
}.map(|_| rest.is_done()), rest.db.clone())
|
|
|
|
};
|
|
|
|
|
|
|
|
let res = match res {
|
|
|
|
Ok(is_done) => {
|
|
|
|
match is_state {
|
|
|
|
true => self.state_chunks.fetch_add(1, Ordering::SeqCst),
|
|
|
|
false => self.block_chunks.fetch_add(1, Ordering::SeqCst),
|
|
|
|
};
|
|
|
|
|
|
|
|
match is_done {
|
|
|
|
true => {
|
2016-12-27 12:53:56 +01:00
|
|
|
db.flush().map_err(::util::UtilError::SimpleString)?;
|
2016-10-26 16:14:13 +02:00
|
|
|
drop(db);
|
|
|
|
return self.finalize_restoration(&mut *restoration);
|
2016-10-25 18:40:01 +02:00
|
|
|
},
|
|
|
|
false => Ok(())
|
|
|
|
}
|
2016-08-05 17:00:46 +02:00
|
|
|
}
|
2016-10-25 18:40:01 +02:00
|
|
|
other => other.map(drop),
|
|
|
|
};
|
|
|
|
(res, db)
|
2016-08-05 17:00:46 +02:00
|
|
|
}
|
|
|
|
}
|
2016-10-25 18:40:01 +02:00
|
|
|
};
|
|
|
|
result.and_then(|_| db.flush().map_err(|e| ::util::UtilError::SimpleString(e).into()))
|
2016-08-05 17:00:46 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
/// Feed a state chunk to be processed synchronously.
|
|
|
|
pub fn feed_state_chunk(&self, hash: H256, chunk: &[u8]) {
|
|
|
|
match self.feed_chunk(hash, chunk, true) {
|
|
|
|
Ok(()) => (),
|
|
|
|
Err(e) => {
|
|
|
|
warn!("Encountered error during state restoration: {}", e);
|
|
|
|
*self.restoration.lock() = None;
|
|
|
|
*self.status.lock() = RestorationStatus::Failed;
|
|
|
|
let _ = fs::remove_dir_all(self.restoration_dir());
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Feed a block chunk to be processed synchronously.
|
|
|
|
pub fn feed_block_chunk(&self, hash: H256, chunk: &[u8]) {
|
|
|
|
match self.feed_chunk(hash, chunk, false) {
|
|
|
|
Ok(()) => (),
|
|
|
|
Err(e) => {
|
|
|
|
warn!("Encountered error during block restoration: {}", e);
|
|
|
|
*self.restoration.lock() = None;
|
|
|
|
*self.status.lock() = RestorationStatus::Failed;
|
|
|
|
let _ = fs::remove_dir_all(self.restoration_dir());
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
impl SnapshotService for Service {
|
|
|
|
fn manifest(&self) -> Option<ManifestData> {
|
2016-08-25 22:20:44 +02:00
|
|
|
self.reader.read().as_ref().map(|r| r.manifest().clone())
|
2016-08-05 17:00:46 +02:00
|
|
|
}
|
|
|
|
|
2017-05-17 12:41:33 +02:00
|
|
|
fn min_supported_version(&self) -> Option<u64> {
|
|
|
|
self.engine.snapshot_components()
|
|
|
|
.map(|c| c.min_supported_version())
|
|
|
|
}
|
|
|
|
|
2016-08-05 17:00:46 +02:00
|
|
|
fn chunk(&self, hash: H256) -> Option<Bytes> {
|
2016-08-25 22:20:44 +02:00
|
|
|
self.reader.read().as_ref().and_then(|r| r.chunk(hash).ok())
|
2016-08-05 17:00:46 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
fn status(&self) -> RestorationStatus {
|
2016-09-11 14:05:59 +02:00
|
|
|
let mut cur_status = self.status.lock();
|
2016-10-18 18:16:00 +02:00
|
|
|
if let RestorationStatus::Ongoing { ref mut state_chunks_done, ref mut block_chunks_done, .. } = *cur_status {
|
2016-09-11 14:05:59 +02:00
|
|
|
*state_chunks_done = self.state_chunks.load(Ordering::SeqCst) as u32;
|
|
|
|
*block_chunks_done = self.block_chunks.load(Ordering::SeqCst) as u32;
|
|
|
|
}
|
|
|
|
|
|
|
|
cur_status.clone()
|
2016-08-05 17:00:46 +02:00
|
|
|
}
|
|
|
|
|
2016-08-25 22:20:44 +02:00
|
|
|
fn begin_restore(&self, manifest: ManifestData) {
|
2016-10-30 09:56:34 +01:00
|
|
|
if let Err(e) = self.io_channel.lock().send(ClientIoMessage::BeginRestoration(manifest)) {
|
2016-10-25 18:40:01 +02:00
|
|
|
trace!("Error sending snapshot service message: {:?}", e);
|
|
|
|
}
|
2016-08-25 22:20:44 +02:00
|
|
|
}
|
2016-08-05 17:00:46 +02:00
|
|
|
|
2016-08-25 22:20:44 +02:00
|
|
|
fn abort_restore(&self) {
|
2016-11-13 13:52:53 +01:00
|
|
|
self.restoring_snapshot.store(false, Ordering::SeqCst);
|
2016-08-25 22:20:44 +02:00
|
|
|
*self.restoration.lock() = None;
|
|
|
|
*self.status.lock() = RestorationStatus::Inactive;
|
2016-08-05 17:00:46 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
fn restore_state_chunk(&self, hash: H256, chunk: Bytes) {
|
2016-10-30 09:56:34 +01:00
|
|
|
if let Err(e) = self.io_channel.lock().send(ClientIoMessage::FeedStateChunk(hash, chunk)) {
|
2016-10-25 18:40:01 +02:00
|
|
|
trace!("Error sending snapshot service message: {:?}", e);
|
|
|
|
}
|
2016-08-05 17:00:46 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
fn restore_block_chunk(&self, hash: H256, chunk: Bytes) {
|
2016-10-30 09:56:34 +01:00
|
|
|
if let Err(e) = self.io_channel.lock().send(ClientIoMessage::FeedBlockChunk(hash, chunk)) {
|
2016-10-25 18:40:01 +02:00
|
|
|
trace!("Error sending snapshot service message: {:?}", e);
|
|
|
|
}
|
2016-08-05 17:00:46 +02:00
|
|
|
}
|
2016-08-10 16:29:40 +02:00
|
|
|
}
|
2016-09-05 12:24:03 +02:00
|
|
|
|
2016-09-06 15:41:56 +02:00
|
|
|
impl Drop for Service {
|
|
|
|
fn drop(&mut self) {
|
|
|
|
self.abort_restore();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-09-05 12:24:03 +02:00
|
|
|
#[cfg(test)]
mod tests {
	use std::sync::Arc;
	use service::ClientIoMessage;
	use io::{IoService};
	use devtools::RandomTempPath;
	use tests::helpers::get_test_spec;
	use util::journaldb::Algorithm;
	use error::Error;
	use snapshot::{ManifestData, RestorationStatus, SnapshotService};
	use super::*;

	// database restore handler which accepts everything and does nothing.
	struct NoopDBRestore;
	impl DatabaseRestore for NoopDBRestore {
		fn restore_db(&self, _new_db: &str) -> Result<(), Error> {
			Ok(())
		}
	}

	// a freshly created service reports no snapshot and an inactive status,
	// and the message-sending entry points can be called without panicking.
	#[test]
	fn sends_async_messages() {
		let io_service = IoService::<ClientIoMessage>::start().unwrap();
		let spec = get_test_spec();

		let temp = RandomTempPath::new();
		let root = temp.as_path().to_owned();
		let snapshot_root = root.join("snapshot");
		let _client_db = root.join("client");

		let service = Service::new(ServiceParams {
			engine: spec.engine.clone(),
			genesis_block: spec.genesis_block(),
			db_config: Default::default(),
			pruning: Algorithm::Archive,
			channel: io_service.channel(),
			snapshot_root: snapshot_root,
			db_restore: Arc::new(NoopDBRestore),
		}).unwrap();

		assert!(service.manifest().is_none());
		assert!(service.chunk(Default::default()).is_none());
		assert_eq!(service.status(), RestorationStatus::Inactive);

		let manifest = ManifestData {
			version: 2,
			state_hashes: vec![],
			block_hashes: vec![],
			state_root: Default::default(),
			block_number: 0,
			block_hash: Default::default(),
		};

		service.begin_restore(manifest);
		service.abort_restore();
		service.restore_state_chunk(Default::default(), vec![]);
		service.restore_block_chunk(Default::default(), vec![]);
	}
}
|