2020-09-22 14:53:52 +02:00
|
|
|
// Copyright 2015-2020 Parity Technologies (UK) Ltd.
|
|
|
|
// This file is part of OpenEthereum.
|
2016-05-24 22:38:11 +02:00
|
|
|
|
2020-09-22 14:53:52 +02:00
|
|
|
// OpenEthereum is free software: you can redistribute it and/or modify
|
2016-05-24 22:38:11 +02:00
|
|
|
// it under the terms of the GNU General Public License as published by
|
|
|
|
// the Free Software Foundation, either version 3 of the License, or
|
|
|
|
// (at your option) any later version.
|
|
|
|
|
2020-09-22 14:53:52 +02:00
|
|
|
// OpenEthereum is distributed in the hope that it will be useful,
|
2016-05-24 22:38:11 +02:00
|
|
|
// but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
// GNU General Public License for more details.
|
|
|
|
|
|
|
|
// You should have received a copy of the GNU General Public License
|
2020-09-22 14:53:52 +02:00
|
|
|
// along with OpenEthereum. If not, see <http://www.gnu.org/licenses/>.
|
2016-05-24 22:38:11 +02:00
|
|
|
|
|
|
|
//! DB Migration module.
|
|
|
|
|
2017-10-10 20:01:27 +02:00
|
|
|
#[macro_use]
|
|
|
|
extern crate log;
|
|
|
|
#[macro_use]
|
|
|
|
extern crate macros;
|
|
|
|
|
|
|
|
extern crate kvdb;
|
2017-10-12 15:36:27 +02:00
|
|
|
extern crate kvdb_rocksdb;
|
2017-10-10 20:01:27 +02:00
|
|
|
|
2020-08-05 06:08:03 +02:00
|
|
|
use std::{
|
|
|
|
collections::BTreeMap,
|
|
|
|
error, fs, io,
|
|
|
|
path::{Path, PathBuf},
|
|
|
|
sync::Arc,
|
|
|
|
};
|
2016-07-06 12:05:23 +02:00
|
|
|
|
2017-10-12 15:36:27 +02:00
|
|
|
use kvdb::DBTransaction;
|
|
|
|
use kvdb_rocksdb::{CompactionProfile, Database, DatabaseConfig};
|
2016-07-06 12:05:23 +02:00
|
|
|
|
2020-08-05 06:08:03 +02:00
|
|
|
/// Wraps any boxable error payload in an `io::Error` of kind `Other`.
///
/// Accepts anything convertible into `Box<dyn Error + Send + Sync>`, which
/// includes string slices, so it can be used both for ad-hoc messages and as
/// a `map_err` adapter for foreign error types.
fn other_io_err<E>(e: E) -> io::Error
where
    E: Into<Box<dyn error::Error + Send + Sync>>,
{
    io::Error::new(io::ErrorKind::Other, e)
}
|
|
|
|
|
2016-07-06 12:05:23 +02:00
|
|
|
/// Migration config.
|
2016-07-11 09:46:33 +02:00
|
|
|
#[derive(Clone)]
|
2016-07-06 12:05:23 +02:00
|
|
|
pub struct Config {
|
2020-08-05 06:08:03 +02:00
|
|
|
/// Defines how many elements should be migrated at once.
|
|
|
|
pub batch_size: usize,
|
|
|
|
/// Database compaction profile.
|
|
|
|
pub compaction_profile: CompactionProfile,
|
2016-07-06 12:05:23 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
impl Default for Config {
|
2020-08-05 06:08:03 +02:00
|
|
|
fn default() -> Self {
|
|
|
|
Config {
|
|
|
|
batch_size: 1024,
|
|
|
|
compaction_profile: Default::default(),
|
|
|
|
}
|
|
|
|
}
|
2016-07-06 12:05:23 +02:00
|
|
|
}
|
|
|
|
|
2016-07-11 09:46:33 +02:00
|
|
|
/// A batch of key-value pairs to be written into the database.
pub struct Batch {
    /// Entries collected since the last commit, keyed by raw key bytes.
    inner: BTreeMap<Vec<u8>, Vec<u8>>,
    /// Number of pending entries at which `insert` commits the batch.
    batch_size: usize,
    /// Column every entry of this batch is written to.
    column: Option<u32>,
}
|
|
|
|
|
|
|
|
impl Batch {
|
2020-08-05 06:08:03 +02:00
|
|
|
/// Make a new batch with the given config.
|
|
|
|
pub fn new(config: &Config, col: Option<u32>) -> Self {
|
|
|
|
Batch {
|
|
|
|
inner: BTreeMap::new(),
|
|
|
|
batch_size: config.batch_size,
|
|
|
|
column: col,
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Insert a value into the batch, committing if necessary.
|
|
|
|
pub fn insert(&mut self, key: Vec<u8>, value: Vec<u8>, dest: &mut Database) -> io::Result<()> {
|
|
|
|
self.inner.insert(key, value);
|
|
|
|
if self.inner.len() == self.batch_size {
|
|
|
|
self.commit(dest)?;
|
|
|
|
}
|
|
|
|
Ok(())
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Commit all the items in the batch to the given database.
|
|
|
|
pub fn commit(&mut self, dest: &mut Database) -> io::Result<()> {
|
|
|
|
if self.inner.is_empty() {
|
|
|
|
return Ok(());
|
|
|
|
}
|
|
|
|
|
|
|
|
let mut transaction = DBTransaction::new();
|
|
|
|
|
|
|
|
for keypair in &self.inner {
|
|
|
|
transaction.put(self.column, &keypair.0, &keypair.1);
|
|
|
|
}
|
|
|
|
|
|
|
|
self.inner.clear();
|
|
|
|
dest.write(transaction)
|
|
|
|
}
|
2016-10-03 12:02:43 +02:00
|
|
|
}
|
|
|
|
|
2016-07-06 12:05:23 +02:00
|
|
|
/// A generalized migration from the given db to a destination db.
|
2016-05-24 22:38:11 +02:00
|
|
|
pub trait Migration: 'static {
|
2020-08-05 06:08:03 +02:00
|
|
|
/// Number of columns in the database before the migration.
|
|
|
|
fn pre_columns(&self) -> Option<u32> {
|
|
|
|
self.columns()
|
|
|
|
}
|
|
|
|
/// Number of columns in database after the migration.
|
|
|
|
fn columns(&self) -> Option<u32>;
|
|
|
|
/// Whether this migration alters any existing columns.
|
|
|
|
/// if not, then column families will simply be added and `migrate` will never be called.
|
|
|
|
fn alters_existing(&self) -> bool {
|
|
|
|
true
|
|
|
|
}
|
|
|
|
/// Version of the database after the migration.
|
|
|
|
fn version(&self) -> u32;
|
|
|
|
/// Migrate a source to a destination.
|
|
|
|
fn migrate(
|
|
|
|
&mut self,
|
|
|
|
source: Arc<Database>,
|
|
|
|
config: &Config,
|
|
|
|
destination: &mut Database,
|
|
|
|
col: Option<u32>,
|
|
|
|
) -> io::Result<()>;
|
2016-07-06 12:05:23 +02:00
|
|
|
}
|
|
|
|
|
2018-02-22 14:53:10 +01:00
|
|
|
/// A simple migration over key-value pairs of a single column.
///
/// Every type implementing this trait automatically implements `Migration`.
pub trait SimpleMigration: 'static {
    /// Number of columns in database after the migration.
    fn columns(&self) -> Option<u32>;

    /// Version of database after the migration.
    fn version(&self) -> u32;

    /// Index of column which should be migrated.
    /// Entries of all other columns are copied unchanged.
    fn migrated_column_index(&self) -> Option<u32>;

    /// Should migrate existing object to new database.
    /// Returns `None` if the object does not exist in new version of database.
    fn simple_migrate(&mut self, key: Vec<u8>, value: Vec<u8>) -> Option<(Vec<u8>, Vec<u8>)>;
}
|
|
|
|
|
2016-07-06 12:05:23 +02:00
|
|
|
impl<T: SimpleMigration> Migration for T {
|
2020-08-05 06:08:03 +02:00
|
|
|
fn columns(&self) -> Option<u32> {
|
|
|
|
SimpleMigration::columns(self)
|
|
|
|
}
|
|
|
|
|
|
|
|
fn version(&self) -> u32 {
|
|
|
|
SimpleMigration::version(self)
|
|
|
|
}
|
|
|
|
|
|
|
|
fn alters_existing(&self) -> bool {
|
|
|
|
true
|
|
|
|
}
|
|
|
|
|
|
|
|
fn migrate(
|
|
|
|
&mut self,
|
|
|
|
source: Arc<Database>,
|
|
|
|
config: &Config,
|
|
|
|
dest: &mut Database,
|
|
|
|
col: Option<u32>,
|
|
|
|
) -> io::Result<()> {
|
|
|
|
let migration_needed = col == SimpleMigration::migrated_column_index(self);
|
|
|
|
let mut batch = Batch::new(config, col);
|
|
|
|
|
|
|
|
let iter = match source.iter(col) {
|
|
|
|
Some(iter) => iter,
|
|
|
|
None => return Ok(()),
|
|
|
|
};
|
|
|
|
|
|
|
|
for (key, value) in iter {
|
|
|
|
if migration_needed {
|
|
|
|
if let Some((key, value)) = self.simple_migrate(key.into_vec(), value.into_vec()) {
|
|
|
|
batch.insert(key, value, dest)?;
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
batch.insert(key.into_vec(), value.into_vec(), dest)?;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
batch.commit(dest)
|
|
|
|
}
|
2016-05-24 22:38:11 +02:00
|
|
|
}
|
2016-07-06 12:05:23 +02:00
|
|
|
|
2017-02-26 18:41:40 +01:00
|
|
|
/// An even simpler migration which just changes the number of columns.
pub struct ChangeColumns {
    /// The amount of columns before this migration.
    pub pre_columns: Option<u32>,
    /// The amount of columns after this migration.
    pub post_columns: Option<u32>,
    /// The version after this migration.
    pub version: u32,
}
|
|
|
|
|
|
|
|
impl Migration for ChangeColumns {
|
2020-08-05 06:08:03 +02:00
|
|
|
fn pre_columns(&self) -> Option<u32> {
|
|
|
|
self.pre_columns
|
|
|
|
}
|
|
|
|
fn columns(&self) -> Option<u32> {
|
|
|
|
self.post_columns
|
|
|
|
}
|
|
|
|
fn version(&self) -> u32 {
|
|
|
|
self.version
|
|
|
|
}
|
|
|
|
fn alters_existing(&self) -> bool {
|
|
|
|
false
|
|
|
|
}
|
|
|
|
fn migrate(
|
|
|
|
&mut self,
|
|
|
|
_: Arc<Database>,
|
|
|
|
_: &Config,
|
|
|
|
_: &mut Database,
|
|
|
|
_: Option<u32>,
|
|
|
|
) -> io::Result<()> {
|
|
|
|
Ok(())
|
|
|
|
}
|
2017-02-26 18:41:40 +01:00
|
|
|
}
|
|
|
|
|
2016-07-06 12:05:23 +02:00
|
|
|
/// Get the path where all databases reside.
///
/// This is `path` with its last component removed. A path that has no
/// parent (for example a filesystem root or an empty path) is returned
/// unchanged.
fn database_path(path: &Path) -> PathBuf {
    let mut temp_path = path.to_owned();
    temp_path.pop();
    temp_path
}
|
|
|
|
|
|
|
|
/// Selects one of the two temporary migration databases.
enum TempIndex {
    One,
    Two,
}

impl TempIndex {
    /// Switches to the other temporary database.
    fn swap(&mut self) {
        *self = match *self {
            TempIndex::One => TempIndex::Two,
            TempIndex::Two => TempIndex::One,
        };
    }

    // given the path to the old database, get the path of this one.
    fn path(&self, db_root: &Path) -> PathBuf {
        let dir_name = match *self {
            TempIndex::One => "temp_migration_1",
            TempIndex::Two => "temp_migration_2",
        };

        db_root.join(dir_name)
    }
}
|
|
|
|
|
|
|
|
/// Manages database migration.
|
|
|
|
pub struct Manager {
|
2020-08-05 06:08:03 +02:00
|
|
|
config: Config,
|
2020-07-29 10:36:15 +02:00
|
|
|
migrations: Vec<Box<dyn Migration>>,
|
2016-07-06 12:05:23 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
impl Manager {
|
2020-08-05 06:08:03 +02:00
|
|
|
/// Creates new migration manager with given configuration.
|
|
|
|
pub fn new(config: Config) -> Self {
|
|
|
|
Manager {
|
|
|
|
config: config,
|
|
|
|
migrations: vec![],
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Adds new migration rules.
|
|
|
|
pub fn add_migration<T>(&mut self, migration: T) -> io::Result<()>
|
|
|
|
where
|
|
|
|
T: Migration,
|
|
|
|
{
|
|
|
|
let is_new = match self.migrations.last() {
|
|
|
|
Some(last) => migration.version() > last.version(),
|
|
|
|
None => true,
|
|
|
|
};
|
|
|
|
|
|
|
|
match is_new {
|
|
|
|
true => Ok(self.migrations.push(Box::new(migration))),
|
|
|
|
false => Err(other_io_err("Cannot add migration.")),
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Performs migration in order, starting with a source path, migrating between two temporary databases,
|
|
|
|
/// and producing a path where the final migration lives.
|
|
|
|
pub fn execute(&mut self, old_path: &Path, version: u32) -> io::Result<PathBuf> {
|
|
|
|
let config = self.config.clone();
|
|
|
|
let migrations = self.migrations_from(version);
|
|
|
|
trace!(target: "migration", "Total migrations to execute for version {}: {}", version, migrations.len());
|
|
|
|
if migrations.is_empty() {
|
|
|
|
return Err(other_io_err("Migration impossible"));
|
|
|
|
};
|
|
|
|
|
|
|
|
let columns = migrations.get(0).and_then(|m| m.pre_columns());
|
|
|
|
|
|
|
|
trace!(target: "migration", "Expecting database to contain {:?} columns", columns);
|
|
|
|
let mut db_config = DatabaseConfig {
|
|
|
|
max_open_files: 64,
|
|
|
|
memory_budget: None,
|
|
|
|
compaction: config.compaction_profile,
|
|
|
|
columns: columns,
|
|
|
|
};
|
|
|
|
|
|
|
|
let db_root = database_path(old_path);
|
|
|
|
let mut temp_idx = TempIndex::One;
|
|
|
|
let mut temp_path = old_path.to_path_buf();
|
|
|
|
|
|
|
|
// start with the old db.
|
|
|
|
let old_path_str = old_path
|
|
|
|
.to_str()
|
|
|
|
.ok_or_else(|| other_io_err("Migration impossible."))?;
|
|
|
|
let mut cur_db = Arc::new(Database::open(&db_config, old_path_str)?);
|
|
|
|
|
|
|
|
for migration in migrations {
|
|
|
|
trace!(target: "migration", "starting migration to version {}", migration.version());
|
|
|
|
// Change number of columns in new db
|
|
|
|
let current_columns = db_config.columns;
|
|
|
|
db_config.columns = migration.columns();
|
|
|
|
|
|
|
|
// slow migrations: alter existing data.
|
|
|
|
if migration.alters_existing() {
|
|
|
|
temp_path = temp_idx.path(&db_root);
|
|
|
|
|
|
|
|
// open the target temporary database.
|
|
|
|
let temp_path_str = temp_path
|
|
|
|
.to_str()
|
|
|
|
.ok_or_else(|| other_io_err("Migration impossible."))?;
|
|
|
|
let mut new_db = Database::open(&db_config, temp_path_str)?;
|
|
|
|
|
|
|
|
match current_columns {
|
|
|
|
// migrate only default column
|
|
|
|
None => migration.migrate(cur_db.clone(), &config, &mut new_db, None)?,
|
|
|
|
Some(v) => {
|
|
|
|
// Migrate all columns in previous DB
|
|
|
|
for col in 0..v {
|
|
|
|
migration.migrate(cur_db.clone(), &config, &mut new_db, Some(col))?
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
// next iteration, we will migrate from this db into the other temp.
|
|
|
|
cur_db = Arc::new(new_db);
|
|
|
|
temp_idx.swap();
|
|
|
|
|
|
|
|
// remove the other temporary migration database.
|
|
|
|
let _ = fs::remove_dir_all(temp_idx.path(&db_root));
|
|
|
|
} else {
|
|
|
|
// migrations which simply add or remove column families.
|
|
|
|
// we can do this in-place.
|
|
|
|
let goal_columns = migration.columns().unwrap_or(0);
|
|
|
|
while cur_db.num_columns() < goal_columns {
|
|
|
|
cur_db.add_column().map_err(other_io_err)?;
|
|
|
|
}
|
|
|
|
|
|
|
|
while cur_db.num_columns() > goal_columns {
|
|
|
|
cur_db.drop_column().map_err(other_io_err)?;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
Ok(temp_path)
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Returns true if migration is needed.
|
|
|
|
pub fn is_needed(&self, version: u32) -> bool {
|
|
|
|
match self.migrations.last() {
|
|
|
|
Some(last) => version < last.version(),
|
|
|
|
None => false,
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Find all needed migrations.
|
2020-07-29 10:36:15 +02:00
|
|
|
fn migrations_from(&mut self, version: u32) -> Vec<&mut Box<dyn Migration>> {
|
2020-08-05 06:08:03 +02:00
|
|
|
self.migrations
|
|
|
|
.iter_mut()
|
|
|
|
.filter(|m| m.version() > version)
|
|
|
|
.collect()
|
|
|
|
}
|
2016-07-28 23:46:24 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
/// Prints a dot every `max` ticks
pub struct Progress {
    /// Ticks counted since the last dot was printed.
    current: usize,
    /// Number of ticks between two dots.
    max: usize,
}

impl Default for Progress {
    /// Returns a progress meter that starts at zero and reports every
    /// 100 000 ticks.
    fn default() -> Self {
        Progress {
            current: 0,
            max: 100_000,
        }
    }
}
|
|
|
|
|
|
|
|
impl Progress {
|
2020-08-05 06:08:03 +02:00
|
|
|
/// Tick progress meter.
|
|
|
|
pub fn tick(&mut self) {
|
|
|
|
self.current += 1;
|
|
|
|
if self.current == self.max {
|
|
|
|
self.current = 0;
|
|
|
|
flush!(".");
|
|
|
|
}
|
|
|
|
}
|
2016-07-28 23:46:24 +02:00
|
|
|
}
|