use prelude::*; use super::*; use std::path::{Path, PathBuf}; use std::time::Duration; use pbr::ProgressBar; quick_error!{ #[derive(Debug)] pub enum IntegrityError { MissingChunk(hash: Hash) { description("Missing chunk") display("Missing chunk: {}", hash) } MissingBundleId(id: u32) { description("Missing bundle") display("Missing bundle: {}", id) } MissingBundle(id: BundleId) { description("Missing bundle") display("Missing bundle: {}", id) } NoSuchChunk(bundle: BundleId, chunk: u32) { description("No such chunk") display("Bundle {} does not contain the chunk {}", bundle, chunk) } RemoteBundlesNotInMap { description("Remote bundles missing from map") } MapContainsDuplicates { description("Map contains duplicates") } BrokenInode(path: PathBuf, err: Box) { cause(err) description("Broken inode") display("Broken inode: {:?}\n\tcaused by: {}", path, err) } MissingInodeData(path: PathBuf, err: Box) { cause(err) description("Missing inode data") display("Missing inode data in: {:?}\n\tcaused by: {}", path, err) } } } impl Repository { fn check_index_chunks(&self) -> Result<(), RepositoryError> { let mut progress = ProgressBar::new(self.index.len() as u64); progress.message("checking index: "); progress.set_max_refresh_rate(Some(Duration::from_millis(100))); for (count, (_hash, location)) in self.index.iter().enumerate() { // Lookup bundle id from map let bundle_id = try!(self.get_bundle_id(location.bundle)); // Get bundle object from bundledb let bundle = if let Some(bundle) = self.bundles.get_bundle_info(&bundle_id) { bundle } else { progress.finish_print("checking index: done."); return Err(IntegrityError::MissingBundle(bundle_id.clone()).into()); }; // Get chunk from bundle if bundle.info.chunk_count <= location.chunk as usize { progress.finish_print("checking index: done."); return Err( IntegrityError::NoSuchChunk(bundle_id.clone(), location.chunk).into() ); } if count % 1000 == 0 { progress.set(count as u64); } } progress.finish_print("checking index: done."); Ok(()) } fn check_chunks( &self, checked: &mut Bitmap, chunks: &[Chunk], mark: bool, ) -> Result { let mut new = false; for &(hash, _len) in chunks { if let Some(pos) = self.index.pos(&hash) { new |= !checked.get(pos); if mark { checked.set(pos); } } else { return Err(IntegrityError::MissingChunk(hash).into()); } } Ok(new) } fn check_inode_contents( &mut self, inode: &Inode, checked: &mut Bitmap, ) -> Result<(), RepositoryError> { match inode.data { None | Some(FileData::Inline(_)) => (), Some(FileData::ChunkedDirect(ref chunks)) => { try!(self.check_chunks(checked, chunks, true)); } Some(FileData::ChunkedIndirect(ref chunks)) => { if try!(self.check_chunks(checked, chunks, true)) { let chunk_data = try!(self.get_data(chunks)); let chunks = ChunkList::read_from(&chunk_data); try!(self.check_chunks(checked, &chunks, true)); } } } Ok(()) } fn check_subtree( &mut self, path: PathBuf, chunks: &[Chunk], checked: &mut Bitmap, repair: bool, ) -> Result, RepositoryError> { let mut modified = false; match self.check_chunks(checked, chunks, false) { Ok(false) => return Ok(None), Ok(true) => (), Err(err) => return Err(IntegrityError::BrokenInode(path, Box::new(err)).into()), } let mut inode = try!(self.get_inode(chunks)); // Mark the content chunks as used if let Err(err) = self.check_inode_contents(&inode, checked) { if repair { warn!( "Problem detected: data of {:?} is corrupt\n\tcaused by: {}", path, err ); info!("Removing inode data"); inode.data = Some(FileData::Inline(vec![].into())); inode.size = 0; modified = true; } else { return Err(IntegrityError::MissingInodeData(path, Box::new(err)).into()); } } // Put children in todo if let Some(ref mut children) = inode.children { let mut removed = vec![]; for (name, chunks) in children.iter_mut() { match self.check_subtree(path.join(name), chunks, checked, repair) { Ok(None) => (), Ok(Some(c)) => { *chunks = c; modified = true; } Err(err) => { if repair { warn!( "Problem detected: inode {:?} is corrupt\n\tcaused by: {}", path.join(name), err ); info!("Removing broken inode from backup"); removed.push(name.to_string()); modified = true; } else { return Err(err); } } } } for name in removed { children.remove(&name); } } if modified { Ok(Some(try!(self.put_inode(&inode)))) } else { try!(self.check_chunks(checked, chunks, true)); Ok(None) } } fn evacuate_broken_backup(&self, name: &str) -> Result<(), RepositoryError> { warn!( "The backup {} was corrupted and needed to be modified.", name ); let src = self.layout.backup_path(name); let mut dst = src.with_extension("backup.broken"); let mut num = 1; while dst.exists() { dst = src.with_extension(&format!("backup.{}.broken", num)); num += 1; } if fs::rename(&src, &dst).is_err() { try!(fs::copy(&src, &dst)); try!(fs::remove_file(&src)); } info!("The original backup was renamed to {:?}", dst); Ok(()) } #[inline] pub fn check_backup( &mut self, name: &str, backup: &mut Backup, repair: bool, ) -> Result<(), RepositoryError> { let _lock = if repair { try!(self.write_mode()); Some(self.lock(false)) } else { None }; info!("Checking backup..."); let mut checked = Bitmap::new(self.index.capacity()); match self.check_subtree( Path::new("").to_path_buf(), &backup.root, &mut checked, repair ) { Ok(None) => (), Ok(Some(chunks)) => { try!(self.flush()); backup.root = chunks; backup.modified = true; try!(self.evacuate_broken_backup(name)); try!(self.save_backup(backup, name)); } Err(err) => { if repair { warn!( "The root of the backup {} has been corrupted\n\tcaused by: {}", name, err ); try!(self.evacuate_broken_backup(name)); } else { return Err(err); } } } Ok(()) } pub fn check_backup_inode( &mut self, name: &str, backup: &mut Backup, path: &Path, repair: bool, ) -> Result<(), RepositoryError> { let _lock = if repair { try!(self.write_mode()); Some(self.lock(false)) } else { None }; info!("Checking inode..."); let mut checked = Bitmap::new(self.index.capacity()); let mut inodes = try!(self.get_backup_path(backup, path)); let mut inode = inodes.pop().unwrap(); let mut modified = false; if let Err(err) = self.check_inode_contents(&inode, &mut checked) { if repair { warn!( "Problem detected: data of {:?} is corrupt\n\tcaused by: {}", path, err ); info!("Removing inode data"); inode.data = Some(FileData::Inline(vec![].into())); inode.size = 0; modified = true; } else { return Err( IntegrityError::MissingInodeData(path.to_path_buf(), Box::new(err)).into() ); } } if let Some(ref mut children) = inode.children { let mut removed = vec![]; for (name, chunks) in children.iter_mut() { match self.check_subtree(path.join(name), chunks, &mut checked, repair) { Ok(None) => (), Ok(Some(c)) => { *chunks = c; modified = true; } Err(err) => { if repair { warn!( "Problem detected: inode {:?} is corrupt\n\tcaused by: {}", path.join(name), err ); info!("Removing broken inode from backup"); removed.push(name.to_string()); modified = true; } else { return Err(err); } } } } for name in removed { children.remove(&name); } } let mut chunks = try!(self.put_inode(&inode)); while let Some(mut parent) = inodes.pop() { parent.children.as_mut().unwrap().insert(inode.name, chunks); inode = parent; chunks = try!(self.put_inode(&inode)); } if modified { try!(self.flush()); backup.root = chunks; backup.modified = true; try!(self.evacuate_broken_backup(name)); try!(self.save_backup(backup, name)); } Ok(()) } pub fn check_backups(&mut self, repair: bool) -> Result<(), RepositoryError> { let _lock = if repair { try!(self.write_mode()); Some(self.lock(false)) } else { None }; info!("Checking backups..."); let mut checked = Bitmap::new(self.index.capacity()); let backup_map = match self.get_all_backups() { Ok(backup_map) => backup_map, Err(RepositoryError::BackupFile(BackupFileError::PartialBackupsList(backup_map, _failed))) => { warn!("Some backups could not be read, ignoring them"); backup_map } Err(err) => return Err(err), }; for (name, mut backup) in ProgressIter::new("checking backups", backup_map.len(), backup_map.into_iter()) { let path = format!("{}::", name); match self.check_subtree( Path::new(&path).to_path_buf(), &backup.root, &mut checked, repair ) { Ok(None) => (), Ok(Some(chunks)) => { try!(self.flush()); backup.root = chunks; backup.modified = true; try!(self.evacuate_broken_backup(&name)); try!(self.save_backup(&backup, &name)); } Err(err) => { if repair { warn!( "The root of the backup {} has been corrupted\n\tcaused by: {}", name, err ); try!(self.evacuate_broken_backup(&name)); } else { return Err(err); } } } } Ok(()) } pub fn check_repository(&mut self, repair: bool) -> Result<(), RepositoryError> { info!("Checking repository integrity..."); let mut rebuild = false; for (_id, bundle_id) in self.bundle_map.bundles() { if self.bundles.get_bundle_info(&bundle_id).is_none() { if repair { warn!( "Problem detected: bundle map contains unknown bundle {}", bundle_id ); rebuild = true; } else { return Err(IntegrityError::MissingBundle(bundle_id).into()); } } } if self.bundle_map.len() < self.bundles.len() { if repair { warn!("Problem detected: bundle map does not contain all remote bundles"); rebuild = true; } else { return Err(IntegrityError::RemoteBundlesNotInMap.into()); } } if self.bundle_map.len() > self.bundles.len() { if repair { warn!("Problem detected: bundle map contains bundles multiple times"); rebuild = true; } else { return Err(IntegrityError::MapContainsDuplicates.into()); } } if rebuild { try!(self.rebuild_bundle_map()); try!(self.rebuild_index()); } Ok(()) } pub fn rebuild_bundle_map(&mut self) -> Result<(), RepositoryError> { info!("Rebuilding bundle map from bundles"); self.bundle_map = BundleMap::create(); for bundle in self.bundles.list_bundles() { let bundle_id = match bundle.mode { BundleMode::Data => self.next_data_bundle, BundleMode::Meta => self.next_meta_bundle, }; self.bundle_map.set(bundle_id, bundle.id.clone()); if self.next_meta_bundle == bundle_id { self.next_meta_bundle = self.next_free_bundle_id() } if self.next_data_bundle == bundle_id { self.next_data_bundle = self.next_free_bundle_id() } } self.save_bundle_map() } pub fn rebuild_index(&mut self) -> Result<(), RepositoryError> { info!("Rebuilding index from bundles"); self.index.clear(); let mut bundles = self.bundle_map.bundles(); bundles.sort_by_key(|&(_, ref v)| v.clone()); for (num, id) in ProgressIter::new("Rebuilding index from bundles", bundles.len(), bundles.into_iter()) { let chunks = try!(self.bundles.get_chunk_list(&id)); for (i, (hash, _len)) in chunks.into_inner().into_iter().enumerate() { try!(self.index.set( &hash, &Location { bundle: num as u32, chunk: i as u32 } )); } } Ok(()) } #[inline] pub fn check_index(&mut self, repair: bool) -> Result<(), RepositoryError> { if repair { try!(self.write_mode()); } info!("Checking index integrity..."); if let Err(err) = self.index.check() { if repair { warn!( "Problem detected: index was corrupted\n\tcaused by: {}", err ); return self.rebuild_index(); } else { return Err(err.into()); } } info!("Checking index entries..."); if let Err(err) = self.check_index_chunks() { if repair { warn!( "Problem detected: index entries were inconsistent\n\tcaused by: {}", err ); return self.rebuild_index(); } else { return Err(err.into()); } } Ok(()) } #[inline] pub fn check_bundles(&mut self, full: bool, repair: bool) -> Result<(), RepositoryError> { if repair { try!(self.write_mode()); } info!("Checking bundle integrity..."); if try!(self.bundles.check(full, repair)) { // Some bundles got repaired warn!("Some bundles have been rewritten, please remove the broken bundles manually."); try!(self.rebuild_bundle_map()); try!(self.rebuild_index()); } Ok(()) } }