aboutsummaryrefslogblamecommitdiff
path: root/src/garage/repair.rs
blob: 762a8300d6c9a9469f498cd623064128beeee7f5 (plain) (tree)
1
2
3
4
5
6
7
8
9
                     



                       
                                 


                                         

                              







                                
                                                                                             








                                                                              
                                























                                                                                   
                                                              


                                                                              
                                                                                  

                                                
                 





                                                                                                 

                                                                                             
 
                                                                                                   
                                                  




                                             
                                                                      

                                                           



                                                                                                                   
                                              






                                                                                                    
                                                                  

                                                            










                                                

                                                                                                   
                               
                                      

                              
                                                                                     
                               
                 






                                                                                          
 

                                                                                                  
 



                                                                                                      
                                                    






                                                                   

                                                                                            









                                                                                               
                                                                     









                                                
















                                                                                                     
 
use core::ops::Bound;
use std::sync::Arc;

use tokio::sync::watch;

use garage_model::garage::Garage;
use garage_model::s3::block_ref_table::*;
use garage_model::s3::object_table::*;
use garage_model::s3::version_table::*;
use garage_table::*;
use garage_util::error::Error;

use crate::*;

/// Entry point for the repair operations implemented in this file
/// (table resync, version / block-ref cleanup, block store repair and scrub).
pub struct Repair {
	/// Shared handle to the Garage instance whose tables and block manager
	/// the repair procedures operate on.
	pub garage: Arc<Garage>,
}

impl Repair {
	/// Runs the repair operation selected by `opt`.
	///
	/// Any error returned by the operation is logged as a warning and then
	/// dropped: this function never reports failure to its caller.
	pub async fn repair_worker(&self, opt: RepairOpt, must_exit: watch::Receiver<bool>) {
		if let Err(e) = self.repair_worker_aux(opt, must_exit).await {
			warn!("Repair worker failed with error: {}", e);
		}
	}

	/// Dispatches on `opt.what` and runs the matching repair procedure.
	///
	/// * `Tables` queues a full sync on the bucket, object, version,
	///   block-ref and key tables and returns without awaiting anything.
	/// * `Versions` / `BlockRefs` run the table scans implemented below.
	/// * `Blocks` / `Scrub` delegate to the block manager.
	///
	/// Returns the first error produced by the selected procedure.
	async fn repair_worker_aux(
		&self,
		opt: RepairOpt,
		must_exit: watch::Receiver<bool>,
	) -> Result<(), Error> {
		match opt.what {
			RepairWhat::Tables => {
				info!("Launching a full sync of tables");
				self.garage.bucket_table.syncer.add_full_sync();
				self.garage.object_table.syncer.add_full_sync();
				self.garage.version_table.syncer.add_full_sync();
				self.garage.block_ref_table.syncer.add_full_sync();
				self.garage.key_table.syncer.add_full_sync();
			}
			RepairWhat::Versions => {
				info!("Repairing the versions table");
				self.repair_versions(&must_exit).await?;
			}
			RepairWhat::BlockRefs => {
				info!("Repairing the block refs table");
				self.repair_block_ref(&must_exit).await?;
			}
			RepairWhat::Blocks => {
				info!("Repairing the stored blocks");
				self.garage
					.block_manager
					.repair_data_store(&must_exit)
					.await?;
			}
			RepairWhat::Scrub { tranquility } => {
				info!("Verifying integrity of stored blocks");
				self.garage
					.block_manager
					.scrub_data_store(&must_exit, tranquility)
					.await?;
			}
		}
		Ok(())
	}

	/// Scans the version table's store and marks orphaned versions as deleted.
	///
	/// Each entry that is not already flagged deleted is checked against the
	/// object table: if the object is missing, or none of its versions has
	/// the same UUID in a state other than `Aborted`, a replacement `Version`
	/// built with the deleted flag set is inserted.
	///
	/// The scan stops once the store is exhausted or `must_exit` holds `true`.
	/// Decoding, lookup and insertion errors abort the scan and are returned.
	async fn repair_versions(&self, must_exit: &watch::Receiver<bool>) -> Result<(), Error> {
		// Key of the last entry visited; the next lookup resumes right after it.
		let mut pos: Vec<u8> = Vec::new();

		// The stop flag is tested before every entry (rather than at the end
		// of the body) so that the `continue` taken for already-deleted
		// entries cannot bypass it.
		while !*must_exit.borrow() {
			let (item_key, item_bytes) = match self.get_next_version_after(&pos)? {
				Some(item) => item,
				None => break,
			};
			pos = item_key;

			let version = rmp_serde::decode::from_read_ref::<_, Version>(&item_bytes)?;
			if version.deleted.get() {
				continue;
			}
			let object = self
				.garage
				.object_table
				.get(&version.bucket_id, &version.key)
				.await?;
			let version_exists = match object {
				Some(o) => o
					.versions()
					.iter()
					.any(|x| x.uuid == version.uuid && x.state != ObjectVersionState::Aborted),
				None => false,
			};
			if !version_exists {
				info!("Repair versions: marking version as deleted: {:?}", version);
				self.garage
					.version_table
					.insert(&Version::new(
						version.uuid,
						version.bucket_id,
						version.key,
						true,
					))
					.await?;
			}
		}
		Ok(())
	}

	/// Returns the first entry yielded by a range scan of the version table's
	/// store that starts strictly after key `pos`, as owned `(key, value)`
	/// byte vectors, or `None` when the scan yields nothing.
	fn get_next_version_after(&self, pos: &[u8]) -> Result<Option<(Vec<u8>, Vec<u8>)>, Error> {
		match self
			.garage
			.version_table
			.data
			.store
			.range::<&[u8], _>((Bound::Excluded(pos), Bound::Unbounded))?
			.next()
		{
			None => Ok(None),
			Some(item) => {
				let (item_key, item_bytes) = item?;
				Ok(Some((item_key.into_owned(), item_bytes.into_owned())))
			}
		}
	}

	/// Scans the block-ref table's store and marks dangling references as
	/// deleted.
	///
	/// Each entry that is not already flagged deleted is checked against the
	/// version table: if the referenced version is missing or is itself
	/// flagged deleted, a `BlockRef` with the same block and version and
	/// `deleted` set to true is inserted.
	///
	/// The scan stops once the store is exhausted or `must_exit` holds `true`.
	/// Decoding, lookup and insertion errors abort the scan and are returned.
	async fn repair_block_ref(&self, must_exit: &watch::Receiver<bool>) -> Result<(), Error> {
		// Key of the last entry visited; the next lookup resumes right after it.
		let mut pos: Vec<u8> = Vec::new();

		// The stop flag is tested before every entry (rather than at the end
		// of the body) so that the `continue` taken for already-deleted
		// entries cannot bypass it.
		while !*must_exit.borrow() {
			let (item_key, item_bytes) = match self.get_next_block_ref_after(&pos)? {
				Some(item) => item,
				None => break,
			};
			pos = item_key;

			let block_ref = rmp_serde::decode::from_read_ref::<_, BlockRef>(&item_bytes)?;
			if block_ref.deleted.get() {
				continue;
			}
			let version = self
				.garage
				.version_table
				.get(&block_ref.version, &EmptyKey)
				.await?;
			// The version might not exist if it has been GC'ed
			let ref_exists = version.map(|v| !v.deleted.get()).unwrap_or(false);
			if !ref_exists {
				info!(
					"Repair block ref: marking block_ref as deleted: {:?}",
					block_ref
				);
				self.garage
					.block_ref_table
					.insert(&BlockRef {
						block: block_ref.block,
						version: block_ref.version,
						deleted: true.into(),
					})
					.await?;
			}
		}
		Ok(())
	}

	/// Returns the first entry yielded by a range scan of the block-ref
	/// table's store that starts strictly after key `pos`, as owned
	/// `(key, value)` byte vectors, or `None` when the scan yields nothing.
	fn get_next_block_ref_after(&self, pos: &[u8]) -> Result<Option<(Vec<u8>, Vec<u8>)>, Error> {
		match self
			.garage
			.block_ref_table
			.data
			.store
			.range::<&[u8], _>((Bound::Excluded(pos), Bound::Unbounded))?
			.next()
		{
			None => Ok(None),
			Some(item) => {
				let (item_key, item_bytes) = item?;
				Ok(Some((item_key.into_owned(), item_bytes.into_owned())))
			}
		}
	}
}