use std::str::FromStr; use std::sync::Arc; use garage_net::NetworkKey; use garage_db as db; use garage_util::background::*; use garage_util::config::*; use garage_util::error::*; use garage_util::persister::PersisterShared; use garage_rpc::replication_mode::*; use garage_rpc::system::System; use garage_block::manager::*; use garage_table::replication::TableFullReplication; use garage_table::replication::TableShardedReplication; use garage_table::*; use crate::s3::block_ref_table::*; use crate::s3::lifecycle_worker; use crate::s3::mpu_table::*; use crate::s3::object_table::*; use crate::s3::version_table::*; use crate::bucket_alias_table::*; use crate::bucket_table::*; use crate::helper; use crate::index_counter::*; use crate::key_table::*; #[cfg(feature = "k2v")] use crate::k2v::{item_table::*, rpc::*, sub::*}; /// An entire Garage full of data pub struct Garage { /// The parsed configuration Garage is running pub config: Config, /// The set of background variables that can be viewed/modified at runtime pub bg_vars: vars::BgVars, /// The replication factor of this cluster pub replication_factor: ReplicationFactor, /// The local database pub db: db::Db, /// The membership manager pub system: Arc, /// The block manager pub block_manager: Arc, /// Table containing buckets pub bucket_table: Arc>, /// Table containing bucket aliases pub bucket_alias_table: Arc>, /// Table containing api keys pub key_table: Arc>, /// Lock to prevent concurrent modification of buckets and access keys bucket_lock: tokio::sync::Mutex<()>, /// Table containing S3 objects pub object_table: Arc>, /// Counting table containing object counters pub object_counter_table: Arc>, /// Table containing S3 multipart uploads pub mpu_table: Arc>, /// Counting table containing multipart object counters pub mpu_counter_table: Arc>, /// Table containing S3 object versions pub version_table: Arc>, /// Table containing S3 block references (not blocks themselves) pub block_ref_table: Arc>, /// Persister for lifecycle worker info pub lifecycle_persister: PersisterShared, #[cfg(feature = "k2v")] pub k2v: GarageK2V, } #[cfg(feature = "k2v")] pub struct GarageK2V { /// Table containing K2V items pub item_table: Arc>, /// Indexing table containing K2V item counters pub counter_table: Arc>, /// K2V RPC handler pub rpc: Arc, } impl Garage { /// Create and run garage pub fn new(config: Config) -> Result, Error> { // Create meta dir and data dir if they don't exist already std::fs::create_dir_all(&config.metadata_dir) .ok_or_message("Unable to create Garage metadata directory")?; match &config.data_dir { DataDirEnum::Single(data_dir) => { std::fs::create_dir_all(data_dir).ok_or_message(format!( "Unable to create Garage data directory: {}", data_dir.to_string_lossy() ))?; } DataDirEnum::Multiple(data_dirs) => { for dir in data_dirs { std::fs::create_dir_all(&dir.path).ok_or_message(format!( "Unable to create Garage data directory: {}", dir.path.to_string_lossy() ))?; } } } info!("Opening database..."); let db_engine = db::Engine::from_str(&config.db_engine) .ok_or_message("Invalid `db_engine` value in configuration file")?; let mut db_path = config.metadata_dir.clone(); match db_engine { db::Engine::Sqlite => { db_path.push("db.sqlite"); } db::Engine::Lmdb => { db_path.push("db.lmdb"); } } let db_opt = db::OpenOpt { fsync: config.metadata_fsync, lmdb_map_size: match config.lmdb_map_size { v if v == usize::default() => None, v => Some(v), }, }; let db = db::open_db(&db_path, db_engine, &db_opt) .ok_or_message("Unable to open metadata db")?; info!("Initializing RPC..."); let network_key = hex::decode(config.rpc_secret.as_ref().ok_or_message( "rpc_secret value is missing, not present in config file or in environment", )?) .ok() .and_then(|x| NetworkKey::from_slice(&x)) .ok_or_message("Invalid RPC secret key: expected 32 bytes of random hex, please check the documentation for requirements")?; let (replication_factor, consistency_mode) = parse_replication_mode(&config)?; info!("Initialize background variable system..."); let mut bg_vars = vars::BgVars::new(); info!("Initialize membership management system..."); let system = System::new(network_key, replication_factor, consistency_mode, &config)?; let data_rep_param = TableShardedReplication { system: system.clone(), replication_factor: replication_factor.into(), write_quorum: replication_factor.write_quorum(consistency_mode), read_quorum: 1, }; let meta_rep_param = TableShardedReplication { system: system.clone(), replication_factor: replication_factor.into(), write_quorum: replication_factor.write_quorum(consistency_mode), read_quorum: replication_factor.read_quorum(consistency_mode), }; let control_rep_param = TableFullReplication { system: system.clone(), }; info!("Initialize block manager..."); let block_manager = BlockManager::new(&db, &config, data_rep_param, system.clone())?; block_manager.register_bg_vars(&mut bg_vars); // ---- admin tables ---- info!("Initialize bucket_table..."); let bucket_table = Table::new(BucketTable, control_rep_param.clone(), system.clone(), &db); info!("Initialize bucket_alias_table..."); let bucket_alias_table = Table::new( BucketAliasTable, control_rep_param.clone(), system.clone(), &db, ); info!("Initialize key_table_table..."); let key_table = Table::new(KeyTable, control_rep_param, system.clone(), &db); // ---- S3 tables ---- info!("Initialize block_ref_table..."); let block_ref_table = Table::new( BlockRefTable { block_manager: block_manager.clone(), }, meta_rep_param.clone(), system.clone(), &db, ); info!("Initialize version_table..."); let version_table = Table::new( VersionTable { block_ref_table: block_ref_table.clone(), }, meta_rep_param.clone(), system.clone(), &db, ); info!("Initialize multipart upload counter table..."); let mpu_counter_table = IndexCounter::new(system.clone(), meta_rep_param.clone(), &db); info!("Initialize multipart upload table..."); let mpu_table = Table::new( MultipartUploadTable { version_table: version_table.clone(), mpu_counter_table: mpu_counter_table.clone(), }, meta_rep_param.clone(), system.clone(), &db, ); info!("Initialize object counter table..."); let object_counter_table = IndexCounter::new(system.clone(), meta_rep_param.clone(), &db); info!("Initialize object_table..."); #[allow(clippy::redundant_clone)] let object_table = Table::new( ObjectTable { version_table: version_table.clone(), mpu_table: mpu_table.clone(), object_counter_table: object_counter_table.clone(), }, meta_rep_param.clone(), system.clone(), &db, ); info!("Load lifecycle worker state..."); let lifecycle_persister = PersisterShared::new(&system.metadata_dir, "lifecycle_worker_state"); lifecycle_worker::register_bg_vars(&lifecycle_persister, &mut bg_vars); // ---- K2V ---- #[cfg(feature = "k2v")] let k2v = GarageK2V::new(system.clone(), &db, meta_rep_param); // ---- setup block refcount recalculation ---- // this function can be used to fix inconsistencies in the RC table block_manager.set_recalc_rc(vec![ block_ref_recount_fn(&block_ref_table), // other functions could be added here if we had other tables // that hold references to data blocks ]); // -- done -- Ok(Arc::new(Self { config, bg_vars, replication_factor, db, system, block_manager, bucket_table, bucket_alias_table, key_table, bucket_lock: tokio::sync::Mutex::new(()), object_table, object_counter_table, mpu_table, mpu_counter_table, version_table, block_ref_table, lifecycle_persister, #[cfg(feature = "k2v")] k2v, })) } pub fn spawn_workers(self: &Arc, bg: &BackgroundRunner) -> Result<(), Error> { self.block_manager.spawn_workers(bg); self.bucket_table.spawn_workers(bg); self.bucket_alias_table.spawn_workers(bg); self.key_table.spawn_workers(bg); self.object_table.spawn_workers(bg); self.object_counter_table.spawn_workers(bg); self.mpu_table.spawn_workers(bg); self.mpu_counter_table.spawn_workers(bg); self.version_table.spawn_workers(bg); self.block_ref_table.spawn_workers(bg); bg.spawn_worker(lifecycle_worker::LifecycleWorker::new( self.clone(), self.lifecycle_persister.clone(), )); #[cfg(feature = "k2v")] self.k2v.spawn_workers(bg); if let Some(itv) = self.config.metadata_auto_snapshot_interval.as_deref() { let interval = parse_duration::parse(itv) .ok_or_message("Invalid `metadata_auto_snapshot_interval`")?; if interval < std::time::Duration::from_secs(600) { return Err(Error::Message( "metadata_auto_snapshot_interval too small or negative".into(), )); } bg.spawn_worker(crate::snapshot::AutoSnapshotWorker::new( self.clone(), interval, )); } Ok(()) } pub fn bucket_helper(&self) -> helper::bucket::BucketHelper { helper::bucket::BucketHelper(self) } pub fn key_helper(&self) -> helper::key::KeyHelper { helper::key::KeyHelper(self) } pub async fn locked_helper(&self) -> helper::locked::LockedHelper { let lock = self.bucket_lock.lock().await; helper::locked::LockedHelper(self, lock) } } #[cfg(feature = "k2v")] impl GarageK2V { fn new(system: Arc, db: &db::Db, meta_rep_param: TableShardedReplication) -> Self { info!("Initialize K2V counter table..."); let counter_table = IndexCounter::new(system.clone(), meta_rep_param.clone(), db); info!("Initialize K2V subscription manager..."); let subscriptions = Arc::new(SubscriptionManager::new()); info!("Initialize K2V item table..."); let item_table = Table::new( K2VItemTable { counter_table: counter_table.clone(), subscriptions: subscriptions.clone(), }, meta_rep_param, system.clone(), db, ); info!("Initialize K2V RPC handler..."); let rpc = K2VRpcHandler::new(system, db, item_table.clone(), subscriptions); Self { item_table, counter_table, rpc, } } pub fn spawn_workers(&self, bg: &BackgroundRunner) { self.item_table.spawn_workers(bg); self.counter_table.spawn_workers(bg); } }