LCOV - code coverage report
Current view: top level - control_plane/src - local_env.rs (source / functions) Coverage Total Hit
Test: b4ae4c4857f9ef3e144e982a35ee23bc84c71983.info Lines: 0.0 % 493 0
Test Date: 2024-10-22 22:13:45 Functions: 0.0 % 183 0

            Line data    Source code
       1              : //! This module is responsible for locating and loading paths in a local setup.
       2              : //!
       3              : //! It also provides an `init` method that acts as a stub for a proper installation
       4              : //! script, which will use local paths.
       5              : 
       6              : use anyhow::{bail, Context};
       7              : 
       8              : use clap::ValueEnum;
       9              : use postgres_backend::AuthType;
      10              : use reqwest::Url;
      11              : use serde::{Deserialize, Serialize};
      12              : use std::collections::HashMap;
      13              : use std::env;
      14              : use std::fs;
      15              : use std::net::IpAddr;
      16              : use std::net::Ipv4Addr;
      17              : use std::net::SocketAddr;
      18              : use std::path::{Path, PathBuf};
      19              : use std::process::{Command, Stdio};
      20              : use std::time::Duration;
      21              : use utils::{
      22              :     auth::{encode_from_key_file, Claims},
      23              :     id::{NodeId, TenantId, TenantTimelineId, TimelineId},
      24              : };
      25              : 
      26              : use crate::pageserver::PageServerNode;
      27              : use crate::pageserver::PAGESERVER_REMOTE_STORAGE_DIR;
      28              : use crate::safekeeper::SafekeeperNode;
      29              : 
      30              : pub const DEFAULT_PG_VERSION: u32 = 16;
      31              : 
      32              : //
      33              : // This data structure represents the neon_local CLI config.
      34              : //
      35              : // It is deserialized from the .neon/config file, or the config file passed
      36              : // to 'neon_local init --config=<path>' option. See control_plane/simple.conf for
      37              : // an example.
      38              : //
      39              : #[derive(PartialEq, Eq, Clone, Debug)]
      40              : pub struct LocalEnv {
      41              :     // Base directory for all the nodes (the pageserver, safekeepers and
      42              :     // compute endpoints).
      43              :     //
      44              :     // This is not stored in the config file. Rather, this is the path where the
      45              :     // config file itself is. It is read from the NEON_REPO_DIR env variable which
      46              :     // must be an absolute path. If the env var is not set, $PWD/.neon is used.
      47              :     pub base_data_dir: PathBuf,
      48              : 
      49              :     // Path to postgres distribution. It's expected that "bin", "include",
      50              :     // "lib", "share" from postgres distribution are there. If at some point
      51              :     // in time we will be able to run against vanilla postgres we may split that
      52              :     // to four separate paths and match OS-specific installation layout.
      53              :     pub pg_distrib_dir: PathBuf,
      54              : 
      55              :     // Path to pageserver binary.
      56              :     pub neon_distrib_dir: PathBuf,
      57              : 
      58              :     // Default tenant ID to use with the 'neon_local' command line utility, when
      59              :     // --tenant_id is not explicitly specified.
      60              :     pub default_tenant_id: Option<TenantId>,
      61              : 
      62              :     // used to issue tokens during e.g pg start
      63              :     pub private_key_path: PathBuf,
      64              : 
      65              :     pub broker: NeonBroker,
      66              : 
      67              :     // Configuration for the storage controller (1 per neon_local environment)
      68              :     pub storage_controller: NeonStorageControllerConf,
      69              : 
      70              :     /// This Vec must always contain at least one pageserver
      71              :     /// Populdated by [`Self::load_config`] from the individual `pageserver.toml`s.
      72              :     /// NB: not used anymore except for informing users that they need to change their `.neon/config`.
      73              :     pub pageservers: Vec<PageServerConf>,
      74              : 
      75              :     pub safekeepers: Vec<SafekeeperConf>,
      76              : 
      77              :     // Control plane upcall API for pageserver: if None, we will not run storage_controller  If set, this will
      78              :     // be propagated into each pageserver's configuration.
      79              :     pub control_plane_api: Option<Url>,
      80              : 
      81              :     // Control plane upcall API for storage controller.  If set, this will be propagated into the
      82              :     // storage controller's configuration.
      83              :     pub control_plane_compute_hook_api: Option<Url>,
      84              : 
      85              :     /// Keep human-readable aliases in memory (and persist them to config), to hide ZId hex strings from the user.
      86              :     // A `HashMap<String, HashMap<TenantId, TimelineId>>` would be more appropriate here,
      87              :     // but deserialization into a generic toml object as `toml::Value::try_from` fails with an error.
      88              :     // https://toml.io/en/v1.0.0 does not contain a concept of "a table inside another table".
      89              :     pub branch_name_mappings: HashMap<String, Vec<(TenantId, TimelineId)>>,
      90              : }
      91              : 
      92              : /// On-disk state stored in `.neon/config`.
      93            0 : #[derive(PartialEq, Eq, Clone, Debug, Default, Serialize, Deserialize)]
      94              : #[serde(default, deny_unknown_fields)]
      95              : pub struct OnDiskConfig {
      96              :     pub pg_distrib_dir: PathBuf,
      97              :     pub neon_distrib_dir: PathBuf,
      98              :     pub default_tenant_id: Option<TenantId>,
      99              :     pub private_key_path: PathBuf,
     100              :     pub broker: NeonBroker,
     101              :     pub storage_controller: NeonStorageControllerConf,
     102              :     #[serde(
     103              :         skip_serializing,
     104              :         deserialize_with = "fail_if_pageservers_field_specified"
     105              :     )]
     106              :     pub pageservers: Vec<PageServerConf>,
     107              :     pub safekeepers: Vec<SafekeeperConf>,
     108              :     pub control_plane_api: Option<Url>,
     109              :     pub control_plane_compute_hook_api: Option<Url>,
     110              :     branch_name_mappings: HashMap<String, Vec<(TenantId, TimelineId)>>,
     111              : }
     112              : 
     113            0 : fn fail_if_pageservers_field_specified<'de, D>(_: D) -> Result<Vec<PageServerConf>, D::Error>
     114            0 : where
     115            0 :     D: serde::Deserializer<'de>,
     116            0 : {
     117            0 :     Err(serde::de::Error::custom(
     118            0 :         "The 'pageservers' field is no longer used; pageserver.toml is now authoritative; \
     119            0 :          Please remove the `pageservers` from your .neon/config.",
     120            0 :     ))
     121            0 : }
     122              : 
     123              : /// The description of the neon_local env to be initialized by `neon_local init --config`.
     124            0 : #[derive(Clone, Debug, Deserialize)]
     125              : #[serde(deny_unknown_fields)]
     126              : pub struct NeonLocalInitConf {
     127              :     // TODO: do we need this? Seems unused
     128              :     pub pg_distrib_dir: Option<PathBuf>,
     129              :     // TODO: do we need this? Seems unused
     130              :     pub neon_distrib_dir: Option<PathBuf>,
     131              :     pub default_tenant_id: TenantId,
     132              :     pub broker: NeonBroker,
     133              :     pub storage_controller: Option<NeonStorageControllerConf>,
     134              :     pub pageservers: Vec<NeonLocalInitPageserverConf>,
     135              :     pub safekeepers: Vec<SafekeeperConf>,
     136              :     pub control_plane_api: Option<Option<Url>>,
     137              :     pub control_plane_compute_hook_api: Option<Option<Url>>,
     138              : }
     139              : 
     140              : /// Broker config for cluster internal communication.
     141            0 : #[derive(Serialize, Deserialize, PartialEq, Eq, Clone, Debug)]
     142              : #[serde(default)]
     143              : pub struct NeonBroker {
     144              :     /// Broker listen address for storage nodes coordination, e.g. '127.0.0.1:50051'.
     145              :     pub listen_addr: SocketAddr,
     146              : }
     147              : 
     148              : /// Broker config for cluster internal communication.
     149            0 : #[derive(Serialize, Deserialize, PartialEq, Eq, Clone, Debug)]
     150              : #[serde(default)]
     151              : pub struct NeonStorageControllerConf {
     152              :     /// Heartbeat timeout before marking a node offline
     153              :     #[serde(with = "humantime_serde")]
     154              :     pub max_offline: Duration,
     155              : 
     156              :     #[serde(with = "humantime_serde")]
     157              :     pub max_warming_up: Duration,
     158              : 
     159              :     pub start_as_candidate: bool,
     160              : 
     161              :     /// Database url used when running multiple storage controller instances
     162              :     pub database_url: Option<SocketAddr>,
     163              : 
     164              :     /// Threshold for auto-splitting a tenant into shards
     165              :     pub split_threshold: Option<u64>,
     166              : 
     167              :     pub max_secondary_lag_bytes: Option<u64>,
     168              : 
     169              :     #[serde(with = "humantime_serde")]
     170              :     pub heartbeat_interval: Duration,
     171              : 
     172              :     #[serde(with = "humantime_serde")]
     173              :     pub long_reconcile_threshold: Option<Duration>,
     174              : }
     175              : 
     176              : impl NeonStorageControllerConf {
     177              :     // Use a shorter pageserver unavailability interval than the default to speed up tests.
     178              :     const DEFAULT_MAX_OFFLINE_INTERVAL: std::time::Duration = std::time::Duration::from_secs(10);
     179              : 
     180              :     const DEFAULT_MAX_WARMING_UP_INTERVAL: std::time::Duration = std::time::Duration::from_secs(30);
     181              : 
     182              :     // Very tight heartbeat interval to speed up tests
     183              :     const DEFAULT_HEARTBEAT_INTERVAL: std::time::Duration = std::time::Duration::from_millis(100);
     184              : }
     185              : 
     186              : impl Default for NeonStorageControllerConf {
     187            0 :     fn default() -> Self {
     188            0 :         Self {
     189            0 :             max_offline: Self::DEFAULT_MAX_OFFLINE_INTERVAL,
     190            0 :             max_warming_up: Self::DEFAULT_MAX_WARMING_UP_INTERVAL,
     191            0 :             start_as_candidate: false,
     192            0 :             database_url: None,
     193            0 :             split_threshold: None,
     194            0 :             max_secondary_lag_bytes: None,
     195            0 :             heartbeat_interval: Self::DEFAULT_HEARTBEAT_INTERVAL,
     196            0 :             long_reconcile_threshold: None,
     197            0 :         }
     198            0 :     }
     199              : }
     200              : 
     201              : // Dummy Default impl to satisfy Deserialize derive.
     202              : impl Default for NeonBroker {
     203            0 :     fn default() -> Self {
     204            0 :         NeonBroker {
     205            0 :             listen_addr: SocketAddr::new(IpAddr::V4(Ipv4Addr::new(0, 0, 0, 0)), 0),
     206            0 :         }
     207            0 :     }
     208              : }
     209              : 
     210              : impl NeonBroker {
     211            0 :     pub fn client_url(&self) -> Url {
     212            0 :         Url::parse(&format!("http://{}", self.listen_addr)).expect("failed to construct url")
     213            0 :     }
     214              : }
     215              : 
     216              : // neon_local needs to know this subset of pageserver configuration.
     217              : // For legacy reasons, this information is duplicated from `pageserver.toml` into `.neon/config`.
     218              : // It can get stale if `pageserver.toml` is changed.
     219              : // TODO(christian): don't store this at all in `.neon/config`, always load it from `pageserver.toml`
     220            0 : #[derive(Serialize, Deserialize, PartialEq, Eq, Clone, Debug)]
     221              : #[serde(default, deny_unknown_fields)]
     222              : pub struct PageServerConf {
     223              :     pub id: NodeId,
     224              :     pub listen_pg_addr: String,
     225              :     pub listen_http_addr: String,
     226              :     pub pg_auth_type: AuthType,
     227              :     pub http_auth_type: AuthType,
     228              : }
     229              : 
     230              : impl Default for PageServerConf {
     231            0 :     fn default() -> Self {
     232            0 :         Self {
     233            0 :             id: NodeId(0),
     234            0 :             listen_pg_addr: String::new(),
     235            0 :             listen_http_addr: String::new(),
     236            0 :             pg_auth_type: AuthType::Trust,
     237            0 :             http_auth_type: AuthType::Trust,
     238            0 :         }
     239            0 :     }
     240              : }
     241              : 
     242              : /// The toml that can be passed to `neon_local init --config`.
     243              : /// This is a subset of the `pageserver.toml` configuration.
     244              : // TODO(christian): use pageserver_api::config::ConfigToml (PR #7656)
     245            0 : #[derive(Clone, Debug, serde::Deserialize, serde::Serialize)]
     246              : pub struct NeonLocalInitPageserverConf {
     247              :     pub id: NodeId,
     248              :     pub listen_pg_addr: String,
     249              :     pub listen_http_addr: String,
     250              :     pub pg_auth_type: AuthType,
     251              :     pub http_auth_type: AuthType,
     252              :     #[serde(flatten)]
     253              :     pub other: HashMap<String, toml::Value>,
     254              : }
     255              : 
     256              : impl From<&NeonLocalInitPageserverConf> for PageServerConf {
     257            0 :     fn from(conf: &NeonLocalInitPageserverConf) -> Self {
     258            0 :         let NeonLocalInitPageserverConf {
     259            0 :             id,
     260            0 :             listen_pg_addr,
     261            0 :             listen_http_addr,
     262            0 :             pg_auth_type,
     263            0 :             http_auth_type,
     264            0 :             other: _,
     265            0 :         } = conf;
     266            0 :         Self {
     267            0 :             id: *id,
     268            0 :             listen_pg_addr: listen_pg_addr.clone(),
     269            0 :             listen_http_addr: listen_http_addr.clone(),
     270            0 :             pg_auth_type: *pg_auth_type,
     271            0 :             http_auth_type: *http_auth_type,
     272            0 :         }
     273            0 :     }
     274              : }
     275              : 
     276            0 : #[derive(Serialize, Deserialize, PartialEq, Eq, Clone, Debug)]
     277              : #[serde(default)]
     278              : pub struct SafekeeperConf {
     279              :     pub id: NodeId,
     280              :     pub pg_port: u16,
     281              :     pub pg_tenant_only_port: Option<u16>,
     282              :     pub http_port: u16,
     283              :     pub sync: bool,
     284              :     pub remote_storage: Option<String>,
     285              :     pub backup_threads: Option<u32>,
     286              :     pub auth_enabled: bool,
     287              :     pub listen_addr: Option<String>,
     288              : }
     289              : 
     290              : impl Default for SafekeeperConf {
     291            0 :     fn default() -> Self {
     292            0 :         Self {
     293            0 :             id: NodeId(0),
     294            0 :             pg_port: 0,
     295            0 :             pg_tenant_only_port: None,
     296            0 :             http_port: 0,
     297            0 :             sync: true,
     298            0 :             remote_storage: None,
     299            0 :             backup_threads: None,
     300            0 :             auth_enabled: false,
     301            0 :             listen_addr: None,
     302            0 :         }
     303            0 :     }
     304              : }
     305              : 
     306              : #[derive(Clone, Copy)]
     307              : pub enum InitForceMode {
     308              :     MustNotExist,
     309              :     EmptyDirOk,
     310              :     RemoveAllContents,
     311              : }
     312              : 
     313              : impl ValueEnum for InitForceMode {
     314            0 :     fn value_variants<'a>() -> &'a [Self] {
     315            0 :         &[
     316            0 :             Self::MustNotExist,
     317            0 :             Self::EmptyDirOk,
     318            0 :             Self::RemoveAllContents,
     319            0 :         ]
     320            0 :     }
     321              : 
     322            0 :     fn to_possible_value(&self) -> Option<clap::builder::PossibleValue> {
     323            0 :         Some(clap::builder::PossibleValue::new(match self {
     324            0 :             InitForceMode::MustNotExist => "must-not-exist",
     325            0 :             InitForceMode::EmptyDirOk => "empty-dir-ok",
     326            0 :             InitForceMode::RemoveAllContents => "remove-all-contents",
     327              :         }))
     328            0 :     }
     329              : }
     330              : 
     331              : impl SafekeeperConf {
     332              :     /// Compute is served by port on which only tenant scoped tokens allowed, if
     333              :     /// it is configured.
     334            0 :     pub fn get_compute_port(&self) -> u16 {
     335            0 :         self.pg_tenant_only_port.unwrap_or(self.pg_port)
     336            0 :     }
     337              : }
     338              : 
     339              : impl LocalEnv {
     340            0 :     pub fn pg_distrib_dir_raw(&self) -> PathBuf {
     341            0 :         self.pg_distrib_dir.clone()
     342            0 :     }
     343              : 
     344            0 :     pub fn pg_distrib_dir(&self, pg_version: u32) -> anyhow::Result<PathBuf> {
     345            0 :         let path = self.pg_distrib_dir.clone();
     346            0 : 
     347            0 :         #[allow(clippy::manual_range_patterns)]
     348            0 :         match pg_version {
     349            0 :             14 | 15 | 16 | 17 => Ok(path.join(format!("v{pg_version}"))),
     350            0 :             _ => bail!("Unsupported postgres version: {}", pg_version),
     351              :         }
     352            0 :     }
     353              : 
     354            0 :     pub fn pg_dir(&self, pg_version: u32, dir_name: &str) -> anyhow::Result<PathBuf> {
     355            0 :         Ok(self.pg_distrib_dir(pg_version)?.join(dir_name))
     356            0 :     }
     357              : 
     358            0 :     pub fn pg_bin_dir(&self, pg_version: u32) -> anyhow::Result<PathBuf> {
     359            0 :         self.pg_dir(pg_version, "bin")
     360            0 :     }
     361              : 
     362            0 :     pub fn pg_lib_dir(&self, pg_version: u32) -> anyhow::Result<PathBuf> {
     363            0 :         self.pg_dir(pg_version, "lib")
     364            0 :     }
     365              : 
     366            0 :     pub fn pageserver_bin(&self) -> PathBuf {
     367            0 :         self.neon_distrib_dir.join("pageserver")
     368            0 :     }
     369              : 
     370            0 :     pub fn storage_controller_bin(&self) -> PathBuf {
     371            0 :         // Irrespective of configuration, storage controller binary is always
     372            0 :         // run from the same location as neon_local.  This means that for compatibility
     373            0 :         // tests that run old pageserver/safekeeper, they still run latest storage controller.
     374            0 :         let neon_local_bin_dir = env::current_exe().unwrap().parent().unwrap().to_owned();
     375            0 :         neon_local_bin_dir.join("storage_controller")
     376            0 :     }
     377              : 
     378            0 :     pub fn safekeeper_bin(&self) -> PathBuf {
     379            0 :         self.neon_distrib_dir.join("safekeeper")
     380            0 :     }
     381              : 
     382            0 :     pub fn storage_broker_bin(&self) -> PathBuf {
     383            0 :         self.neon_distrib_dir.join("storage_broker")
     384            0 :     }
     385              : 
     386            0 :     pub fn endpoints_path(&self) -> PathBuf {
     387            0 :         self.base_data_dir.join("endpoints")
     388            0 :     }
     389              : 
     390            0 :     pub fn pageserver_data_dir(&self, pageserver_id: NodeId) -> PathBuf {
     391            0 :         self.base_data_dir
     392            0 :             .join(format!("pageserver_{pageserver_id}"))
     393            0 :     }
     394              : 
     395            0 :     pub fn safekeeper_data_dir(&self, data_dir_name: &str) -> PathBuf {
     396            0 :         self.base_data_dir.join("safekeepers").join(data_dir_name)
     397            0 :     }
     398              : 
     399            0 :     pub fn get_pageserver_conf(&self, id: NodeId) -> anyhow::Result<&PageServerConf> {
     400            0 :         if let Some(conf) = self.pageservers.iter().find(|node| node.id == id) {
     401            0 :             Ok(conf)
     402              :         } else {
     403            0 :             let have_ids = self
     404            0 :                 .pageservers
     405            0 :                 .iter()
     406            0 :                 .map(|node| format!("{}:{}", node.id, node.listen_http_addr))
     407            0 :                 .collect::<Vec<_>>();
     408            0 :             let joined = have_ids.join(",");
     409            0 :             bail!("could not find pageserver {id}, have ids {joined}")
     410              :         }
     411            0 :     }
     412              : 
     413              :     /// Inspect the base data directory and extract the instance id and instance directory path
     414              :     /// for all storage controller instances
     415            0 :     pub async fn storage_controller_instances(&self) -> std::io::Result<Vec<(u8, PathBuf)>> {
     416            0 :         let mut instances = Vec::default();
     417              : 
     418            0 :         let dir = std::fs::read_dir(self.base_data_dir.clone())?;
     419            0 :         for dentry in dir {
     420            0 :             let dentry = dentry?;
     421            0 :             let is_dir = dentry.metadata()?.is_dir();
     422            0 :             let filename = dentry.file_name().into_string().unwrap();
     423            0 :             let parsed_instance_id = match filename.strip_prefix("storage_controller_") {
     424            0 :                 Some(suffix) => suffix.parse::<u8>().ok(),
     425            0 :                 None => None,
     426              :             };
     427              : 
     428            0 :             let is_instance_dir = is_dir && parsed_instance_id.is_some();
     429              : 
     430            0 :             if !is_instance_dir {
     431            0 :                 continue;
     432            0 :             }
     433            0 : 
     434            0 :             instances.push((
     435            0 :                 parsed_instance_id.expect("Checked previously"),
     436            0 :                 dentry.path(),
     437            0 :             ));
     438              :         }
     439              : 
     440            0 :         Ok(instances)
     441            0 :     }
     442              : 
     443            0 :     pub fn register_branch_mapping(
     444            0 :         &mut self,
     445            0 :         branch_name: String,
     446            0 :         tenant_id: TenantId,
     447            0 :         timeline_id: TimelineId,
     448            0 :     ) -> anyhow::Result<()> {
     449            0 :         let existing_values = self
     450            0 :             .branch_name_mappings
     451            0 :             .entry(branch_name.clone())
     452            0 :             .or_default();
     453            0 : 
     454            0 :         let existing_ids = existing_values
     455            0 :             .iter()
     456            0 :             .find(|(existing_tenant_id, _)| existing_tenant_id == &tenant_id);
     457              : 
     458            0 :         if let Some((_, old_timeline_id)) = existing_ids {
     459            0 :             if old_timeline_id == &timeline_id {
     460            0 :                 Ok(())
     461              :             } else {
     462            0 :                 bail!("branch '{branch_name}' is already mapped to timeline {old_timeline_id}, cannot map to another timeline {timeline_id}");
     463              :             }
     464              :         } else {
     465            0 :             existing_values.push((tenant_id, timeline_id));
     466            0 :             Ok(())
     467              :         }
     468            0 :     }
     469              : 
     470            0 :     pub fn get_branch_timeline_id(
     471            0 :         &self,
     472            0 :         branch_name: &str,
     473            0 :         tenant_id: TenantId,
     474            0 :     ) -> Option<TimelineId> {
     475            0 :         self.branch_name_mappings
     476            0 :             .get(branch_name)?
     477            0 :             .iter()
     478            0 :             .find(|(mapped_tenant_id, _)| mapped_tenant_id == &tenant_id)
     479            0 :             .map(|&(_, timeline_id)| timeline_id)
     480            0 :             .map(TimelineId::from)
     481            0 :     }
     482              : 
     483            0 :     pub fn timeline_name_mappings(&self) -> HashMap<TenantTimelineId, String> {
     484            0 :         self.branch_name_mappings
     485            0 :             .iter()
     486            0 :             .flat_map(|(name, tenant_timelines)| {
     487            0 :                 tenant_timelines.iter().map(|&(tenant_id, timeline_id)| {
     488            0 :                     (TenantTimelineId::new(tenant_id, timeline_id), name.clone())
     489            0 :                 })
     490            0 :             })
     491            0 :             .collect()
     492            0 :     }
     493              : 
     494              :     ///  Construct `Self` from on-disk state.
     495            0 :     pub fn load_config(repopath: &Path) -> anyhow::Result<Self> {
     496            0 :         if !repopath.exists() {
     497            0 :             bail!(
     498            0 :                 "Neon config is not found in {}. You need to run 'neon_local init' first",
     499            0 :                 repopath.to_str().unwrap()
     500            0 :             );
     501            0 :         }
     502              : 
     503              :         // TODO: check that it looks like a neon repository
     504              : 
     505              :         // load and parse file
     506            0 :         let config_file_contents = fs::read_to_string(repopath.join("config"))?;
     507            0 :         let on_disk_config: OnDiskConfig = toml::from_str(config_file_contents.as_str())?;
     508            0 :         let mut env = {
     509            0 :             let OnDiskConfig {
     510            0 :                 pg_distrib_dir,
     511            0 :                 neon_distrib_dir,
     512            0 :                 default_tenant_id,
     513            0 :                 private_key_path,
     514            0 :                 broker,
     515            0 :                 storage_controller,
     516            0 :                 pageservers,
     517            0 :                 safekeepers,
     518            0 :                 control_plane_api,
     519            0 :                 control_plane_compute_hook_api,
     520            0 :                 branch_name_mappings,
     521            0 :             } = on_disk_config;
     522            0 :             LocalEnv {
     523            0 :                 base_data_dir: repopath.to_owned(),
     524            0 :                 pg_distrib_dir,
     525            0 :                 neon_distrib_dir,
     526            0 :                 default_tenant_id,
     527            0 :                 private_key_path,
     528            0 :                 broker,
     529            0 :                 storage_controller,
     530            0 :                 pageservers,
     531            0 :                 safekeepers,
     532            0 :                 control_plane_api,
     533            0 :                 control_plane_compute_hook_api,
     534            0 :                 branch_name_mappings,
     535            0 :             }
     536            0 :         };
     537            0 : 
     538            0 :         // The source of truth for pageserver configuration is the pageserver.toml.
     539            0 :         assert!(
     540            0 :             env.pageservers.is_empty(),
     541            0 :             "we ensure this during deserialization"
     542              :         );
     543            0 :         env.pageservers = {
     544            0 :             let iter = std::fs::read_dir(repopath).context("open dir")?;
     545            0 :             let mut pageservers = Vec::new();
     546            0 :             for res in iter {
     547            0 :                 let dentry = res?;
     548              :                 const PREFIX: &str = "pageserver_";
     549            0 :                 let dentry_name = dentry
     550            0 :                     .file_name()
     551            0 :                     .into_string()
     552            0 :                     .ok()
     553            0 :                     .with_context(|| format!("non-utf8 dentry: {:?}", dentry.path()))
     554            0 :                     .unwrap();
     555            0 :                 if !dentry_name.starts_with(PREFIX) {
     556            0 :                     continue;
     557            0 :                 }
     558            0 :                 if !dentry.file_type().context("determine file type")?.is_dir() {
     559            0 :                     anyhow::bail!("expected a directory, got {:?}", dentry.path());
     560            0 :                 }
     561            0 :                 let id = dentry_name[PREFIX.len()..]
     562            0 :                     .parse::<NodeId>()
     563            0 :                     .with_context(|| format!("parse id from {:?}", dentry.path()))?;
     564              :                 // TODO(christian): use pageserver_api::config::ConfigToml (PR #7656)
     565            0 :                 #[derive(serde::Serialize, serde::Deserialize)]
     566              :                 // (allow unknown fields, unlike PageServerConf)
     567              :                 struct PageserverConfigTomlSubset {
     568              :                     listen_pg_addr: String,
     569              :                     listen_http_addr: String,
     570              :                     pg_auth_type: AuthType,
     571              :                     http_auth_type: AuthType,
     572              :                 }
     573            0 :                 let config_toml_path = dentry.path().join("pageserver.toml");
     574            0 :                 let config_toml: PageserverConfigTomlSubset = toml_edit::de::from_str(
     575            0 :                     &std::fs::read_to_string(&config_toml_path)
     576            0 :                         .with_context(|| format!("read {:?}", config_toml_path))?,
     577              :                 )
     578            0 :                 .context("parse pageserver.toml")?;
     579            0 :                 let identity_toml_path = dentry.path().join("identity.toml");
     580            0 :                 #[derive(serde::Serialize, serde::Deserialize)]
     581              :                 struct IdentityTomlSubset {
     582              :                     id: NodeId,
     583              :                 }
     584            0 :                 let identity_toml: IdentityTomlSubset = toml_edit::de::from_str(
     585            0 :                     &std::fs::read_to_string(&identity_toml_path)
     586            0 :                         .with_context(|| format!("read {:?}", identity_toml_path))?,
     587              :                 )
     588            0 :                 .context("parse identity.toml")?;
     589              :                 let PageserverConfigTomlSubset {
     590            0 :                     listen_pg_addr,
     591            0 :                     listen_http_addr,
     592            0 :                     pg_auth_type,
     593            0 :                     http_auth_type,
     594            0 :                 } = config_toml;
     595            0 :                 let IdentityTomlSubset {
     596            0 :                     id: identity_toml_id,
     597            0 :                 } = identity_toml;
     598            0 :                 let conf = PageServerConf {
     599              :                     id: {
     600            0 :                         anyhow::ensure!(
     601            0 :                             identity_toml_id == id,
     602            0 :                             "id mismatch: identity.toml:id={identity_toml_id} pageserver_(.*) id={id}",
     603              :                         );
     604            0 :                         id
     605            0 :                     },
     606            0 :                     listen_pg_addr,
     607            0 :                     listen_http_addr,
     608            0 :                     pg_auth_type,
     609            0 :                     http_auth_type,
     610            0 :                 };
     611            0 :                 pageservers.push(conf);
     612              :             }
     613            0 :             pageservers
     614            0 :         };
     615            0 : 
     616            0 :         Ok(env)
     617            0 :     }
     618              : 
     619            0 :     pub fn persist_config(&self) -> anyhow::Result<()> {
     620            0 :         Self::persist_config_impl(
     621            0 :             &self.base_data_dir,
     622            0 :             &OnDiskConfig {
     623            0 :                 pg_distrib_dir: self.pg_distrib_dir.clone(),
     624            0 :                 neon_distrib_dir: self.neon_distrib_dir.clone(),
     625            0 :                 default_tenant_id: self.default_tenant_id,
     626            0 :                 private_key_path: self.private_key_path.clone(),
     627            0 :                 broker: self.broker.clone(),
     628            0 :                 storage_controller: self.storage_controller.clone(),
     629            0 :                 pageservers: vec![], // it's skip_serializing anyway
     630            0 :                 safekeepers: self.safekeepers.clone(),
     631            0 :                 control_plane_api: self.control_plane_api.clone(),
     632            0 :                 control_plane_compute_hook_api: self.control_plane_compute_hook_api.clone(),
     633            0 :                 branch_name_mappings: self.branch_name_mappings.clone(),
     634            0 :             },
     635            0 :         )
     636            0 :     }
     637              : 
     638            0 :     pub fn persist_config_impl(base_path: &Path, config: &OnDiskConfig) -> anyhow::Result<()> {
     639            0 :         let conf_content = &toml::to_string_pretty(config)?;
     640            0 :         let target_config_path = base_path.join("config");
     641            0 :         fs::write(&target_config_path, conf_content).with_context(|| {
     642            0 :             format!(
     643            0 :                 "Failed to write config file into path '{}'",
     644            0 :                 target_config_path.display()
     645            0 :             )
     646            0 :         })
     647            0 :     }
     648              : 
     649              :     // this function is used only for testing purposes in CLI e g generate tokens during init
     650            0 :     pub fn generate_auth_token(&self, claims: &Claims) -> anyhow::Result<String> {
     651            0 :         let private_key_path = self.get_private_key_path();
     652            0 :         let key_data = fs::read(private_key_path)?;
     653            0 :         encode_from_key_file(claims, &key_data)
     654            0 :     }
     655              : 
     656            0 :     pub fn get_private_key_path(&self) -> PathBuf {
     657            0 :         if self.private_key_path.is_absolute() {
     658            0 :             self.private_key_path.to_path_buf()
     659              :         } else {
     660            0 :             self.base_data_dir.join(&self.private_key_path)
     661              :         }
     662            0 :     }
     663              : 
     664              :     /// Materialize the [`NeonLocalInitConf`] to disk. Called during [`neon_local init`].
     665            0 :     pub fn init(conf: NeonLocalInitConf, force: &InitForceMode) -> anyhow::Result<()> {
     666            0 :         let base_path = base_path();
     667            0 :         assert_ne!(base_path, Path::new(""));
     668            0 :         let base_path = &base_path;
     669            0 : 
     670            0 :         // create base_path dir
     671            0 :         if base_path.exists() {
     672            0 :             match force {
     673              :                 InitForceMode::MustNotExist => {
     674            0 :                     bail!(
     675            0 :                         "directory '{}' already exists. Perhaps already initialized?",
     676            0 :                         base_path.display()
     677            0 :                     );
     678              :                 }
     679              :                 InitForceMode::EmptyDirOk => {
     680            0 :                     if let Some(res) = std::fs::read_dir(base_path)?.next() {
     681            0 :                         res.context("check if directory is empty")?;
     682            0 :                         anyhow::bail!("directory not empty: {base_path:?}");
     683            0 :                     }
     684              :                 }
     685              :                 InitForceMode::RemoveAllContents => {
     686            0 :                     println!("removing all contents of '{}'", base_path.display());
     687              :                     // instead of directly calling `remove_dir_all`, we keep the original dir but removing
     688              :                     // all contents inside. This helps if the developer symbol links another directory (i.e.,
     689              :                     // S3 local SSD) to the `.neon` base directory.
     690            0 :                     for entry in std::fs::read_dir(base_path)? {
     691            0 :                         let entry = entry?;
     692            0 :                         let path = entry.path();
     693            0 :                         if path.is_dir() {
     694            0 :                             fs::remove_dir_all(&path)?;
     695              :                         } else {
     696            0 :                             fs::remove_file(&path)?;
     697              :                         }
     698              :                     }
     699              :                 }
     700              :             }
     701            0 :         }
     702            0 :         if !base_path.exists() {
     703            0 :             fs::create_dir(base_path)?;
     704            0 :         }
     705              : 
     706              :         let NeonLocalInitConf {
     707            0 :             pg_distrib_dir,
     708            0 :             neon_distrib_dir,
     709            0 :             default_tenant_id,
     710            0 :             broker,
     711            0 :             storage_controller,
     712            0 :             pageservers,
     713            0 :             safekeepers,
     714            0 :             control_plane_api,
     715            0 :             control_plane_compute_hook_api,
     716            0 :         } = conf;
     717            0 : 
     718            0 :         // Find postgres binaries.
     719            0 :         // Follow POSTGRES_DISTRIB_DIR if set, otherwise look in "pg_install".
     720            0 :         // Note that later in the code we assume, that distrib dirs follow the same pattern
     721            0 :         // for all postgres versions.
     722            0 :         let pg_distrib_dir = pg_distrib_dir.unwrap_or_else(|| {
     723            0 :             if let Some(postgres_bin) = env::var_os("POSTGRES_DISTRIB_DIR") {
     724            0 :                 postgres_bin.into()
     725              :             } else {
     726            0 :                 let cwd = env::current_dir().unwrap();
     727            0 :                 cwd.join("pg_install")
     728              :             }
     729            0 :         });
     730            0 : 
     731            0 :         // Find neon binaries.
     732            0 :         let neon_distrib_dir = neon_distrib_dir
     733            0 :             .unwrap_or_else(|| env::current_exe().unwrap().parent().unwrap().to_owned());
     734            0 : 
     735            0 :         // Generate keypair for JWT.
     736            0 :         //
     737            0 :         // The keypair is only needed if authentication is enabled in any of the
     738            0 :         // components. For convenience, we generate the keypair even if authentication
     739            0 :         // is not enabled, so that you can easily enable it after the initialization
     740            0 :         // step.
     741            0 :         generate_auth_keys(
     742            0 :             base_path.join("auth_private_key.pem").as_path(),
     743            0 :             base_path.join("auth_public_key.pem").as_path(),
     744            0 :         )
     745            0 :         .context("generate auth keys")?;
     746            0 :         let private_key_path = PathBuf::from("auth_private_key.pem");
     747            0 : 
     748            0 :         // create the runtime type because the remaining initialization code below needs
     749            0 :         // a LocalEnv instance op operation
     750            0 :         // TODO: refactor to avoid this, LocalEnv should only be constructed from on-disk state
     751            0 :         let env = LocalEnv {
     752            0 :             base_data_dir: base_path.clone(),
     753            0 :             pg_distrib_dir,
     754            0 :             neon_distrib_dir,
     755            0 :             default_tenant_id: Some(default_tenant_id),
     756            0 :             private_key_path,
     757            0 :             broker,
     758            0 :             storage_controller: storage_controller.unwrap_or_default(),
     759            0 :             pageservers: pageservers.iter().map(Into::into).collect(),
     760            0 :             safekeepers,
     761            0 :             control_plane_api: control_plane_api.unwrap_or_default(),
     762            0 :             control_plane_compute_hook_api: control_plane_compute_hook_api.unwrap_or_default(),
     763            0 :             branch_name_mappings: Default::default(),
     764            0 :         };
     765            0 : 
     766            0 :         // create endpoints dir
     767            0 :         fs::create_dir_all(env.endpoints_path())?;
     768              : 
     769              :         // create safekeeper dirs
     770            0 :         for safekeeper in &env.safekeepers {
     771            0 :             fs::create_dir_all(SafekeeperNode::datadir_path_by_id(&env, safekeeper.id))?;
     772              :         }
     773              : 
     774              :         // initialize pageserver state
     775            0 :         for (i, ps) in pageservers.into_iter().enumerate() {
     776            0 :             let runtime_ps = &env.pageservers[i];
     777            0 :             assert_eq!(&PageServerConf::from(&ps), runtime_ps);
     778            0 :             fs::create_dir(env.pageserver_data_dir(ps.id))?;
     779            0 :             PageServerNode::from_env(&env, runtime_ps)
     780            0 :                 .initialize(ps)
     781            0 :                 .context("pageserver init failed")?;
     782              :         }
     783              : 
     784              :         // setup remote remote location for default LocalFs remote storage
     785            0 :         std::fs::create_dir_all(env.base_data_dir.join(PAGESERVER_REMOTE_STORAGE_DIR))?;
     786              : 
     787            0 :         env.persist_config()
     788            0 :     }
     789              : }
     790              : 
     791            0 : pub fn base_path() -> PathBuf {
     792            0 :     let path = match std::env::var_os("NEON_REPO_DIR") {
     793            0 :         Some(val) => {
     794            0 :             let path = PathBuf::from(val);
     795            0 :             if !path.is_absolute() {
     796              :                 // repeat the env var in the error because our default is always absolute
     797            0 :                 panic!("NEON_REPO_DIR must be an absolute path, got {path:?}");
     798            0 :             }
     799            0 :             path
     800              :         }
     801              :         None => {
     802            0 :             let pwd = std::env::current_dir()
     803            0 :                 // technically this can fail but it's quite unlikeley
     804            0 :                 .expect("determine current directory");
     805            0 :             let pwd_abs = pwd.canonicalize().expect("canonicalize current directory");
     806            0 :             pwd_abs.join(".neon")
     807              :         }
     808              :     };
     809            0 :     assert!(path.is_absolute());
     810            0 :     path
     811            0 : }
     812              : 
     813              : /// Generate a public/private key pair for JWT authentication
     814            0 : fn generate_auth_keys(private_key_path: &Path, public_key_path: &Path) -> anyhow::Result<()> {
     815              :     // Generate the key pair
     816              :     //
     817              :     // openssl genpkey -algorithm ed25519 -out auth_private_key.pem
     818            0 :     let keygen_output = Command::new("openssl")
     819            0 :         .arg("genpkey")
     820            0 :         .args(["-algorithm", "ed25519"])
     821            0 :         .args(["-out", private_key_path.to_str().unwrap()])
     822            0 :         .stdout(Stdio::null())
     823            0 :         .output()
     824            0 :         .context("failed to generate auth private key")?;
     825            0 :     if !keygen_output.status.success() {
     826            0 :         bail!(
     827            0 :             "openssl failed: '{}'",
     828            0 :             String::from_utf8_lossy(&keygen_output.stderr)
     829            0 :         );
     830            0 :     }
     831              :     // Extract the public key from the private key file
     832              :     //
     833              :     // openssl pkey -in auth_private_key.pem -pubout -out auth_public_key.pem
     834            0 :     let keygen_output = Command::new("openssl")
     835            0 :         .arg("pkey")
     836            0 :         .args(["-in", private_key_path.to_str().unwrap()])
     837            0 :         .arg("-pubout")
     838            0 :         .args(["-out", public_key_path.to_str().unwrap()])
     839            0 :         .output()
     840            0 :         .context("failed to extract public key from private key")?;
     841            0 :     if !keygen_output.status.success() {
     842            0 :         bail!(
     843            0 :             "openssl failed: '{}'",
     844            0 :             String::from_utf8_lossy(&keygen_output.stderr)
     845            0 :         );
     846            0 :     }
     847            0 :     Ok(())
     848            0 : }
        

Generated by: LCOV version 2.1-beta