LCOV - code coverage report
Current view: top level - storage_scrubber/src - cloud_admin_api.rs (source / functions) Coverage Total Hit
Test: 53437f7e869ac68c86c7d3e4c20964c0156f158c.info Lines: 0.0 % 366 0
Test Date: 2024-09-20 16:14:12 Functions: 0.0 % 135 0

            Line data    Source code
       1              : use chrono::{DateTime, Utc};
       2              : use futures::Future;
       3              : use hex::FromHex;
       4              : 
       5              : use reqwest::{header, Client, StatusCode, Url};
       6              : use serde::Deserialize;
       7              : use tokio::sync::Semaphore;
       8              : 
       9              : use tokio_util::sync::CancellationToken;
      10              : use utils::backoff;
      11              : use utils::id::{TenantId, TimelineId};
      12              : use utils::lsn::Lsn;
      13              : 
      14              : use crate::ConsoleConfig;
      15              : 
      16              : #[derive(Debug)]
      17              : pub struct Error {
      18              :     context: String,
      19              :     kind: ErrorKind,
      20              : }
      21              : 
      22              : impl Error {
      23            0 :     fn new(context: String, kind: ErrorKind) -> Self {
      24            0 :         Self { context, kind }
      25            0 :     }
      26              : }
      27              : 
      28              : impl std::fmt::Display for Error {
      29            0 :     fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
      30            0 :         match &self.kind {
      31            0 :             ErrorKind::RequestSend(e) => write!(
      32            0 :                 f,
      33            0 :                 "Failed to send a request. Context: {}, error: {}",
      34            0 :                 self.context, e
      35            0 :             ),
      36            0 :             ErrorKind::BodyRead(e) => {
      37            0 :                 write!(
      38            0 :                     f,
      39            0 :                     "Failed to read a request body. Context: {}, error: {}",
      40            0 :                     self.context, e
      41            0 :                 )
      42              :             }
      43            0 :             ErrorKind::ResponseStatus(status) => {
      44            0 :                 write!(f, "Bad response status {}: {}", status, self.context)
      45              :             }
      46            0 :             ErrorKind::UnexpectedState => write!(f, "Unexpected state: {}", self.context),
      47              :         }
      48            0 :     }
      49              : }
      50              : 
      51            0 : #[derive(Debug, Clone, serde::Deserialize, Hash, PartialEq, Eq)]
      52              : #[serde(transparent)]
      53              : pub struct ProjectId(pub String);
      54              : 
      55            0 : #[derive(Clone, Debug, serde::Deserialize, Hash, PartialEq, Eq)]
      56              : #[serde(transparent)]
      57              : pub struct BranchId(pub String);
      58              : 
      59              : impl std::error::Error for Error {}
      60              : 
      61              : #[derive(Debug)]
      62              : pub enum ErrorKind {
      63              :     RequestSend(reqwest::Error),
      64              :     BodyRead(reqwest::Error),
      65              :     ResponseStatus(StatusCode),
      66              :     UnexpectedState,
      67              : }
      68              : 
      69              : pub struct CloudAdminApiClient {
      70              :     request_limiter: Semaphore,
      71              :     token: String,
      72              :     base_url: Url,
      73              :     http_client: Client,
      74              : }
      75              : 
      76            0 : #[derive(Debug, serde::Deserialize)]
      77              : struct AdminApiResponse<T> {
      78              :     data: T,
      79              :     total: Option<usize>,
      80              : }
      81              : 
      82            0 : #[derive(Debug, serde::Deserialize)]
      83              : pub struct PageserverData {
      84              :     pub id: u64,
      85              :     pub created_at: DateTime<Utc>,
      86              :     pub updated_at: DateTime<Utc>,
      87              :     pub region_id: String,
      88              :     pub version: i64,
      89              :     pub instance_id: String,
      90              :     pub port: u16,
      91              :     pub http_host: String,
      92              :     pub http_port: u16,
      93              :     pub active: bool,
      94              :     pub projects_count: usize,
      95              :     pub availability_zone_id: String,
      96              : }
      97              : 
      98            0 : #[derive(Debug, Clone, serde::Deserialize)]
      99              : pub struct SafekeeperData {
     100              :     pub id: u64,
     101              :     pub created_at: DateTime<Utc>,
     102              :     pub updated_at: DateTime<Utc>,
     103              :     pub region_id: String,
     104              :     pub version: i64,
     105              :     pub instance_id: String,
     106              :     pub active: bool,
     107              :     pub host: String,
     108              :     pub port: u16,
     109              :     pub projects_count: usize,
     110              :     pub availability_zone_id: String,
     111              : }
     112              : 
     113              : /// For ID fields, the Console API does not always return a value or null.  It will
     114              : /// sometimes return an empty string.  Our native Id type does not consider this acceptable
     115              : /// (nor should it), so we use a wrapper for talking to the Console API.
     116            0 : fn from_nullable_id<'de, D>(deserializer: D) -> Result<TenantId, D::Error>
     117            0 : where
     118            0 :     D: serde::de::Deserializer<'de>,
     119            0 : {
     120            0 :     if deserializer.is_human_readable() {
     121            0 :         let id_str = String::deserialize(deserializer)?;
     122            0 :         if id_str.is_empty() {
     123              :             // This is a bogus value, but for the purposes of the scrubber all that
     124              :             // matters is that it doesn't collide with any real IDs.
     125            0 :             Ok(TenantId::from([0u8; 16]))
     126              :         } else {
     127            0 :             TenantId::from_hex(&id_str).map_err(|e| serde::de::Error::custom(format!("{e}")))
     128              :         }
     129              :     } else {
     130            0 :         let id_arr = <[u8; 16]>::deserialize(deserializer)?;
     131            0 :         Ok(TenantId::from(id_arr))
     132              :     }
     133            0 : }
     134              : 
     135            0 : #[derive(Debug, Clone, serde::Deserialize)]
     136              : pub struct ProjectData {
     137              :     pub id: ProjectId,
     138              :     pub name: String,
     139              :     pub region_id: String,
     140              :     pub platform_id: String,
     141              :     pub user_id: String,
     142              :     pub pageserver_id: Option<u64>,
     143              :     #[serde(deserialize_with = "from_nullable_id")]
     144              :     pub tenant: TenantId,
     145              :     pub safekeepers: Vec<SafekeeperData>,
     146              :     pub deleted: bool,
     147              :     pub created_at: DateTime<Utc>,
     148              :     pub updated_at: DateTime<Utc>,
     149              :     pub pg_version: u32,
     150              :     pub max_project_size: u64,
     151              :     pub remote_storage_size: u64,
     152              :     pub resident_size: u64,
     153              :     pub synthetic_storage_size: u64,
     154              :     pub compute_time: u64,
     155              :     pub data_transfer: u64,
     156              :     pub data_storage: u64,
     157              :     pub maintenance_set: Option<String>,
     158              : }
     159              : 
     160            0 : #[derive(Debug, Clone, serde::Deserialize)]
     161              : pub struct BranchData {
     162              :     pub id: BranchId,
     163              :     pub created_at: DateTime<Utc>,
     164              :     pub updated_at: DateTime<Utc>,
     165              :     pub name: String,
     166              :     pub project_id: ProjectId,
     167              :     pub timeline_id: TimelineId,
     168              :     #[serde(default)]
     169              :     pub parent_id: Option<BranchId>,
     170              :     #[serde(default)]
     171              :     pub parent_lsn: Option<Lsn>,
     172              :     pub default: bool,
     173              :     pub deleted: bool,
     174              :     pub logical_size: Option<u64>,
     175              :     pub physical_size: Option<u64>,
     176              :     pub written_size: Option<u64>,
     177              : }
     178              : 
     179              : pub trait MaybeDeleted {
     180              :     fn is_deleted(&self) -> bool;
     181              : }
     182              : 
     183              : impl MaybeDeleted for ProjectData {
     184            0 :     fn is_deleted(&self) -> bool {
     185            0 :         self.deleted
     186            0 :     }
     187              : }
     188              : 
     189              : impl MaybeDeleted for BranchData {
     190            0 :     fn is_deleted(&self) -> bool {
     191            0 :         self.deleted
     192            0 :     }
     193              : }
     194              : 
     195              : impl CloudAdminApiClient {
     196            0 :     pub fn new(config: ConsoleConfig) -> Self {
     197            0 :         Self {
     198            0 :             token: config.token,
     199            0 :             base_url: config.base_url,
     200            0 :             request_limiter: Semaphore::new(200),
     201            0 :             http_client: Client::new(), // TODO timeout configs at least
     202            0 :         }
     203            0 :     }
     204              : 
     205            0 :     pub async fn find_tenant_project(
     206            0 :         &self,
     207            0 :         tenant_id: TenantId,
     208            0 :     ) -> Result<Option<ProjectData>, Error> {
     209            0 :         let _permit = self
     210            0 :             .request_limiter
     211            0 :             .acquire()
     212            0 :             .await
     213            0 :             .expect("Semaphore is not closed");
     214              : 
     215            0 :         let response = CloudAdminApiClient::with_retries(
     216            0 :             || async {
     217            0 :                 let response = self
     218            0 :                     .http_client
     219            0 :                     .get(self.append_url("/projects"))
     220            0 :                     .query(&[
     221            0 :                         ("tenant_id", tenant_id.to_string()),
     222            0 :                         ("show_deleted", "true".to_string()),
     223            0 :                     ])
     224            0 :                     .header(header::ACCEPT, "application/json")
     225            0 :                     .bearer_auth(&self.token)
     226            0 :                     .send()
     227            0 :                     .await
     228            0 :                     .map_err(|e| {
     229            0 :                         Error::new(
     230            0 :                             "Find project for tenant".to_string(),
     231            0 :                             ErrorKind::RequestSend(e),
     232            0 :                         )
     233            0 :                     })?;
     234              : 
     235            0 :                 let response: AdminApiResponse<Vec<ProjectData>> =
     236            0 :                     response.json().await.map_err(|e| {
     237            0 :                         Error::new(
     238            0 :                             "Find project for tenant".to_string(),
     239            0 :                             ErrorKind::BodyRead(e),
     240            0 :                         )
     241            0 :                     })?;
     242            0 :                 Ok(response)
     243            0 :             },
     244            0 :             "find_tenant_project",
     245            0 :         )
     246            0 :         .await?;
     247              : 
     248            0 :         match response.data.len() {
     249            0 :             0 => Ok(None),
     250            0 :             1 => Ok(Some(
     251            0 :                 response
     252            0 :                     .data
     253            0 :                     .into_iter()
     254            0 :                     .next()
     255            0 :                     .expect("Should have exactly one element"),
     256            0 :             )),
     257            0 :             too_many => Err(Error::new(
     258            0 :                 format!("Find project for tenant returned {too_many} projects instead of 0 or 1"),
     259            0 :                 ErrorKind::UnexpectedState,
     260            0 :             )),
     261              :         }
     262            0 :     }
     263              : 
     264            0 :     pub async fn list_projects(&self, region_id: String) -> Result<Vec<ProjectData>, Error> {
     265            0 :         let _permit = self
     266            0 :             .request_limiter
     267            0 :             .acquire()
     268            0 :             .await
     269            0 :             .expect("Semaphore is not closed");
     270            0 : 
     271            0 :         let mut pagination_offset = 0;
     272              :         const PAGINATION_LIMIT: usize = 512;
     273            0 :         let mut result: Vec<ProjectData> = Vec::with_capacity(PAGINATION_LIMIT);
     274              :         loop {
     275            0 :             let response_bytes = CloudAdminApiClient::with_retries(
     276            0 :                 || async {
     277            0 :                     let response = self
     278            0 :                         .http_client
     279            0 :                         .get(self.append_url("/projects"))
     280            0 :                         .query(&[
     281            0 :                             ("show_deleted", "false".to_string()),
     282            0 :                             ("limit", format!("{PAGINATION_LIMIT}")),
     283            0 :                             ("offset", format!("{pagination_offset}")),
     284            0 :                         ])
     285            0 :                         .header(header::ACCEPT, "application/json")
     286            0 :                         .bearer_auth(&self.token)
     287            0 :                         .send()
     288            0 :                         .await
     289            0 :                         .map_err(|e| {
     290            0 :                             Error::new(
     291            0 :                                 "List active projects".to_string(),
     292            0 :                                 ErrorKind::RequestSend(e),
     293            0 :                             )
     294            0 :                         })?;
     295              : 
     296            0 :                     response.bytes().await.map_err(|e| {
     297            0 :                         Error::new("List active projects".to_string(), ErrorKind::BodyRead(e))
     298            0 :                     })
     299            0 :                 },
     300            0 :                 "list_projects",
     301            0 :             )
     302            0 :             .await?;
     303              : 
     304            0 :             let decode_result =
     305            0 :                 serde_json::from_slice::<AdminApiResponse<Vec<ProjectData>>>(&response_bytes);
     306              : 
     307            0 :             let mut response = match decode_result {
     308            0 :                 Ok(r) => r,
     309            0 :                 Err(decode) => {
     310            0 :                     tracing::error!(
     311            0 :                         "Failed to decode response body: {}\n{}",
     312            0 :                         decode,
     313            0 :                         String::from_utf8(response_bytes.to_vec()).unwrap()
     314              :                     );
     315            0 :                     panic!("we out");
     316              :                 }
     317              :             };
     318              : 
     319            0 :             pagination_offset += response.data.len();
     320            0 : 
     321            0 :             result.extend(response.data.drain(..).filter(|t| t.region_id == region_id));
     322            0 : 
     323            0 :             if pagination_offset >= response.total.unwrap_or(0) {
     324            0 :                 break;
     325            0 :             }
     326              :         }
     327              : 
     328            0 :         Ok(result)
     329            0 :     }
     330              : 
     331            0 :     pub async fn find_timeline_branch(
     332            0 :         &self,
     333            0 :         tenant_id: TenantId,
     334            0 :         timeline_id: TimelineId,
     335            0 :     ) -> Result<Option<BranchData>, Error> {
     336            0 :         let _permit = self
     337            0 :             .request_limiter
     338            0 :             .acquire()
     339            0 :             .await
     340            0 :             .expect("Semaphore is not closed");
     341              : 
     342            0 :         let response = CloudAdminApiClient::with_retries(
     343            0 :             || async {
     344            0 :                 let response = self
     345            0 :                     .http_client
     346            0 :                     .get(self.append_url("/branches"))
     347            0 :                     .query(&[
     348            0 :                         ("timeline_id", timeline_id.to_string()),
     349            0 :                         ("show_deleted", "true".to_string()),
     350            0 :                     ])
     351            0 :                     .header(header::ACCEPT, "application/json")
     352            0 :                     .bearer_auth(&self.token)
     353            0 :                     .send()
     354            0 :                     .await
     355            0 :                     .map_err(|e| {
     356            0 :                         Error::new(
     357            0 :                             "Find branch for timeline".to_string(),
     358            0 :                             ErrorKind::RequestSend(e),
     359            0 :                         )
     360            0 :                     })?;
     361              : 
     362            0 :                 let response: AdminApiResponse<Vec<BranchData>> =
     363            0 :                     response.json().await.map_err(|e| {
     364            0 :                         Error::new(
     365            0 :                             "Find branch for timeline".to_string(),
     366            0 :                             ErrorKind::BodyRead(e),
     367            0 :                         )
     368            0 :                     })?;
     369            0 :                 Ok(response)
     370            0 :             },
     371            0 :             "find_timeline_branch",
     372            0 :         )
     373            0 :         .await?;
     374              : 
     375            0 :         let mut branches: Vec<BranchData> = response.data.into_iter().collect();
     376              :         // Normally timeline_id is unique. However, we do have at least one case
     377              :         // of the same timeline_id in two different projects, apparently after
     378              :         // manual recovery. So always recheck project_id (discovered through
     379              :         // tenant_id).
     380            0 :         let project_data = match self.find_tenant_project(tenant_id).await? {
     381            0 :             Some(pd) => pd,
     382            0 :             None => return Ok(None),
     383              :         };
     384            0 :         branches.retain(|b| b.project_id == project_data.id);
     385            0 :         if branches.len() < 2 {
     386            0 :             Ok(branches.first().cloned())
     387              :         } else {
     388            0 :             Err(Error::new(
     389            0 :                 format!(
     390            0 :                     "Find branch for timeline {}/{} returned {} branches instead of 0 or 1",
     391            0 :                     tenant_id,
     392            0 :                     timeline_id,
     393            0 :                     branches.len()
     394            0 :                 ),
     395            0 :                 ErrorKind::UnexpectedState,
     396            0 :             ))
     397              :         }
     398            0 :     }
     399              : 
     400            0 :     pub async fn list_pageservers(&self) -> Result<Vec<PageserverData>, Error> {
     401            0 :         let _permit = self
     402            0 :             .request_limiter
     403            0 :             .acquire()
     404            0 :             .await
     405            0 :             .expect("Semaphore is not closed");
     406              : 
     407            0 :         let response = self
     408            0 :             .http_client
     409            0 :             .get(self.append_url("/pageservers"))
     410            0 :             .header(header::ACCEPT, "application/json")
     411            0 :             .bearer_auth(&self.token)
     412            0 :             .send()
     413            0 :             .await
     414            0 :             .map_err(|e| Error::new("List pageservers".to_string(), ErrorKind::RequestSend(e)))?;
     415              : 
     416            0 :         let response: AdminApiResponse<Vec<PageserverData>> = response
     417            0 :             .json()
     418            0 :             .await
     419            0 :             .map_err(|e| Error::new("List pageservers".to_string(), ErrorKind::BodyRead(e)))?;
     420              : 
     421            0 :         Ok(response.data)
     422            0 :     }
     423              : 
     424            0 :     pub async fn list_safekeepers(&self) -> Result<Vec<SafekeeperData>, Error> {
     425            0 :         let _permit = self
     426            0 :             .request_limiter
     427            0 :             .acquire()
     428            0 :             .await
     429            0 :             .expect("Semaphore is not closed");
     430              : 
     431            0 :         let response = self
     432            0 :             .http_client
     433            0 :             .get(self.append_url("/safekeepers"))
     434            0 :             .header(header::ACCEPT, "application/json")
     435            0 :             .bearer_auth(&self.token)
     436            0 :             .send()
     437            0 :             .await
     438            0 :             .map_err(|e| Error::new("List safekeepers".to_string(), ErrorKind::RequestSend(e)))?;
     439              : 
     440            0 :         let response: AdminApiResponse<Vec<SafekeeperData>> = response
     441            0 :             .json()
     442            0 :             .await
     443            0 :             .map_err(|e| Error::new("List safekeepers".to_string(), ErrorKind::BodyRead(e)))?;
     444              : 
     445            0 :         Ok(response.data)
     446            0 :     }
     447              : 
     448            0 :     pub async fn projects_for_pageserver(
     449            0 :         &self,
     450            0 :         pageserver_id: u64,
     451            0 :         show_deleted: bool,
     452            0 :     ) -> Result<Vec<ProjectData>, Error> {
     453            0 :         let _permit = self
     454            0 :             .request_limiter
     455            0 :             .acquire()
     456            0 :             .await
     457            0 :             .expect("Semaphore is not closed");
     458              : 
     459            0 :         let response = self
     460            0 :             .http_client
     461            0 :             .get(self.append_url("/projects"))
     462            0 :             .query(&[
     463            0 :                 ("pageserver_id", &pageserver_id.to_string()),
     464            0 :                 ("show_deleted", &show_deleted.to_string()),
     465            0 :             ])
     466            0 :             .header(header::ACCEPT, "application/json")
     467            0 :             .bearer_auth(&self.token)
     468            0 :             .send()
     469            0 :             .await
     470            0 :             .map_err(|e| Error::new("Project for tenant".to_string(), ErrorKind::RequestSend(e)))?;
     471              : 
     472            0 :         let response: AdminApiResponse<Vec<ProjectData>> = response
     473            0 :             .json()
     474            0 :             .await
     475            0 :             .map_err(|e| Error::new("Project for tenant".to_string(), ErrorKind::BodyRead(e)))?;
     476              : 
     477            0 :         Ok(response.data)
     478            0 :     }
     479              : 
     480            0 :     pub async fn project_for_tenant(
     481            0 :         &self,
     482            0 :         tenant_id: TenantId,
     483            0 :         show_deleted: bool,
     484            0 :     ) -> Result<Option<ProjectData>, Error> {
     485            0 :         let _permit = self
     486            0 :             .request_limiter
     487            0 :             .acquire()
     488            0 :             .await
     489            0 :             .expect("Semaphore is not closed");
     490              : 
     491            0 :         let response = self
     492            0 :             .http_client
     493            0 :             .get(self.append_url("/projects"))
     494            0 :             .query(&[
     495            0 :                 ("search", &tenant_id.to_string()),
     496            0 :                 ("show_deleted", &show_deleted.to_string()),
     497            0 :             ])
     498            0 :             .header(header::ACCEPT, "application/json")
     499            0 :             .bearer_auth(&self.token)
     500            0 :             .send()
     501            0 :             .await
     502            0 :             .map_err(|e| Error::new("Project for tenant".to_string(), ErrorKind::RequestSend(e)))?;
     503              : 
     504            0 :         let response: AdminApiResponse<Vec<ProjectData>> = response
     505            0 :             .json()
     506            0 :             .await
     507            0 :             .map_err(|e| Error::new("Project for tenant".to_string(), ErrorKind::BodyRead(e)))?;
     508              : 
     509            0 :         match response.data.as_slice() {
     510            0 :             [] => Ok(None),
     511            0 :             [_single] => Ok(Some(response.data.into_iter().next().unwrap())),
     512            0 :             multiple => Err(Error::new(
     513            0 :                 format!("Got more than one project for tenant {tenant_id} : {multiple:?}"),
     514            0 :                 ErrorKind::UnexpectedState,
     515            0 :             )),
     516              :         }
     517            0 :     }
     518              : 
     519            0 :     pub async fn branches_for_project(
     520            0 :         &self,
     521            0 :         project_id: &ProjectId,
     522            0 :         show_deleted: bool,
     523            0 :     ) -> Result<Vec<BranchData>, Error> {
     524            0 :         let _permit = self
     525            0 :             .request_limiter
     526            0 :             .acquire()
     527            0 :             .await
     528            0 :             .expect("Semaphore is not closed");
     529              : 
     530            0 :         let response = self
     531            0 :             .http_client
     532            0 :             .get(self.append_url("/branches"))
     533            0 :             .query(&[
     534            0 :                 ("project_id", &project_id.0),
     535            0 :                 ("show_deleted", &show_deleted.to_string()),
     536            0 :             ])
     537            0 :             .header(header::ACCEPT, "application/json")
     538            0 :             .bearer_auth(&self.token)
     539            0 :             .send()
     540            0 :             .await
     541            0 :             .map_err(|e| Error::new("Project for tenant".to_string(), ErrorKind::RequestSend(e)))?;
     542              : 
     543            0 :         let response: AdminApiResponse<Vec<BranchData>> = response
     544            0 :             .json()
     545            0 :             .await
     546            0 :             .map_err(|e| Error::new("Project for tenant".to_string(), ErrorKind::BodyRead(e)))?;
     547              : 
     548            0 :         Ok(response.data)
     549            0 :     }
     550              : 
     551            0 :     fn append_url(&self, subpath: &str) -> Url {
     552            0 :         // TODO fugly, but `.join` does not work when called
     553            0 :         (self.base_url.to_string() + subpath)
     554            0 :             .parse()
     555            0 :             .unwrap_or_else(|e| panic!("Could not append {subpath} to base url: {e}"))
     556            0 :     }
     557              : 
     558            0 :     async fn with_retries<T, O, F>(op: O, description: &str) -> Result<T, Error>
     559            0 :     where
     560            0 :         O: FnMut() -> F,
     561            0 :         F: Future<Output = Result<T, Error>>,
     562            0 :     {
     563            0 :         let cancel = CancellationToken::new(); // not really used
     564            0 :         backoff::retry(op, |_| false, 1, 20, description, &cancel)
     565            0 :             .await
     566            0 :             .expect("cancellations are disabled")
     567            0 :     }
     568              : }
        

Generated by: LCOV version 2.1-beta