LCOV - code coverage report
Current view: top level - libs/tenant_size_model/src - calculation.rs (source / functions) Coverage Total Hit
Test: a43a77853355b937a79c57b07a8f05607cf29e6c.info Lines: 98.3 % 121 119
Test Date: 2024-09-19 12:04:32 Functions: 100.0 % 3 3

            Line data    Source code
       1              : use crate::{SegmentMethod, SegmentSizeResult, SizeResult, StorageModel};
       2              : 
       3              : //
       4              : //                 *-g--*---D--->
       5              : //                /
       6              : //               /
       7              : //              /                 *---b----*-B--->
       8              : //             /                 /
       9              : //            /                 /
      10              : //      -----*--e---*-----f----* C
      11              : //           E                  \
      12              : //                               \
      13              : //                                *--a---*---A-->
      14              : //
      15              : // If A and B need to be retained, is it cheaper to store
      16              : // a snapshot at C+a+b, or snapshots at A and B?
      17              : //
      18              : // If D also needs to be retained, which is cheaper:
      19              : //
      20              : // 1. E+g+e+f+a+b
      21              : // 2. D+C+a+b
      22              : // 3. D+A+B
      23              : 
      24              : /// `Segment` which has had its size calculated.
      25              : #[derive(Clone, Debug)]
      26              : struct SegmentSize {
      27              :     method: SegmentMethod,
      28              : 
      29              :     // calculated size of this subtree, using this method
      30              :     accum_size: u64,
      31              : 
      32              :     seg_id: usize,
      33              :     children: Vec<SegmentSize>,
      34              : }
      35              : 
      36              : struct SizeAlternatives {
      37              :     /// cheapest alternative if parent is available.
      38              :     incremental: SegmentSize,
      39              : 
      40              :     /// cheapest alternative if parent node is not available
      41              :     non_incremental: Option<SegmentSize>,
      42              : }
      43              : 
      44              : impl StorageModel {
      45           18 :     pub fn calculate(&self) -> SizeResult {
      46           18 :         // Build adjacency list. 'child_list' is indexed by segment id. Each entry
      47           18 :         // contains a list of all child segments of the segment.
      48           18 :         let mut roots: Vec<usize> = Vec::new();
      49           18 :         let mut child_list: Vec<Vec<usize>> = Vec::new();
      50           18 :         child_list.resize(self.segments.len(), Vec::new());
      51              : 
      52          141 :         for (seg_id, seg) in self.segments.iter().enumerate() {
      53          141 :             if let Some(parent_id) = seg.parent {
      54          123 :                 child_list[parent_id].push(seg_id);
      55          123 :             } else {
      56           18 :                 roots.push(seg_id);
      57           18 :             }
      58              :         }
      59              : 
      60           18 :         let mut segment_results = Vec::new();
      61           18 :         segment_results.resize(
      62           18 :             self.segments.len(),
      63           18 :             SegmentSizeResult {
      64           18 :                 method: SegmentMethod::Skipped,
      65           18 :                 accum_size: 0,
      66           18 :             },
      67           18 :         );
      68           18 : 
      69           18 :         let mut total_size = 0;
      70           36 :         for root in roots {
      71           18 :             if let Some(selected) = self.size_here(root, &child_list).non_incremental {
      72           18 :                 StorageModel::fill_selected_sizes(&selected, &mut segment_results);
      73           18 :                 total_size += selected.accum_size;
      74           18 :             } else {
      75            0 :                 // Couldn't find any way to get this root. Error?
      76            0 :             }
      77              :         }
      78              : 
      79           18 :         SizeResult {
      80           18 :             total_size,
      81           18 :             segments: segment_results,
      82           18 :         }
      83           18 :     }
      84              : 
      85          141 :     fn fill_selected_sizes(selected: &SegmentSize, result: &mut Vec<SegmentSizeResult>) {
      86          141 :         result[selected.seg_id] = SegmentSizeResult {
      87          141 :             method: selected.method,
      88          141 :             accum_size: selected.accum_size,
      89          141 :         };
      90              :         // recurse to children
      91          141 :         for child in selected.children.iter() {
      92          123 :             StorageModel::fill_selected_sizes(child, result);
      93          123 :         }
      94          141 :     }
      95              : 
      96              :     //
      97              :     // This is the core of the sizing calculation.
      98              :     //
      99              :     // This is a recursive function that, for each Segment, calculates the best way
     100              :     // to reach all the Segments that are marked as needed in this subtree, under two
     101              :     // different conditions:
     102              :     // a) when the parent of this segment is available (as a snapshot or through WAL), and
     103              :     // b) when the parent of this segment is not available.
     104              :     //
     105          141 :     fn size_here(&self, seg_id: usize, child_list: &Vec<Vec<usize>>) -> SizeAlternatives {
     106          141 :         let seg = &self.segments[seg_id];
     107          141 :         // First figure out the best way to get each child
     108          141 :         let mut children = Vec::new();
     109          141 :         for child_id in &child_list[seg_id] {
     110          123 :             children.push(self.size_here(*child_id, child_list))
     111              :         }
     112              : 
     113              :         // Method 1. If this node is not needed, we can skip it as long as we
     114              :         // take snapshots later in each sub-tree
     115          141 :         let snapshot_later = if !seg.needed {
     116           98 :             let mut snapshot_later = SegmentSize {
     117           98 :                 seg_id,
     118           98 :                 method: SegmentMethod::Skipped,
     119           98 :                 accum_size: 0,
     120           98 :                 children: Vec::new(),
     121           98 :             };
     122           98 : 
     123           98 :             let mut possible = true;
     124          104 :             for child in children.iter() {
     125          104 :                 if let Some(non_incremental) = &child.non_incremental {
     126           70 :                     snapshot_later.accum_size += non_incremental.accum_size;
     127           70 :                     snapshot_later.children.push(non_incremental.clone())
     128              :                 } else {
     129           34 :                     possible = false;
     130           34 :                     break;
     131              :                 }
     132              :             }
     133           98 :             if possible {
     134           64 :                 Some(snapshot_later)
     135              :             } else {
     136           34 :                 None
     137              :             }
     138              :         } else {
     139           43 :             None
     140              :         };
     141              : 
     142              :         // Method 2. Get a snapshot here. This is assumed to be possible, if the 'size' of
     143              :         // this Segment was given.
     144          141 :         let snapshot_here = if !seg.needed || seg.parent.is_none() {
     145           98 :             if let Some(snapshot_size) = seg.size {
     146           74 :                 let mut snapshot_here = SegmentSize {
     147           74 :                     seg_id,
     148           74 :                     method: SegmentMethod::SnapshotHere,
     149           74 :                     accum_size: snapshot_size,
     150           74 :                     children: Vec::new(),
     151           74 :                 };
     152           87 :                 for child in children.iter() {
     153           87 :                     snapshot_here.accum_size += child.incremental.accum_size;
     154           87 :                     snapshot_here.children.push(child.incremental.clone())
     155              :                 }
     156           74 :                 Some(snapshot_here)
     157              :             } else {
     158           24 :                 None
     159              :             }
     160              :         } else {
     161           43 :             None
     162              :         };
     163              : 
     164              :         // Method 3. Use WAL to get here from parent
     165          141 :         let wal_here = {
     166          141 :             let mut wal_here = SegmentSize {
     167          141 :                 seg_id,
     168          141 :                 method: SegmentMethod::Wal,
     169          141 :                 accum_size: if let Some(parent_id) = seg.parent {
     170          123 :                     seg.lsn - self.segments[parent_id].lsn
     171              :                 } else {
     172           18 :                     0
     173              :                 },
     174          141 :                 children: Vec::new(),
     175              :             };
     176          264 :             for child in children {
     177          123 :                 wal_here.accum_size += child.incremental.accum_size;
     178          123 :                 wal_here.children.push(child.incremental)
     179              :             }
     180          141 :             wal_here
     181          141 :         };
     182          141 : 
     183          141 :         // If the parent is not available, what's the cheapest method involving
     184          141 :         // a snapshot here or later?
     185          141 :         let mut cheapest_non_incremental: Option<SegmentSize> = None;
     186          141 :         if let Some(snapshot_here) = snapshot_here {
     187           74 :             cheapest_non_incremental = Some(snapshot_here);
     188           74 :         }
     189          141 :         if let Some(snapshot_later) = snapshot_later {
     190              :             // Use <=, to prefer skipping if the size is equal
     191           64 :             if let Some(parent) = &cheapest_non_incremental {
     192           40 :                 if snapshot_later.accum_size <= parent.accum_size {
     193           34 :                     cheapest_non_incremental = Some(snapshot_later);
     194           34 :                 }
     195           24 :             } else {
     196           24 :                 cheapest_non_incremental = Some(snapshot_later);
     197           24 :             }
     198           77 :         }
     199              : 
     200              :         // And what's the cheapest method, if the parent is available?
     201          141 :         let cheapest_incremental = if let Some(cheapest_non_incremental) = &cheapest_non_incremental
     202              :         {
     203              :             // Is it cheaper to use a snapshot here or later, anyway?
     204              :             // Use <, to prefer Wal over snapshot if the cost is the same
     205           98 :             if wal_here.accum_size < cheapest_non_incremental.accum_size {
     206           67 :                 wal_here
     207              :             } else {
     208           31 :                 cheapest_non_incremental.clone()
     209              :             }
     210              :         } else {
     211           43 :             wal_here
     212              :         };
     213              : 
     214          141 :         SizeAlternatives {
     215          141 :             incremental: cheapest_incremental,
     216          141 :             non_incremental: cheapest_non_incremental,
     217          141 :         }
     218          141 :     }
     219              : }
        

Generated by: LCOV version 2.1-beta