1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113
use std::{collections::BTreeMap, marker::PhantomData};
/// Statistics regarding object encountered during execution of the [`traverse()`][crate::index::File::traverse()] method.
#[derive(Debug, PartialEq, Eq, Hash, Ord, PartialOrd, Clone)]
#[cfg_attr(feature = "serde", derive(serde::Serialize, serde::Deserialize))]
pub struct Statistics {
/// The average over all decoded objects
pub average: crate::data::decode::entry::Outcome,
/// A mapping of the length of the chain to the amount of objects at that length.
///
/// A length of 0 indicates full objects, and everything above that involves the given amount
/// of delta objects.
pub objects_per_chain_length: BTreeMap<u32, u32>,
/// The amount of bytes in all compressed streams, one per entry
pub total_compressed_entries_size: u64,
/// The amount of bytes in all decompressed streams, one per entry
pub total_decompressed_entries_size: u64,
/// The amount of bytes occupied by all undeltified, decompressed objects
pub total_object_size: u64,
/// The amount of bytes occupied by the pack itself, in bytes
pub pack_size: u64,
/// The amount of objects encountered that where commits
pub num_commits: u32,
/// The amount of objects encountered that where trees
pub num_trees: u32,
/// The amount of objects encountered that where tags
pub num_tags: u32,
/// The amount of objects encountered that where blobs
pub num_blobs: u32,
}
impl Default for Statistics {
fn default() -> Self {
Statistics {
average: crate::data::decode::entry::Outcome::default_from_kind(gix_object::Kind::Tree),
objects_per_chain_length: Default::default(),
total_compressed_entries_size: 0,
total_decompressed_entries_size: 0,
total_object_size: 0,
pack_size: 0,
num_blobs: 0,
num_commits: 0,
num_trees: 0,
num_tags: 0,
}
}
}
/// The ways to validate decoded objects before passing them to the processor.
#[derive(Default, Debug, PartialEq, Eq, Hash, Ord, PartialOrd, Clone, Copy)]
#[cfg_attr(feature = "serde", derive(serde::Serialize, serde::Deserialize))]
pub enum SafetyCheck {
/// Don't verify the validity of the checksums stored in the index and pack file
SkipFileChecksumVerification,
/// All of the above, and also don't perform any object checksum verification
SkipFileAndObjectChecksumVerification,
/// All of the above, and only log object decode errors.
///
/// Useful if there is a damaged pack and you would like to traverse as many objects as possible.
SkipFileAndObjectChecksumVerificationAndNoAbortOnDecodeError,
/// Perform all available safety checks before operating on the pack and
/// abort if any of them fails
#[default]
All,
}
impl SafetyCheck {
pub(crate) fn file_checksum(&self) -> bool {
matches!(self, SafetyCheck::All)
}
pub(crate) fn object_checksum(&self) -> bool {
matches!(self, SafetyCheck::All | SafetyCheck::SkipFileChecksumVerification)
}
pub(crate) fn fatal_decode_error(&self) -> bool {
match self {
SafetyCheck::All
| SafetyCheck::SkipFileChecksumVerification
| SafetyCheck::SkipFileAndObjectChecksumVerification => true,
SafetyCheck::SkipFileAndObjectChecksumVerificationAndNoAbortOnDecodeError => false,
}
}
}
/// The way we verify the pack
#[derive(Default, Debug, PartialEq, Eq, Hash, Ord, PartialOrd, Clone, Copy)]
#[cfg_attr(feature = "serde", derive(serde::Serialize, serde::Deserialize))]
pub enum Algorithm {
/// Build an index to allow decoding each delta and base exactly once, saving a lot of computational
/// resource at the expense of resident memory, as we will use an additional `DeltaTree` to accelerate
/// delta chain resolution.
#[default]
DeltaTreeLookup,
/// We lookup each object similarly to what would happen during normal repository use.
/// Uses more compute resources as it will resolve delta chains from back to front, but start right away
/// without indexing or investing any memory in indices.
///
/// This option may be well suited for big packs in memory-starved system that support memory mapping.
Lookup,
}
/// The progress ids used in [`traverse()`][crate::index::File::traverse()] .
///
/// Use this information to selectively extract the progress of interest in case the parent application has custom visualization.
#[derive(Debug, Copy, Clone)]
pub enum ProgressId {
/// A root progress which isn't actually used, but links to the `ProgressId` of the lookup version of the algorithm.
WithLookup(PhantomData<super::with_lookup::ProgressId>),
/// A root progress which isn't actually used, but links to the `ProgressId` of the indexed version of the algorithm.
WithIndex(PhantomData<super::with_index::ProgressId>),
}