blob: 385aa3d719cf99b61a1d269e17090da05e1e1d89 [file] [log] [blame]
//! a pack data file
use std::path::Path;
/// The offset to an entry into the pack data file, relative to its beginning.
pub type Offset = u64;
/// An identifier to uniquely identify all packs loaded within a known context or namespace.
pub type Id = u32;
use memmap2::Mmap;
/// An representing an full- or delta-object within a pack
#[derive(PartialEq, Eq, Debug, Hash, Ord, PartialOrd, Clone)]
#[cfg_attr(feature = "serde", derive(serde::Serialize, serde::Deserialize))]
pub struct Entry {
/// The entry's header
pub header: entry::Header,
/// The decompressed size of the entry in bytes.
///
/// Note that for non-delta entries this will be the size of the object itself.
pub decompressed_size: u64,
/// absolute offset to compressed object data in the pack, just behind the entry's header
pub data_offset: Offset,
}
mod file;
pub use file::{decode, verify, Header};
///
#[allow(clippy::empty_docs)]
pub mod header;
///
#[allow(clippy::empty_docs)]
pub mod init {
pub use super::header::decode::Error;
}
///
#[allow(clippy::empty_docs)]
pub mod entry;
///
#[cfg(feature = "streaming-input")]
pub mod input;
/// Utilities to encode pack data entries and write them to a `Write` implementation to resemble a pack data file.
#[cfg(feature = "generate")]
pub mod output;
/// A slice into a pack file denoting a pack entry.
///
/// An entry can be decoded into an object.
pub type EntryRange = std::ops::Range<Offset>;
/// Supported versions of a pack data file
#[derive(Default, PartialEq, Eq, Debug, Hash, Ord, PartialOrd, Clone, Copy)]
#[cfg_attr(feature = "serde", derive(serde::Serialize, serde::Deserialize))]
#[allow(missing_docs)]
pub enum Version {
#[default]
V2,
V3,
}
/// A pack data file
pub struct File {
data: Mmap,
path: std::path::PathBuf,
/// A value to represent this pack uniquely when used with cache lookup, or a way to identify this pack by its location on disk.
/// The same location on disk should yield the same id.
///
/// These must be unique per pack and must be stable, that is they don't change if the pack doesn't change.
/// If the same id is assigned (or reassigned) to different packs, pack creation or cache access will fail in hard-to-debug ways.
///
/// This value is controlled by the owning object store, which can use it in whichever way it wants as long as the above constraints are met.
pub id: Id,
version: Version,
num_objects: u32,
/// The size of the hash contained within. This is entirely determined by the caller, and repositories have to know which hash to use
/// based on their configuration.
hash_len: usize,
object_hash: gix_hash::Kind,
}
/// Information about the pack data file itself
impl File {
/// The pack data version of this file
pub fn version(&self) -> Version {
self.version
}
/// The number of objects stored in this pack data file
pub fn num_objects(&self) -> u32 {
self.num_objects
}
/// The length of all mapped data, including the pack header and the pack trailer
pub fn data_len(&self) -> usize {
self.data.len()
}
/// The kind of hash we use internally.
pub fn object_hash(&self) -> gix_hash::Kind {
self.object_hash
}
/// The position of the byte one past the last pack entry, or in other terms, the first byte of the trailing hash.
pub fn pack_end(&self) -> usize {
self.data.len() - self.hash_len
}
/// The path to the pack data file on disk
pub fn path(&self) -> &Path {
&self.path
}
/// Returns the pack data at the given slice if its range is contained in the mapped pack data
pub fn entry_slice(&self, slice: EntryRange) -> Option<&[u8]> {
let entry_end: usize = slice.end.try_into().expect("end of pack fits into usize");
let entry_start = slice.start as usize;
self.data.get(entry_start..entry_end)
}
/// Returns the CRC32 of the pack data indicated by `pack_offset` and the `size` of the mapped data.
///
/// _Note:_ finding the right size is only possible by decompressing
/// the pack entry beforehand, or by using the (to be sorted) offsets stored in an index file.
///
/// # Panics
///
/// If `pack_offset` or `size` are pointing to a range outside of the mapped pack data.
pub fn entry_crc32(&self, pack_offset: Offset, size: usize) -> u32 {
let pack_offset: usize = pack_offset.try_into().expect("pack_size fits into usize");
gix_features::hash::crc32(&self.data[pack_offset..pack_offset + size])
}
}
pub(crate) mod delta;