blob: 358bd743c80d30e655f2fce5346ed7095c24afae [file] [log] [blame]
use std::io;
use super::{BLOB, COMMIT, OFS_DELTA, REF_DELTA, TAG, TREE};
use crate::data;
/// The header portion of a pack data entry, identifying the kind of stored object.
#[derive(PartialEq, Eq, Debug, Hash, Ord, PartialOrd, Clone, Copy)]
#[cfg_attr(feature = "serde", derive(serde::Serialize, serde::Deserialize))]
#[allow(missing_docs)]
pub enum Header {
/// The object is a commit
Commit,
/// The object is a tree
Tree,
/// The object is a blob
Blob,
/// The object is a tag
Tag,
/// Describes a delta-object which needs to be applied to a base. The base object is identified by the `base_id` field
/// which is found within the parent repository.
/// Most commonly used for **thin-packs** when receiving pack files from the server to refer to objects that are not
/// part of the pack but expected to be present in the receivers repository.
///
/// # Note
/// This could also be an object within this pack if the LSB encoded offset would be larger than 20 bytes, which is unlikely to
/// happen.
///
/// **The naming** is exactly the same as the canonical implementation uses, namely **REF_DELTA**.
RefDelta { base_id: gix_hash::ObjectId },
/// Describes a delta-object present in this pack which acts as base for this object.
/// The base object is measured as a distance from this objects
/// pack offset, so that `base_pack_offset = this_objects_pack_offset - base_distance`
///
/// # Note
///
/// **The naming** is exactly the same as the canonical implementation uses, namely **OFS_DELTA**.
OfsDelta { base_distance: u64 },
}
impl Header {
/// Subtract `distance` from `pack_offset` safely without the chance for overflow or no-ops if `distance` is 0.
pub fn verified_base_pack_offset(pack_offset: data::Offset, distance: u64) -> Option<data::Offset> {
if distance == 0 {
return None;
}
pack_offset.checked_sub(distance)
}
/// Convert the header's object kind into [`gix_object::Kind`] if possible
pub fn as_kind(&self) -> Option<gix_object::Kind> {
use gix_object::Kind::*;
Some(match self {
Header::Tree => Tree,
Header::Blob => Blob,
Header::Commit => Commit,
Header::Tag => Tag,
Header::RefDelta { .. } | Header::OfsDelta { .. } => return None,
})
}
/// Convert this header's object kind into the packs internal representation
pub fn as_type_id(&self) -> u8 {
use Header::*;
match self {
Blob => BLOB,
Tree => TREE,
Commit => COMMIT,
Tag => TAG,
OfsDelta { .. } => OFS_DELTA,
RefDelta { .. } => REF_DELTA,
}
}
/// Return's true if this is a delta object, i.e. not a full object.
pub fn is_delta(&self) -> bool {
matches!(self, Header::OfsDelta { .. } | Header::RefDelta { .. })
}
/// Return's true if this is a base object, i.e. not a delta object.
pub fn is_base(&self) -> bool {
!self.is_delta()
}
}
impl Header {
/// Encode this header along the given `decompressed_size_in_bytes` into the `out` write stream for use within a data pack.
///
/// Returns the amount of bytes written to `out`.
/// `decompressed_size_in_bytes` is the full size in bytes of the object that this header represents
pub fn write_to(&self, decompressed_size_in_bytes: u64, out: &mut dyn io::Write) -> io::Result<usize> {
let mut size = decompressed_size_in_bytes;
let mut written = 1;
let mut c: u8 = (self.as_type_id() << 4) | (size as u8 & 0b0000_1111);
size >>= 4;
while size != 0 {
out.write_all(&[c | 0b1000_0000])?;
written += 1;
c = size as u8 & 0b0111_1111;
size >>= 7;
}
out.write_all(&[c])?;
use Header::*;
match self {
RefDelta { base_id: oid } => {
out.write_all(oid.as_slice())?;
written += oid.as_slice().len();
}
OfsDelta { base_distance } => {
let mut buf = [0u8; 10];
let buf = leb64_encode(*base_distance, &mut buf);
out.write_all(buf)?;
written += buf.len();
}
Blob | Tree | Commit | Tag => {}
}
Ok(written)
}
/// The size of the header in bytes when serialized
pub fn size(&self, decompressed_size: u64) -> usize {
self.write_to(decompressed_size, &mut io::sink())
.expect("io::sink() to never fail")
}
}
#[inline]
fn leb64_encode(mut n: u64, buf: &mut [u8; 10]) -> &[u8] {
let mut bytes_written = 1;
buf[buf.len() - 1] = n as u8 & 0b0111_1111;
for out in buf.iter_mut().rev().skip(1) {
n >>= 7;
if n == 0 {
break;
}
n -= 1;
*out = 0b1000_0000 | (n as u8 & 0b0111_1111);
bytes_written += 1;
}
debug_assert_eq!(n, 0, "BUG: buffer must be large enough to hold a 64 bit integer");
&buf[buf.len() - bytes_written..]
}
#[cfg(test)]
mod tests {
use super::*;
#[test]
fn leb64_encode_max_int() {
let mut buf = [0u8; 10];
let buf = leb64_encode(u64::MAX, &mut buf);
assert_eq!(buf.len(), 10, "10 bytes should be used when 64bits are encoded");
}
}