blob: 35c990556af2e6dd4d00494b6ebb2e778c9c9292 [file] [log] [blame]
// Copyright 2022 The ChromiumOS Authors
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
//! This crate provides tools to help decode and encode various video codecs, leveraging the
//! hardware acceleration available on the target.
//!
//! The [codec] module contains tools to parse encoded video streams like H.264 or VP9 and extract
//! the information useful in order to perform e.g. hardware-accelerated decoding.
//!
//! The [backend] module contains common backend code. A backend is a provider of some way to
//! decode or encode a particular codec, like VAAPI.
//!
//! The [decoder] module contains decoders that can turn an encoded video stream into a sequence of
//! decoded frames using the hardware acceleration available on the host.
//!
//! The [encoder] module contains encoder that can turn a picture sequence into a compressed
//! sequence of decodable encoded packets using the hardware acceleration available on the host.
//!
//! The [utils] module contains some useful code that is shared between different parts of this
//! crate and didn't fit any of the modules above.
pub mod bitstream_utils;
pub mod codec;
#[cfg(any(feature = "vaapi", feature = "v4l2"))]
pub mod backend;
#[cfg(any(feature = "vaapi", feature = "v4l2"))]
pub mod decoder;
#[cfg(any(feature = "vaapi", feature = "v4l2"))]
pub mod encoder;
#[cfg(any(feature = "vaapi", feature = "v4l2"))]
pub mod image_processing;
#[cfg(any(feature = "vaapi", feature = "v4l2"))]
pub mod utils;
use std::str::FromStr;
#[cfg(feature = "vaapi")]
pub use libva;
#[cfg(feature = "v4l2")]
pub use v4l2r;
/// Rounding modes for `Resolution`
#[derive(Copy, Clone, Debug, PartialEq, Eq)]
pub enum ResolutionRoundMode {
/// Rounds component-wise to the next even value.
Even,
}
/// A frame resolution in pixels.
#[derive(Copy, Clone, Debug, Default, PartialEq, Eq)]
pub struct Resolution {
pub width: u32,
pub height: u32,
}
impl Resolution {
/// Whether `self` can contain `other`.
pub fn can_contain(&self, other: Self) -> bool {
self.width >= other.width && self.height >= other.height
}
/// Rounds `self` according to `rnd_mode`.
pub fn round(mut self, rnd_mode: ResolutionRoundMode) -> Self {
match rnd_mode {
ResolutionRoundMode::Even => {
if self.width % 2 != 0 {
self.width += 1;
}
if self.height % 2 != 0 {
self.height += 1;
}
}
}
self
}
}
impl From<(u32, u32)> for Resolution {
fn from(value: (u32, u32)) -> Self {
Self {
width: value.0,
height: value.1,
}
}
}
impl From<Resolution> for (u32, u32) {
fn from(value: Resolution) -> Self {
(value.width, value.height)
}
}
/// Wrapper around u32 when they are meant to be a fourcc.
///
/// Provides conversion and display/debug implementations useful when dealing with fourcc codes.
#[derive(Clone, Copy, PartialEq)]
pub struct Fourcc(u32);
impl From<u32> for Fourcc {
fn from(fourcc: u32) -> Self {
Self(fourcc)
}
}
impl From<Fourcc> for u32 {
fn from(fourcc: Fourcc) -> Self {
fourcc.0
}
}
impl From<&[u8; 4]> for Fourcc {
fn from(n: &[u8; 4]) -> Self {
Self(n[0] as u32 | (n[1] as u32) << 8 | (n[2] as u32) << 16 | (n[3] as u32) << 24)
}
}
impl From<Fourcc> for [u8; 4] {
fn from(n: Fourcc) -> Self {
[
n.0 as u8,
(n.0 >> 8) as u8,
(n.0 >> 16) as u8,
(n.0 >> 24) as u8,
]
}
}
impl std::fmt::Display for Fourcc {
fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
let c: [u8; 4] = (*self).into();
f.write_fmt(format_args!(
"{}{}{}{}",
c[0] as char, c[1] as char, c[2] as char, c[3] as char
))
}
}
impl std::fmt::Debug for Fourcc {
fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
f.write_fmt(format_args!("0x{:08x} ({})", self.0, self))
}
}
/// Formats that buffers can be mapped into for the CPU to read.
///
/// The conventions here largely follow these of libyuv.
#[derive(Copy, Clone, Debug, PartialEq, Eq, Hash)]
pub enum DecodedFormat {
/// Y, U and V planes, 4:2:0 sampling, 8 bits per sample.
I420,
/// One Y and one interleaved UV plane, 4:2:0 sampling, 8 bits per sample.
NV12,
/// Y, U and V planes, 4:2:2 sampling, 8 bits per sample.
I422,
/// Y, U and V planes, 4:4:4 sampling, 8 bits per sample.
I444,
/// Y, U and V planes, 4:2:0 sampling, 16 bits per sample, LE. Only the 10 LSBs are used.
I010,
/// Y, U and V planes, 4:2:0 sampling, 16 bits per sample, LE. Only the 12 LSBs are used.
I012,
/// Y, U and V planes, 4:2:2 sampling, 16 bits per sample, LE. Only the 10 LSBs are used.
I210,
/// Y, U and V planes, 4:2:2 sampling, 16 bits per sample, LE. Only the 12 LSBs are used.
I212,
/// Y, U and V planes, 4:4:4 sampling, 16 bits per sample, LE. Only the 10 LSBs are used.
I410,
/// Y, U and V planes, 4:4:4 sampling, 16 bits per sample, LE. Only the 12 LSBs are used.
I412,
}
impl FromStr for DecodedFormat {
type Err = &'static str;
fn from_str(s: &str) -> Result<Self, Self::Err> {
match s {
"i420" | "I420" => Ok(DecodedFormat::I420),
"i422" | "I422" => Ok(DecodedFormat::I422),
"i444" | "I444" => Ok(DecodedFormat::I444),
"nv12" | "NV12" => Ok(DecodedFormat::NV12),
"i010" | "I010" => Ok(DecodedFormat::I010),
"i012" | "I012" => Ok(DecodedFormat::I012),
"i210" | "I210" => Ok(DecodedFormat::I210),
"i212" | "I212" => Ok(DecodedFormat::I212),
"i410" | "I410" => Ok(DecodedFormat::I410),
"i412" | "I412" => Ok(DecodedFormat::I412),
_ => {
Err("unrecognized output format. Valid values: i420, nv12, i422, i444, i010, i012, i210, i212, i410, i412")
}
}
}
}
/// Describes the layout of a plane within a frame.
#[derive(Debug, Clone, PartialEq)]
pub struct PlaneLayout {
/// Index of the memory buffer the plane belongs to.
pub buffer_index: usize,
/// Start offset of the plane within its buffer.
pub offset: usize,
/// Distance in bytes between two lines of data in this plane.
pub stride: usize,
}
/// Unambiguously describes the layout of a frame.
///
/// A frame can be made of one or several memory buffers, each containing one or several planes.
/// For a given frame, this structure defines where each plane can be found.
#[derive(Debug, Clone, PartialEq)]
pub struct FrameLayout {
/// `(Fourcc, modifier)` tuple describing the arrangement of the planes.
///
/// This member is enough to infer how many planes and buffers the frame has, and which
/// buffer each plane belongs into.
pub format: (Fourcc, u64),
/// Size in pixels of the frame.
pub size: Resolution,
/// Layout of each individual plane.
pub planes: Vec<PlaneLayout>,
}
/// Build a frame memory descriptor enum that supports multiple descriptor types.
///
/// This is useful for the case where the frames' memory backing is not decided at compile-time.
/// In this case, this macro can be used to list all the potential types supported at run-time, and
/// the selected one can be built as the program is run.
///
/// # Example
///
///
/// use cros_codecs::multiple_desc_type;
/// use cros_codecs::utils::DmabufFrame;
///
/// /// Frames' memory can be provided either by the backend, or via PRIME DMABUF handles.
/// multiple_desc_type! {
/// enum OwnedOrDmaDescriptor {
/// Owned(()),
/// Dmabuf(DmabufFrame),
/// }
/// }
///
#[macro_export]
macro_rules! multiple_desc_type {
(enum $s:ident { $($v:ident($t:ty),)* } ) => {
enum $s {
$($v($t),)*
}
#[cfg(feature = "vaapi")]
impl libva::SurfaceMemoryDescriptor for $s {
fn add_attrs(&mut self, attrs: &mut Vec<libva::VASurfaceAttrib>) -> Option<Box<dyn std::any::Any>> {
match self {
$($s::$v(desc) => desc.add_attrs(attrs),)*
}
}
}
}
}
/// Returns the size required to store a frame of `format` with size `width`x`height`, without any
/// padding. This is the minimum size of the destination buffer passed to `nv12_copy` or
/// `i420_copy`.
pub fn decoded_frame_size(format: DecodedFormat, width: usize, height: usize) -> usize {
match format {
DecodedFormat::I420 | DecodedFormat::NV12 => {
let u_size = width * height;
// U and V planes need to be aligned to 2.
let uv_size = ((width + 1) / 2) * ((height + 1) / 2) * 2;
u_size + uv_size
}
DecodedFormat::I422 => {
let u_size = width * height;
// U and V planes need to be aligned to 2.
let uv_size = ((width + 1) / 2) * ((height + 1) / 2) * 2 * 2;
u_size + uv_size
}
DecodedFormat::I444 => (width * height) * 3,
DecodedFormat::I010 | DecodedFormat::I012 => {
decoded_frame_size(DecodedFormat::I420, width, height) * 2
}
DecodedFormat::I210 | DecodedFormat::I212 => {
let u_size = width * height * 2;
// U and V planes need to be aligned to 2.
let uv_size = ((width + 1) / 2) * ((height + 1) / 2) * 2 * 2;
u_size + uv_size
}
DecodedFormat::I410 | DecodedFormat::I412 => (width * height * 2) * 3,
}
}
/// Instructs on whether it should block on the operation(s).
#[derive(Default, Debug, Clone, Copy, PartialEq, Eq)]
pub enum BlockingMode {
Blocking,
#[default]
NonBlocking,
}
#[cfg(test)]
mod tests {
use super::Fourcc;
const NV12_FOURCC: u32 = 0x3231564E;
#[test]
fn fourcc_u32() {
let fourcc = Fourcc::from(NV12_FOURCC);
let value: u32 = fourcc.into();
assert_eq!(value, NV12_FOURCC);
}
#[test]
fn fourcc_u8_4() {
let fourcc = Fourcc::from(NV12_FOURCC);
let value: [u8; 4] = fourcc.into();
assert_eq!(value, *b"NV12");
}
#[test]
fn fourcc_display() {
let fourcc = Fourcc::from(NV12_FOURCC);
assert_eq!(fourcc.to_string(), "NV12");
}
#[test]
fn fourcc_debug() {
let fourcc = Fourcc::from(NV12_FOURCC);
assert_eq!(format!("{:?}", fourcc), "0x3231564e (NV12)");
}
}