iamf/cli/temporal_unit_view.cc - platform/external/iamf_tools - Git at Google

 /*
  * Copyright (c) 2025, Alliance for Open Media. All rights reserved
  *
  * This source code is subject to the terms of the BSD 3-Clause Clear License
  * and the Alliance for Open Media Patent License 1.0. If the BSD 3-Clause Clear
  * License was not distributed with this source code in the LICENSE file, you
  * can obtain it at www.aomedia.org/license/software-license/bsd-3-c-c. If the
  * Alliance for Open Media Patent License 1.0 was not distributed with this
  * source code in the PATENTS file, you can obtain it at
  * www.aomedia.org/license/patent.
  */

 #include "iamf/cli/temporal_unit_view.h"

 #include <cstdint>
 #include <functional>
 #include <optional>
 #include <utility>
 #include <vector>

 #include "absl/algorithm/container.h"
 #include "absl/container/flat_hash_set.h"
 #include "absl/log/check.h"
 #include "absl/log/log.h"
 #include "absl/status/status.h"
 #include "absl/status/statusor.h"
 #include "absl/strings/string_view.h"
 #include "absl/types/span.h"
 #include "iamf/cli/audio_frame_with_data.h"
 #include "iamf/cli/parameter_block_with_data.h"
 #include "iamf/common/utils/macros.h"
 #include "iamf/common/utils/validation_utils.h"
 #include "iamf/obu/arbitrary_obu.h"
 #include "iamf/obu/types.h"

 namespace iamf_tools {

 namespace {

 // Common statistics about a temporal unit.
 struct TemporalUnitStatistics {
   uint32_t num_samples_per_frame;
   uint32_t num_samples_to_trim_at_end;
   uint32_t num_samples_to_trim_at_start;
   uint32_t num_untrimmed_samples;
   InternalTimestamp start_timestamp;
   InternalTimestamp end_timestamp;
 };

 absl::StatusOr<TemporalUnitStatistics> ComputeTemporalUnitStatistics(
     const AudioFrameWithData* first_audio_frame) {
   RETURN_IF_NOT_OK(ValidateNotNull(first_audio_frame, "`audio_frames`"));
   RETURN_IF_NOT_OK(ValidateNotNull(first_audio_frame->audio_element_with_data,
                                    "`audio_frame.audio_element_with_data`"));
   RETURN_IF_NOT_OK(
       ValidateNotNull(first_audio_frame->audio_element_with_data->codec_config,
                       "`audio_frame.audio_element_with_data.codec_config`"));
   TemporalUnitStatistics statistics{
       .num_samples_per_frame = first_audio_frame->audio_element_with_data
                                    ->codec_config->GetNumSamplesPerFrame(),
       .num_samples_to_trim_at_end =
           first_audio_frame->obu.header_.num_samples_to_trim_at_end,
       .num_samples_to_trim_at_start =
           first_audio_frame->obu.header_.num_samples_to_trim_at_start,
       .start_timestamp = first_audio_frame->start_timestamp,
       .end_timestamp = first_audio_frame->end_timestamp,
   };

   // Check the trim in the first frame is plausible. I.e. there are not at least
   // 0 samples. This also prevents underflow when subtracting later.
   const uint32_t cumulative_trim = statistics.num_samples_to_trim_at_start +
                                    statistics.num_samples_to_trim_at_end;
   RETURN_IF_NOT_OK(Validate(cumulative_trim, std::less_equal<uint32_t>(),
                             statistics.num_samples_per_frame,
                             "cumulative trim is <= `num_samples_per_frame`"));
   statistics.num_untrimmed_samples =
       statistics.num_samples_per_frame - cumulative_trim;

   return statistics;
 }

 absl::Status ValidateAllParameterBlocksMatchStatistics(
     absl::Span<const ParameterBlockWithData* const> parameter_blocks,
     const TemporalUnitStatistics& statistics) {
   absl::flat_hash_set<uint32_t> seen_parameter_ids;
   for (const auto* parameter_block : parameter_blocks) {
     RETURN_IF_NOT_OK(ValidateNotNull(parameter_block, "`parameter_block`"));
     const auto& [unused_iter, inserted] =
         seen_parameter_ids.insert(parameter_block->obu->parameter_id_);
     if (!inserted) {
       return absl::InvalidArgumentError(
           "A temporal unit must not have multiple parameter blocks with the "
           "same parameter ID.");
     }

     RETURN_IF_NOT_OK(ValidateEqual(
         parameter_block->start_timestamp, statistics.start_timestamp,
         "`start_timestamp` must be the same for all parameter blocks"));
     RETURN_IF_NOT_OK(ValidateEqual(
         parameter_block->end_timestamp, statistics.end_timestamp,
         "`end_timestamp` must be the same for all parameter blocks"));
   }
   return absl::OkStatus();
 }

 absl::Status ValidateAllAudioFramesMatchStatistics(
     absl::Span<const AudioFrameWithData* const> audio_frames,
     const TemporalUnitStatistics& statistics) {
   absl::flat_hash_set<uint32_t> seen_substream_ids;
   for (const auto* audio_frame : audio_frames) {
     RETURN_IF_NOT_OK(ValidateNotNull(audio_frame, "`audio_frame`"));
     const auto& [unused_iter, inserted] =
         seen_substream_ids.insert(audio_frame->obu.GetSubstreamId());
     if (!inserted) {
       return absl::InvalidArgumentError(
           "A temporal unit must not have multiple audio with the same "
           "substream ID.");
     }

     RETURN_IF_NOT_OK(ValidateNotNull(audio_frame->audio_element_with_data,
                                      "`audio_frame.audio_element_with_data`"));
     RETURN_IF_NOT_OK(
         ValidateNotNull(audio_frame->audio_element_with_data->codec_config,
                         "`audio_frame.audio_element_with_data.codec_config`"));
     RETURN_IF_NOT_OK(ValidateEqual(
         audio_frame->obu.header_.num_samples_to_trim_at_end,
         statistics.num_samples_to_trim_at_end,
         "`num_samples_to_trim_at_end` must be the same for all audio frames"));
     RETURN_IF_NOT_OK(
         ValidateEqual(audio_frame->obu.header_.num_samples_to_trim_at_start,
                       statistics.num_samples_to_trim_at_start,
                       "`num_samples_to_trim_at_start` must be the same for all "
                       "audio frames"));
     RETURN_IF_NOT_OK(ValidateEqual(
         audio_frame->start_timestamp, statistics.start_timestamp,
         "`start_timestamp` must be the same for all audio frames"));
     RETURN_IF_NOT_OK(
         ValidateEqual(audio_frame->end_timestamp, statistics.end_timestamp,
                       "`end_timestamp` must be the same for all audio frames"));
   }
   return absl::OkStatus();
 }

 absl::Status ValidateAllArbitraryObusMatchStatistics(
     absl::Span<const ArbitraryObu* const> arbitrary_obus,
     const TemporalUnitStatistics& statistics) {
   for (const auto* arbitrary_obu : arbitrary_obus) {
     RETURN_IF_NOT_OK(ValidateNotNull(arbitrary_obu, "`arbitrary_obu`"));
     RETURN_IF_NOT_OK(ValidateEqual(
         *arbitrary_obu->insertion_tick_,
         static_cast<int64_t>(statistics.start_timestamp),
         "`insertion_tick` must be the same for  all arbitrary OBUs"));
   }
   return absl::OkStatus();
 }

 bool CompareParameterId(const ParameterBlockWithData* a,
                         const ParameterBlockWithData* b) {
   // These were sanitized elsewhere in the class.
   CHECK_NE(a, nullptr);
   CHECK_NE(b, nullptr);
   return a->obu->parameter_id_ < b->obu->parameter_id_;
 }

 bool CompareAudioElementIdAudioSubstreamId(const AudioFrameWithData* a,
                                            const AudioFrameWithData* b) {
   // These were sanitized elsewhere in the class.
   CHECK_NE(a, nullptr);
   CHECK_NE(a->audio_element_with_data, nullptr);
   CHECK_NE(b, nullptr);
   CHECK_NE(b->audio_element_with_data, nullptr);
   CHECK_NE(b, nullptr);
   if (a->audio_element_with_data->obu.GetAudioElementId() !=
       b->audio_element_with_data->obu.GetAudioElementId()) {
     return a->audio_element_with_data->obu.GetAudioElementId() <
            b->audio_element_with_data->obu.GetAudioElementId();
   }
   return a->obu.GetSubstreamId() < b->obu.GetSubstreamId();
 }

 }  // namespace

 absl::StatusOr<TemporalUnitView> TemporalUnitView::CreateFromPointers(
     absl::Span<const ParameterBlockWithData* const> parameter_blocks,
     absl::Span<const AudioFrameWithData* const> audio_frames,
     absl::Span<const ArbitraryObu* const> arbitrary_obus) {
   if (audio_frames.empty()) {
     // Exit early even when `IGNORE_ERRORS_USE_ONLY_FOR_IAMF_TEST_SUITE` is set.
     return absl::InvalidArgumentError(
         "Every temporal unit must have an audio frame.");
   }

   // Infer some statistics based on the first audio frame
   const auto statistics = ComputeTemporalUnitStatistics(*audio_frames.begin());
   if (!statistics.ok()) {
     return statistics.status();
   }

   // Check that all OBUs agree with the statistics.  All frames must have the
   // same trimming information and timestamps as of IAMF v1.1.0.
   RETURN_IF_NOT_OK(
       ValidateAllAudioFramesMatchStatistics(audio_frames, *statistics));
   RETURN_IF_NOT_OK(
       ValidateAllParameterBlocksMatchStatistics(parameter_blocks, *statistics));
   RETURN_IF_NOT_OK(
       ValidateAllArbitraryObusMatchStatistics(arbitrary_obus, *statistics));

   // Sort the OBUS into a canonical order.
   // TODO(b/332956880): Support a custom ordering of parameter blocks and
   // substreams.
   std::vector<const ParameterBlockWithData*> sorted_parameter_blocks(
       parameter_blocks.begin(), parameter_blocks.end());
   std::vector<const AudioFrameWithData*> sorted_audio_frames(
       audio_frames.begin(), audio_frames.end());
   std::vector<const ArbitraryObu*> copied_arbitrary_obus(arbitrary_obus.begin(),
                                                          arbitrary_obus.end());
   absl::c_sort(sorted_parameter_blocks, CompareParameterId);
   absl::c_sort(sorted_audio_frames, CompareAudioElementIdAudioSubstreamId);
   return TemporalUnitView(
       std::move(sorted_parameter_blocks), std::move(sorted_audio_frames),
       std::move(copied_arbitrary_obus), statistics->start_timestamp,
       statistics->end_timestamp, statistics->num_samples_to_trim_at_start,
       statistics->num_untrimmed_samples);
 }

 TemporalUnitView::TemporalUnitView(
     std::vector<const ParameterBlockWithData*>&& parameter_blocks,
     std::vector<const AudioFrameWithData*>&& audio_frames,
     std::vector<const ArbitraryObu*>&& arbitrary_obus,
     InternalTimestamp start_timestamp, InternalTimestamp end_timestamp,
     uint32_t num_samples_to_trim_at_start, uint32_t num_untrimmed_samples)
     : parameter_blocks_(std::move(parameter_blocks)),
       audio_frames_(std::move(audio_frames)),
       arbitrary_obus_(std::move(arbitrary_obus)),
       start_timestamp_(start_timestamp),
       end_timestamp_(end_timestamp),
       num_samples_to_trim_at_start_(num_samples_to_trim_at_start),
       num_untrimmed_samples_(num_untrimmed_samples) {}

 }  // namespace iamf_tools
	/*
	* Copyright (c) 2025, Alliance for Open Media. All rights reserved
	*
	* This source code is subject to the terms of the BSD 3-Clause Clear License
	* and the Alliance for Open Media Patent License 1.0. If the BSD 3-Clause Clear
	* License was not distributed with this source code in the LICENSE file, you
	* can obtain it at www.aomedia.org/license/software-license/bsd-3-c-c. If the
	* Alliance for Open Media Patent License 1.0 was not distributed with this
	* source code in the PATENTS file, you can obtain it at
	* www.aomedia.org/license/patent.
	*/

	#include "iamf/cli/temporal_unit_view.h"

	#include <cstdint>
	#include <functional>
	#include <optional>
	#include <utility>
	#include <vector>

	#include "absl/algorithm/container.h"
	#include "absl/container/flat_hash_set.h"
	#include "absl/log/check.h"
	#include "absl/log/log.h"
	#include "absl/status/status.h"
	#include "absl/status/statusor.h"
	#include "absl/strings/string_view.h"
	#include "absl/types/span.h"
	#include "iamf/cli/audio_frame_with_data.h"
	#include "iamf/cli/parameter_block_with_data.h"
	#include "iamf/common/utils/macros.h"
	#include "iamf/common/utils/validation_utils.h"
	#include "iamf/obu/arbitrary_obu.h"
	#include "iamf/obu/types.h"

	namespace iamf_tools {

	namespace {

	// Common statistics about a temporal unit.
	struct TemporalUnitStatistics {
	uint32_t num_samples_per_frame;
	uint32_t num_samples_to_trim_at_end;
	uint32_t num_samples_to_trim_at_start;
	uint32_t num_untrimmed_samples;
	InternalTimestamp start_timestamp;
	InternalTimestamp end_timestamp;
	};

	absl::StatusOr<TemporalUnitStatistics> ComputeTemporalUnitStatistics(
	const AudioFrameWithData* first_audio_frame) {
	RETURN_IF_NOT_OK(ValidateNotNull(first_audio_frame, "`audio_frames`"));
	RETURN_IF_NOT_OK(ValidateNotNull(first_audio_frame->audio_element_with_data,
	"`audio_frame.audio_element_with_data`"));
	RETURN_IF_NOT_OK(
	ValidateNotNull(first_audio_frame->audio_element_with_data->codec_config,
	"`audio_frame.audio_element_with_data.codec_config`"));
	TemporalUnitStatistics statistics{
	.num_samples_per_frame = first_audio_frame->audio_element_with_data
	->codec_config->GetNumSamplesPerFrame(),
	.num_samples_to_trim_at_end =
	first_audio_frame->obu.header_.num_samples_to_trim_at_end,
	.num_samples_to_trim_at_start =
	first_audio_frame->obu.header_.num_samples_to_trim_at_start,
	.start_timestamp = first_audio_frame->start_timestamp,
	.end_timestamp = first_audio_frame->end_timestamp,
	};

	// Check the trim in the first frame is plausible. I.e. there are not at least
	// 0 samples. This also prevents underflow when subtracting later.
	const uint32_t cumulative_trim = statistics.num_samples_to_trim_at_start +
	statistics.num_samples_to_trim_at_end;
	RETURN_IF_NOT_OK(Validate(cumulative_trim, std::less_equal<uint32_t>(),
	statistics.num_samples_per_frame,
	"cumulative trim is <= `num_samples_per_frame`"));
	statistics.num_untrimmed_samples =
	statistics.num_samples_per_frame - cumulative_trim;

	return statistics;
	}

	absl::Status ValidateAllParameterBlocksMatchStatistics(
	absl::Span<const ParameterBlockWithData* const> parameter_blocks,
	const TemporalUnitStatistics& statistics) {
	absl::flat_hash_set<uint32_t> seen_parameter_ids;
	for (const auto* parameter_block : parameter_blocks) {
	RETURN_IF_NOT_OK(ValidateNotNull(parameter_block, "`parameter_block`"));
	const auto& [unused_iter, inserted] =
	seen_parameter_ids.insert(parameter_block->obu->parameter_id_);
	if (!inserted) {
	return absl::InvalidArgumentError(
	"A temporal unit must not have multiple parameter blocks with the "
	"same parameter ID.");
	}

	RETURN_IF_NOT_OK(ValidateEqual(
	parameter_block->start_timestamp, statistics.start_timestamp,
	"`start_timestamp` must be the same for all parameter blocks"));
	RETURN_IF_NOT_OK(ValidateEqual(
	parameter_block->end_timestamp, statistics.end_timestamp,
	"`end_timestamp` must be the same for all parameter blocks"));
	}
	return absl::OkStatus();
	}

	absl::Status ValidateAllAudioFramesMatchStatistics(
	absl::Span<const AudioFrameWithData* const> audio_frames,
	const TemporalUnitStatistics& statistics) {
	absl::flat_hash_set<uint32_t> seen_substream_ids;
	for (const auto* audio_frame : audio_frames) {
	RETURN_IF_NOT_OK(ValidateNotNull(audio_frame, "`audio_frame`"));
	const auto& [unused_iter, inserted] =
	seen_substream_ids.insert(audio_frame->obu.GetSubstreamId());
	if (!inserted) {
	return absl::InvalidArgumentError(
	"A temporal unit must not have multiple audio with the same "
	"substream ID.");
	}

	RETURN_IF_NOT_OK(ValidateNotNull(audio_frame->audio_element_with_data,
	"`audio_frame.audio_element_with_data`"));
	RETURN_IF_NOT_OK(
	ValidateNotNull(audio_frame->audio_element_with_data->codec_config,
	"`audio_frame.audio_element_with_data.codec_config`"));
	RETURN_IF_NOT_OK(ValidateEqual(
	audio_frame->obu.header_.num_samples_to_trim_at_end,
	statistics.num_samples_to_trim_at_end,
	"`num_samples_to_trim_at_end` must be the same for all audio frames"));
	RETURN_IF_NOT_OK(
	ValidateEqual(audio_frame->obu.header_.num_samples_to_trim_at_start,
	statistics.num_samples_to_trim_at_start,
	"`num_samples_to_trim_at_start` must be the same for all "
	"audio frames"));
	RETURN_IF_NOT_OK(ValidateEqual(
	audio_frame->start_timestamp, statistics.start_timestamp,
	"`start_timestamp` must be the same for all audio frames"));
	RETURN_IF_NOT_OK(
	ValidateEqual(audio_frame->end_timestamp, statistics.end_timestamp,
	"`end_timestamp` must be the same for all audio frames"));
	}
	return absl::OkStatus();
	}

	absl::Status ValidateAllArbitraryObusMatchStatistics(
	absl::Span<const ArbitraryObu* const> arbitrary_obus,
	const TemporalUnitStatistics& statistics) {
	for (const auto* arbitrary_obu : arbitrary_obus) {
	RETURN_IF_NOT_OK(ValidateNotNull(arbitrary_obu, "`arbitrary_obu`"));
	RETURN_IF_NOT_OK(ValidateEqual(
	*arbitrary_obu->insertion_tick_,
	static_cast<int64_t>(statistics.start_timestamp),
	"`insertion_tick` must be the same for all arbitrary OBUs"));
	}
	return absl::OkStatus();
	}

	bool CompareParameterId(const ParameterBlockWithData* a,
	const ParameterBlockWithData* b) {
	// These were sanitized elsewhere in the class.
	CHECK_NE(a, nullptr);
	CHECK_NE(b, nullptr);
	return a->obu->parameter_id_ < b->obu->parameter_id_;
	}

	bool CompareAudioElementIdAudioSubstreamId(const AudioFrameWithData* a,
	const AudioFrameWithData* b) {
	// These were sanitized elsewhere in the class.
	CHECK_NE(a, nullptr);
	CHECK_NE(a->audio_element_with_data, nullptr);
	CHECK_NE(b, nullptr);
	CHECK_NE(b->audio_element_with_data, nullptr);
	CHECK_NE(b, nullptr);
	if (a->audio_element_with_data->obu.GetAudioElementId() !=
	b->audio_element_with_data->obu.GetAudioElementId()) {
	return a->audio_element_with_data->obu.GetAudioElementId() <
	b->audio_element_with_data->obu.GetAudioElementId();
	}
	return a->obu.GetSubstreamId() < b->obu.GetSubstreamId();
	}

	} // namespace

	absl::StatusOr<TemporalUnitView> TemporalUnitView::CreateFromPointers(
	absl::Span<const ParameterBlockWithData* const> parameter_blocks,
	absl::Span<const AudioFrameWithData* const> audio_frames,
	absl::Span<const ArbitraryObu* const> arbitrary_obus) {
	if (audio_frames.empty()) {
	// Exit early even when `IGNORE_ERRORS_USE_ONLY_FOR_IAMF_TEST_SUITE` is set.
	return absl::InvalidArgumentError(
	"Every temporal unit must have an audio frame.");
	}

	// Infer some statistics based on the first audio frame
	const auto statistics = ComputeTemporalUnitStatistics(*audio_frames.begin());
	if (!statistics.ok()) {
	return statistics.status();
	}

	// Check that all OBUs agree with the statistics. All frames must have the
	// same trimming information and timestamps as of IAMF v1.1.0.
	RETURN_IF_NOT_OK(
	ValidateAllAudioFramesMatchStatistics(audio_frames, *statistics));
	RETURN_IF_NOT_OK(
	ValidateAllParameterBlocksMatchStatistics(parameter_blocks, *statistics));
	RETURN_IF_NOT_OK(
	ValidateAllArbitraryObusMatchStatistics(arbitrary_obus, *statistics));

	// Sort the OBUS into a canonical order.
	// TODO(b/332956880): Support a custom ordering of parameter blocks and
	// substreams.
	std::vector<const ParameterBlockWithData*> sorted_parameter_blocks(
	parameter_blocks.begin(), parameter_blocks.end());
	std::vector<const AudioFrameWithData*> sorted_audio_frames(
	audio_frames.begin(), audio_frames.end());
	std::vector<const ArbitraryObu*> copied_arbitrary_obus(arbitrary_obus.begin(),
	arbitrary_obus.end());
	absl::c_sort(sorted_parameter_blocks, CompareParameterId);
	absl::c_sort(sorted_audio_frames, CompareAudioElementIdAudioSubstreamId);
	return TemporalUnitView(
	std::move(sorted_parameter_blocks), std::move(sorted_audio_frames),
	std::move(copied_arbitrary_obus), statistics->start_timestamp,
	statistics->end_timestamp, statistics->num_samples_to_trim_at_start,
	statistics->num_untrimmed_samples);
	}

	TemporalUnitView::TemporalUnitView(
	std::vector<const ParameterBlockWithData*>&& parameter_blocks,
	std::vector<const AudioFrameWithData*>&& audio_frames,
	std::vector<const ArbitraryObu*>&& arbitrary_obus,
	InternalTimestamp start_timestamp, InternalTimestamp end_timestamp,
	uint32_t num_samples_to_trim_at_start, uint32_t num_untrimmed_samples)
	: parameter_blocks_(std::move(parameter_blocks)),
	audio_frames_(std::move(audio_frames)),
	arbitrary_obus_(std::move(arbitrary_obus)),
	start_timestamp_(start_timestamp),
	end_timestamp_(end_timestamp),
	num_samples_to_trim_at_start_(num_samples_to_trim_at_start),
	num_untrimmed_samples_(num_untrimmed_samples) {}

	} // namespace iamf_tools