iamf/cli/sample_processor_base.h - platform/external/iamf_tools - Git at Google

 /*
  * Copyright (c) 2024, Alliance for Open Media. All rights reserved
  *
  * This source code is subject to the terms of the BSD 3-Clause Clear License
  * and the Alliance for Open Media Patent License 1.0. If the BSD 3-Clause Clear
  * License was not distributed with this source code in the LICENSE file, you
  * can obtain it at www.aomedia.org/license/software-license/bsd-3-c-c. If the
  * Alliance for Open Media Patent License 1.0 was not distributed with this
  * source code in the PATENTS file, you can obtain it at
  * www.aomedia.org/license/patent.
  */
 #ifndef CLI_SAMPLE_PROCESSOR_BASE_H_
 #define CLI_SAMPLE_PROCESSOR_BASE_H_

 #include <cstddef>
 #include <cstdint>
 #include <vector>

 #include "absl/status/status.h"
 #include "absl/types/span.h"

 namespace iamf_tools {

 /*!\brief Abstract class to process PCM samples.
  *
  * This class represents an abstract interface to reprocess PCM samples. In
  * general, processors could introduce delay or could result in a different
  * number of samples per frame.
  *
  * Usage pattern:
  *   - While input samples are available:
  *     - Call `PushFrame()` to push in samples.
  *     - Call `GetOutputSamplesAsSpan()` to retrieve the samples.
  *   - Call `Flush()` to signal that no more frames will be pushed.
  *   - Call `GetOutputSamplesAsSpan()` one last time to retrieve any remaining
  *     samples.
  *
  *   - Note: Results from `GetOutputSamplesAsSpan()` are invalidated by
  *     further calls to `PushFrame()` or `Flush()`.
  */
 class SampleProcessorBase {
  public:
   /*!\brief Constructor.
    *
    * \param max_input_samples_per_frame Maximum number of samples per frame in
    *        the input timescale.
    * \param num_channels Number of channels. Later calls to `PushFrame()` must
    *        contain this many channels.
    * \param max_output_samples_per_frame Maximum number of samples per frame in
    *        the output timescale.
    */
   SampleProcessorBase(size_t max_input_samples_per_frame, size_t num_channels,
                       size_t max_output_samples_per_frame)
       : max_input_samples_per_frame_(max_input_samples_per_frame),
         num_channels_(num_channels),
         output_time_channel_samples_(max_output_samples_per_frame,
                                      std::vector<int32_t>(num_channels)) {}

   /*!\brief Destructor. */
   virtual ~SampleProcessorBase() = 0;

   /*!\brief Pushes a frame of samples to the processor.
    *
    * \param time_channel_samples Samples to push arranged in (time, channel).
    * \return `absl::OkStatus()` on success. `absl::FailedPreconditionError` if
    *         called after `Flush()`. Other specific statuses on failure.
    */
   absl::Status PushFrame(
       absl::Span<const std::vector<int32_t>> time_channel_samples);

   /*!\brief Signals to close the processor and flush any remaining samples.
    *
    * After calling `Flush()`, it is invalid to call `PushFrame()`
    * or `Flush()` again.
    *
    * \return `absl::OkStatus()` on success. `absl::FailedPreconditionError` if
    *         called after `Flush()`. Other specific statuses on failure.
    */
   absl::Status Flush();

   /*!\brief Gets a span of the output samples.
    *
    * \return Span of the output samples. The span will be invalidated when
    *         `PushFrame()` or `Flush()` is called.
    */
   absl::Span<const std::vector<int32_t>> GetOutputSamplesAsSpan() const;

  protected:
   /*!\brief Pushes a frame of samples to the processor.
    *
    * \param time_channel_samples Samples to push arranged in (time, channel).
    * \return `absl::OkStatus()` on success. A specific status on failure.
    */
   virtual absl::Status PushFrameDerived(
       absl::Span<const std::vector<int32_t>> time_channel_samples) = 0;

   /*!\brief Signals to close the processor and flush any remaining samples.
    *
    * \return `absl::OkStatus()` on success. A specific status on failure.
    */
   virtual absl::Status FlushDerived() = 0;

   const size_t max_input_samples_per_frame_;
   const size_t num_channels_;

   // Stores the output decoded frames arranged in (time, sample) axes. That
   // is to say, each inner vector has one sample for per channel and the outer
   // vector contains one inner vector for each time tick. When the decoded
   // samples is shorter than a frame, only the first `num_valid_ticks_` ticks
   // should be used.
   std::vector<std::vector<int32_t>> output_time_channel_samples_;

   // Number of ticks (time samples) in `output_time_channel_samples_` that are
   // valid.
   size_t num_valid_ticks_ = 0;

  private:
   enum class State {
     kTakingSamples,
     kFlushCalled,
   } state_ = State::kTakingSamples;
 };

 }  // namespace iamf_tools

 #endif  // CLI_SAMPLE_PROCESSOR_BASE_H_
	/*
	* Copyright (c) 2024, Alliance for Open Media. All rights reserved
	*
	* This source code is subject to the terms of the BSD 3-Clause Clear License
	* and the Alliance for Open Media Patent License 1.0. If the BSD 3-Clause Clear
	* License was not distributed with this source code in the LICENSE file, you
	* can obtain it at www.aomedia.org/license/software-license/bsd-3-c-c. If the
	* Alliance for Open Media Patent License 1.0 was not distributed with this
	* source code in the PATENTS file, you can obtain it at
	* www.aomedia.org/license/patent.
	*/
	#ifndef CLI_SAMPLE_PROCESSOR_BASE_H_
	#define CLI_SAMPLE_PROCESSOR_BASE_H_

	#include <cstddef>
	#include <cstdint>
	#include <vector>

	#include "absl/status/status.h"
	#include "absl/types/span.h"

	namespace iamf_tools {

	/*!\brief Abstract class to process PCM samples.
	*
	* This class represents an abstract interface to reprocess PCM samples. In
	* general, processors could introduce delay or could result in a different
	* number of samples per frame.
	*
	* Usage pattern:
	* - While input samples are available:
	* - Call `PushFrame()` to push in samples.
	* - Call `GetOutputSamplesAsSpan()` to retrieve the samples.
	* - Call `Flush()` to signal that no more frames will be pushed.
	* - Call `GetOutputSamplesAsSpan()` one last time to retrieve any remaining
	* samples.
	*
	* - Note: Results from `GetOutputSamplesAsSpan()` are invalidated by
	* further calls to `PushFrame()` or `Flush()`.
	*/
	class SampleProcessorBase {
	public:
	/*!\brief Constructor.
	*
	* \param max_input_samples_per_frame Maximum number of samples per frame in
	* the input timescale.
	* \param num_channels Number of channels. Later calls to `PushFrame()` must
	* contain this many channels.
	* \param max_output_samples_per_frame Maximum number of samples per frame in
	* the output timescale.
	*/
	SampleProcessorBase(size_t max_input_samples_per_frame, size_t num_channels,
	size_t max_output_samples_per_frame)
	: max_input_samples_per_frame_(max_input_samples_per_frame),
	num_channels_(num_channels),
	output_time_channel_samples_(max_output_samples_per_frame,
	std::vector<int32_t>(num_channels)) {}

	/!\brief Destructor. /
	virtual ~SampleProcessorBase() = 0;

	/*!\brief Pushes a frame of samples to the processor.
	*
	* \param time_channel_samples Samples to push arranged in (time, channel).
	* \return `absl::OkStatus()` on success. `absl::FailedPreconditionError` if
	* called after `Flush()`. Other specific statuses on failure.
	*/
	absl::Status PushFrame(
	absl::Span<const std::vector<int32_t>> time_channel_samples);

	/*!\brief Signals to close the processor and flush any remaining samples.
	*
	* After calling `Flush()`, it is invalid to call `PushFrame()`
	* or `Flush()` again.
	*
	* \return `absl::OkStatus()` on success. `absl::FailedPreconditionError` if
	* called after `Flush()`. Other specific statuses on failure.
	*/
	absl::Status Flush();

	/*!\brief Gets a span of the output samples.
	*
	* \return Span of the output samples. The span will be invalidated when
	* `PushFrame()` or `Flush()` is called.
	*/
	absl::Span<const std::vector<int32_t>> GetOutputSamplesAsSpan() const;

	protected:
	/*!\brief Pushes a frame of samples to the processor.
	*
	* \param time_channel_samples Samples to push arranged in (time, channel).
	* \return `absl::OkStatus()` on success. A specific status on failure.
	*/
	virtual absl::Status PushFrameDerived(
	absl::Span<const std::vector<int32_t>> time_channel_samples) = 0;

	/*!\brief Signals to close the processor and flush any remaining samples.
	*
	* \return `absl::OkStatus()` on success. A specific status on failure.
	*/
	virtual absl::Status FlushDerived() = 0;

	const size_t max_input_samples_per_frame_;
	const size_t num_channels_;

	// Stores the output decoded frames arranged in (time, sample) axes. That
	// is to say, each inner vector has one sample for per channel and the outer
	// vector contains one inner vector for each time tick. When the decoded
	// samples is shorter than a frame, only the first `num_valid_ticks_` ticks
	// should be used.
	std::vector<std::vector<int32_t>> output_time_channel_samples_;

	// Number of ticks (time samples) in `output_time_channel_samples_` that are
	// valid.
	size_t num_valid_ticks_ = 0;

	private:
	enum class State {
	kTakingSamples,
	kFlushCalled,
	} state_ = State::kTakingSamples;
	};

	} // namespace iamf_tools

	#endif // CLI_SAMPLE_PROCESSOR_BASE_H_