blob: 0499e709dce8a69f7763ee5a4f2d0d4be3412d57 [file] [log] [blame]
// Copyright 2022 The Chromium Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
//#define LOG_NDEBUG 0
#define LOG_TAG "NalParser"
#include <v4l2_codec2/common/HEVCNalParser.h>
#include <algorithm>
#include <media/stagefright/foundation/ABitReader.h>
#include <utils/Log.h>
namespace android {
namespace {
constexpr uint32_t kMaxShortTermRefPicSets = 64;
struct StRefPicSet {
// Syntax elements.
int numNegativePics;
int numPositivePics;
int deltaPocS0[kMaxShortTermRefPicSets];
int deltaPocS1[kMaxShortTermRefPicSets];
// Calculated fields.
int numDeltaPocs;
};
// Skip an HEVC ProfileTierLevel in the specified bitstream.
bool skipProfileTierLevel(ABitReader* br, uint32_t spsMaxSublayersMinus1) {
// general_profile_space(2), general_tier_flag(1), general_profile_idc(5),
// general_profile_compatibility_flag(32), general_progressive_source_flag(1),
// general_interlaced_source_flag(1), general_non_packed_constraint_flag(1),
// general_frame_only_constraint_flag(1), compatibility_flags(43), general_inbld_flag(1),
// general_level_idc(8)
br->skipBits(96);
if (spsMaxSublayersMinus1 > 6) return false;
uint32_t subLayerProfilePresentFlag[6];
uint32_t subLayerLevelPresentFlag[6];
for (uint32_t i = 0; i < spsMaxSublayersMinus1; ++i) {
if (!br->getBitsGraceful(1, &subLayerProfilePresentFlag[i])) return false;
if (!br->getBitsGraceful(1, &subLayerLevelPresentFlag[i])) return false;
}
if (spsMaxSublayersMinus1 > 0) {
br->skipBits(2 * (8 - spsMaxSublayersMinus1));
}
for (uint32_t i = 0; i < spsMaxSublayersMinus1; ++i) {
if (subLayerProfilePresentFlag[i]) {
// sub_layer_profile_space(2), sub_layer_tier_flag(1), sub_layer_profile_idc(5),
// sub_layer_profile_compatibility_flag(32), sub_layer_progressive_source_flag(1),
// sub_layer_interlaced_source_flag(1), sub_layer_non_packed_constraint_flag(1),
// sub_layer_frame_only_constraint_flag(1), compatibility_flags(43),
// sub_layer_inbld_flag(1)
br->skipBits(88);
}
if (subLayerLevelPresentFlag[i]) {
br->skipBits(8); // sub_layer_level_idc
}
}
return true;
}
// Skip an HEVC ScalingListData in the specified bitstream.
bool skipScalingListData(ABitReader* br) {
for (int sizeId = 0; sizeId < 4; ++sizeId) {
for (int matrixId = 0; matrixId < 6; matrixId += (sizeId == 3) ? 3 : 1) {
uint32_t scalingListPredModeFlag;
if (!br->getBitsGraceful(1, &scalingListPredModeFlag)) return false;
if (!scalingListPredModeFlag) {
uint32_t unused;
NalParser::parseUE(br, &unused); // scaling_list_pred_matrix_id_delta
} else {
int32_t unused;
if (sizeId > 1)
NalParser::parseSE(br, &unused); // scaling_list_dc_coef_16x16 or 32x32
int coefNum = std::min(64, (1 << (4 + (sizeId << 1))));
for (int i = 0; i < coefNum; ++i)
NalParser::parseSE(br, &unused); // scaling_list_delta_coef
}
}
}
return true;
}
// Skip an HEVC StRefPicSet in the specified bitstream.
bool skipStRefPicSet(ABitReader* br, uint32_t stRpsIdx, uint32_t numShortTermRefPicSets,
StRefPicSet* allRefPicSets, StRefPicSet* currRefPicSet) {
uint32_t interRefPicSetPredictionFlag = 0;
if (stRpsIdx != 0) {
if (!br->getBitsGraceful(1, &interRefPicSetPredictionFlag)) return false;
}
if (interRefPicSetPredictionFlag) {
uint32_t deltaIdxMinus1 = 0;
if (stRpsIdx == numShortTermRefPicSets) {
if (!NalParser::parseUE(br, &deltaIdxMinus1)) return false;
if (deltaIdxMinus1 + 1 > stRpsIdx) {
ALOGW("deltaIdxMinus1 is out of range");
return false;
}
}
int refRpsIdx = stRpsIdx - (static_cast<int>(deltaIdxMinus1) + 1);
uint32_t deltaRpsSign;
uint32_t absDeltaRpsMinus1;
if (!br->getBitsGraceful(1, &deltaRpsSign)) return false;
if (!NalParser::parseUE(br, &absDeltaRpsMinus1)) return false;
int deltaRps = (1 - 2 * static_cast<int>(deltaRpsSign)) *
(static_cast<int>(absDeltaRpsMinus1) + 1);
const StRefPicSet& refSet = allRefPicSets[refRpsIdx];
uint32_t useDeltaFlag[kMaxShortTermRefPicSets];
// useDeltaFlag defaults to 1 if not present.
std::fill_n(useDeltaFlag, kMaxShortTermRefPicSets, 1);
for (int j = 0; j <= refSet.numDeltaPocs; j++) {
uint32_t usedByCurrPicFlag;
if (!br->getBitsGraceful(1, &usedByCurrPicFlag)) return false;
if (!usedByCurrPicFlag)
if (!br->getBitsGraceful(1, &useDeltaFlag[j])) return false;
}
int i = 0;
for (int j = refSet.numPositivePics - 1; j >= 0; --j) {
int dPoc = refSet.deltaPocS1[j] + deltaRps;
if (dPoc < 0 && useDeltaFlag[refSet.numNegativePics + j])
currRefPicSet->deltaPocS0[i++] = dPoc;
}
if (deltaRps < 0 && useDeltaFlag[refSet.numDeltaPocs]) {
currRefPicSet->deltaPocS0[i++] = deltaRps;
}
for (int j = 0; j < refSet.numNegativePics; ++j) {
int dPoc = refSet.deltaPocS0[j] + deltaRps;
if (dPoc < 0 && useDeltaFlag[j]) currRefPicSet->deltaPocS0[i++] = dPoc;
}
currRefPicSet->numNegativePics = i;
i = 0;
for (int j = refSet.numNegativePics - 1; j >= 0; --j) {
int dPoc = refSet.deltaPocS0[j] + deltaRps;
if (dPoc > 0 && useDeltaFlag[j]) currRefPicSet->deltaPocS1[i++] = dPoc;
}
if (deltaRps > 0 && useDeltaFlag[refSet.numDeltaPocs])
currRefPicSet->deltaPocS1[i++] = deltaRps;
for (int j = 0; j < refSet.numPositivePics; ++j) {
int dPoc = refSet.deltaPocS1[j] + deltaRps;
if (dPoc > 0 && useDeltaFlag[refSet.numNegativePics + j])
currRefPicSet->deltaPocS1[i++] = dPoc;
}
currRefPicSet->numPositivePics = i;
} else {
uint32_t uintForRead;
if (!NalParser::parseUE(br, &uintForRead)) return false;
currRefPicSet->numNegativePics = static_cast<int>(uintForRead);
if (!NalParser::parseUE(br, &uintForRead)) return false;
currRefPicSet->numPositivePics = static_cast<int>(uintForRead);
if (currRefPicSet->numNegativePics > kMaxShortTermRefPicSets ||
currRefPicSet->numPositivePics > kMaxShortTermRefPicSets) {
ALOGW("num_negative_pics or num_positive_pics is out of range");
return false;
}
for (int i = 0; i < currRefPicSet->numNegativePics; ++i) {
uint32_t deltaPocS0Minus1;
if (!NalParser::parseUE(br, &deltaPocS0Minus1)) return false;
if (i == 0) {
currRefPicSet->deltaPocS0[i] = -(static_cast<int>(deltaPocS0Minus1) + 1);
} else {
currRefPicSet->deltaPocS0[i] =
currRefPicSet->deltaPocS0[i - 1] - (static_cast<int>(deltaPocS0Minus1) + 1);
}
br->skipBits(1); // used_by_curr_pic_s0
}
for (int i = 0; i < currRefPicSet->numPositivePics; ++i) {
uint32_t deltaPocS1Minus1;
if (!NalParser::parseUE(br, &deltaPocS1Minus1)) return false;
if (i == 0) {
currRefPicSet->deltaPocS1[i] = static_cast<int>(deltaPocS1Minus1) + 1;
} else {
currRefPicSet->deltaPocS1[i] =
currRefPicSet->deltaPocS1[i - 1] + static_cast<int>(deltaPocS1Minus1) + 1;
}
br->skipBits(1); // used_by_curr_pic_s1
}
}
currRefPicSet->numDeltaPocs = currRefPicSet->numNegativePics + currRefPicSet->numPositivePics;
if (currRefPicSet->numDeltaPocs > kMaxShortTermRefPicSets) {
ALOGW("numDeltaPocs is out of range");
return false;
}
return true;
}
} // namespace
HEVCNalParser::HEVCNalParser(const uint8_t* data, size_t length) : NalParser(data, length) {}
bool HEVCNalParser::locateSPS() {
while (locateNextNal()) {
if (length() == 0) continue;
if (type() != kSPSType) continue;
return true;
}
return false;
}
uint8_t HEVCNalParser::type() const {
// First bit is forbidden_zero_bit, next 6 are nal_unit_type
constexpr uint8_t kNALTypeMask = 0x7e;
return (*mCurrNalDataPos & kNALTypeMask) >> 1;
}
bool HEVCNalParser::findCodedColorAspects(ColorAspects* colorAspects) {
ALOG_ASSERT(colorAspects);
ALOG_ASSERT(type() == kSPSType);
// Unfortunately we can't directly jump to the Video Usability Information (VUI) parameters that
// contain the color aspects. We need to parse the entire SPS header up until the values we
// need.
// Skip first 2 bytes for the NALU header.
if (length() <= 2) return false;
NALBitReader br(mCurrNalDataPos + 2, length() - 2);
br.skipBits(4); // sps_video_parameter_set_id
uint32_t spsMaxSublayersMinus1;
if (!br.getBitsGraceful(3, &spsMaxSublayersMinus1)) return false;
br.skipBits(1); // sps_temporal_id_nesting_flag
if (!skipProfileTierLevel(&br, spsMaxSublayersMinus1)) return false;
uint32_t unused;
parseUE(&br, &unused); // sps_seq_parameter_set_id
uint32_t chromaFormatIdc;
if (!parseUE(&br, &chromaFormatIdc)) return false;
if (chromaFormatIdc == 3) br.skipBits(1); // separate_colour_plane_flag
parseUE(&br, &unused); // pic_width_in_luma_samples
parseUE(&br, &unused); // pic_height_in_luma_samples
uint32_t conformanceWindowFlag;
if (!br.getBitsGraceful(1, &conformanceWindowFlag)) return false;
if (conformanceWindowFlag) {
parseUE(&br, &unused); // conf_win_left_offset
parseUE(&br, &unused); // conf_win_right_offset
parseUE(&br, &unused); // conf_win_top_offset
parseUE(&br, &unused); // conf_win_bottom_offset
}
parseUE(&br, &unused); // bit_depth_luma_minus8
parseUE(&br, &unused); // bit_depth_chroma_minus8
uint32_t log2MaxPicOrderCntLsbMinus4;
if (!parseUE(&br, &log2MaxPicOrderCntLsbMinus4)) return false;
uint32_t spsSubLayerOrderingInfoPresentFlag;
if (!br.getBitsGraceful(1, &spsSubLayerOrderingInfoPresentFlag)) return false;
for (uint32_t i = spsSubLayerOrderingInfoPresentFlag ? 0 : spsMaxSublayersMinus1;
i <= spsMaxSublayersMinus1; ++i) {
parseUE(&br, &unused); // sps_max_dec_pic_buffering_minus1
parseUE(&br, &unused); // sps_max_num_reorder_pics
parseUE(&br, &unused); // sps_max_latency_increase_plus1
}
parseUE(&br, &unused); // log2_min_luma_coding_block_size_minus3
parseUE(&br, &unused); // log2_diff_max_min_luma_coding_block_size
parseUE(&br, &unused); // log2_min_luma_transform_block_size_minus2
parseUE(&br, &unused); // log2_diff_max_min_luma_transform_block_size
parseUE(&br, &unused); // max_transform_hierarchy_depth_inter
parseUE(&br, &unused); // max_transform_hierarchy_depth_intra
uint32_t scalingListEnabledFlag;
if (!br.getBitsGraceful(1, &scalingListEnabledFlag)) return false;
if (scalingListEnabledFlag) {
uint32_t spsScalingListDataPresentFlag;
if (!br.getBitsGraceful(1, &spsScalingListDataPresentFlag)) return false;
if (spsScalingListDataPresentFlag) {
if (!skipScalingListData(&br)) return false;
}
}
br.skipBits(2); // amp_enabled_flag(1), sample_adaptive_offset_enabled_flag(1)
uint32_t pcmEnabledFlag;
if (!br.getBitsGraceful(1, &pcmEnabledFlag)) return false;
if (pcmEnabledFlag) {
// pcm_sample_bit_depth_luma_minus1(4), pcm_sample_bit_depth_chroma_minus1(4)
br.skipBits(8);
parseUE(&br, &unused); // log2_min_pcm_luma_coding_block_size_minus3
parseUE(&br, &unused); // log2_diff_max_min_pcm_luma_coding_block_size
br.skipBits(1); // pcm_loop_filter_disabled_flag
}
uint32_t numShortTermRefPicSets;
if (!parseUE(&br, &numShortTermRefPicSets)) return false;
if (numShortTermRefPicSets > kMaxShortTermRefPicSets) {
ALOGW("numShortTermRefPicSets out of range");
return false;
}
StRefPicSet allRefPicSets[kMaxShortTermRefPicSets];
memset(allRefPicSets, 0, sizeof(StRefPicSet) * kMaxShortTermRefPicSets);
for (uint32_t i = 0; i < numShortTermRefPicSets; ++i) {
if (!skipStRefPicSet(&br, i, numShortTermRefPicSets, allRefPicSets, &allRefPicSets[i]))
return false;
}
uint32_t longTermRefPicsPresentFlag;
if (!br.getBitsGraceful(1, &longTermRefPicsPresentFlag)) return false;
if (longTermRefPicsPresentFlag) {
uint32_t numLongTermRefPicsSps;
if (!parseUE(&br, &numLongTermRefPicsSps)) return false;
for (uint32_t i = 0; i < numLongTermRefPicsSps; ++i) {
// lt_ref_pic_poc_lsb_sps
if (!br.getBitsGraceful(log2MaxPicOrderCntLsbMinus4 + 4, &unused)) return false;
if (!br.getBitsGraceful(1, &unused)) return false; // used_by_curr_pic_lt_sps_flag
}
}
// sps_temporal_mvp_enabled_flag(1), strong_intra_smoothing_enabled_flag(1)
br.skipBits(2);
uint32_t vuiParametersPresentFlag;
if (!br.getBitsGraceful(1, &vuiParametersPresentFlag)) return false;
if (vuiParametersPresentFlag) {
uint32_t aspectRatioInfoPresentFlag;
if (!br.getBitsGraceful(1, &aspectRatioInfoPresentFlag))
return false; // VUI aspect_ratio_info_present_flag
if (aspectRatioInfoPresentFlag) {
uint32_t aspectRatioIdc;
if (!br.getBitsGraceful(8, &aspectRatioIdc)) return false; // VUI aspect_ratio_idc
if (aspectRatioIdc == 255) { // VUI aspect_ratio_idc == extended sample aspect ratio
br.skipBits(32); // VUI sar_width + sar_height
}
}
uint32_t overscanInfoPresentFlag;
if (!br.getBitsGraceful(1, &overscanInfoPresentFlag))
return false; // VUI overscan_info_present_flag
if (overscanInfoPresentFlag) br.skipBits(1); // VUI overscan_appropriate_flag
uint32_t videoSignalTypePresentFlag;
if (!br.getBitsGraceful(1, &videoSignalTypePresentFlag))
return false; // VUI video_signal_type_present_flag
if (videoSignalTypePresentFlag) {
br.skipBits(3); // VUI video_format
uint32_t videoFullRangeFlag;
if (!br.getBitsGraceful(1, &videoFullRangeFlag))
return false; // VUI videoFullRangeFlag
colorAspects->fullRange = videoFullRangeFlag;
uint32_t color_description_present_flag;
if (!br.getBitsGraceful(1, &color_description_present_flag))
return false; // VUI color_description_present_flag
if (color_description_present_flag) {
if (!br.getBitsGraceful(8, &colorAspects->primaries))
return false; // VUI colour_primaries
if (!br.getBitsGraceful(8, &colorAspects->transfer))
return false; // VUI transfer_characteristics
if (!br.getBitsGraceful(8, &colorAspects->coeffs))
return false; // VUI matrix_coefficients
return true;
}
}
}
return false; // The NAL unit doesn't contain color aspects info.
}
} // namespace android