// Copyright 2022 The Chromium Authors. All rights reserved. // Use of this source code is governed by a BSD-style license that can be // found in the LICENSE file. //#define LOG_NDEBUG 0 #define LOG_TAG "NalParser" #include #include #include #include namespace android { namespace { constexpr uint32_t kMaxShortTermRefPicSets = 64; struct StRefPicSet { // Syntax elements. int numNegativePics; int numPositivePics; int deltaPocS0[kMaxShortTermRefPicSets]; int deltaPocS1[kMaxShortTermRefPicSets]; // Calculated fields. int numDeltaPocs; }; // Skip an HEVC ProfileTierLevel in the specified bitstream. bool skipProfileTierLevel(ABitReader* br, uint32_t spsMaxSublayersMinus1) { // general_profile_space(2), general_tier_flag(1), general_profile_idc(5), // general_profile_compatibility_flag(32), general_progressive_source_flag(1), // general_interlaced_source_flag(1), general_non_packed_constraint_flag(1), // general_frame_only_constraint_flag(1), compatibility_flags(43), general_inbld_flag(1), // general_level_idc(8) br->skipBits(96); if (spsMaxSublayersMinus1 > 6) return false; uint32_t subLayerProfilePresentFlag[6]; uint32_t subLayerLevelPresentFlag[6]; for (uint32_t i = 0; i < spsMaxSublayersMinus1; ++i) { if (!br->getBitsGraceful(1, &subLayerProfilePresentFlag[i])) return false; if (!br->getBitsGraceful(1, &subLayerLevelPresentFlag[i])) return false; } if (spsMaxSublayersMinus1 > 0) { br->skipBits(2 * (8 - spsMaxSublayersMinus1)); } for (uint32_t i = 0; i < spsMaxSublayersMinus1; ++i) { if (subLayerProfilePresentFlag[i]) { // sub_layer_profile_space(2), sub_layer_tier_flag(1), sub_layer_profile_idc(5), // sub_layer_profile_compatibility_flag(32), sub_layer_progressive_source_flag(1), // sub_layer_interlaced_source_flag(1), sub_layer_non_packed_constraint_flag(1), // sub_layer_frame_only_constraint_flag(1), compatibility_flags(43), // sub_layer_inbld_flag(1) br->skipBits(88); } if (subLayerLevelPresentFlag[i]) { br->skipBits(8); // sub_layer_level_idc } } return true; } // Skip an HEVC ScalingListData in the specified bitstream. bool skipScalingListData(ABitReader* br) { for (int sizeId = 0; sizeId < 4; ++sizeId) { for (int matrixId = 0; matrixId < 6; matrixId += (sizeId == 3) ? 3 : 1) { uint32_t scalingListPredModeFlag; if (!br->getBitsGraceful(1, &scalingListPredModeFlag)) return false; if (!scalingListPredModeFlag) { uint32_t unused; NalParser::parseUE(br, &unused); // scaling_list_pred_matrix_id_delta } else { int32_t unused; if (sizeId > 1) NalParser::parseSE(br, &unused); // scaling_list_dc_coef_16x16 or 32x32 int coefNum = std::min(64, (1 << (4 + (sizeId << 1)))); for (int i = 0; i < coefNum; ++i) NalParser::parseSE(br, &unused); // scaling_list_delta_coef } } } return true; } // Skip an HEVC StRefPicSet in the specified bitstream. bool skipStRefPicSet(ABitReader* br, uint32_t stRpsIdx, uint32_t numShortTermRefPicSets, StRefPicSet* allRefPicSets, StRefPicSet* currRefPicSet) { uint32_t interRefPicSetPredictionFlag = 0; if (stRpsIdx != 0) { if (!br->getBitsGraceful(1, &interRefPicSetPredictionFlag)) return false; } if (interRefPicSetPredictionFlag) { uint32_t deltaIdxMinus1 = 0; if (stRpsIdx == numShortTermRefPicSets) { if (!NalParser::parseUE(br, &deltaIdxMinus1)) return false; if (deltaIdxMinus1 + 1 > stRpsIdx) { ALOGW("deltaIdxMinus1 is out of range"); return false; } } int refRpsIdx = stRpsIdx - (static_cast(deltaIdxMinus1) + 1); uint32_t deltaRpsSign; uint32_t absDeltaRpsMinus1; if (!br->getBitsGraceful(1, &deltaRpsSign)) return false; if (!NalParser::parseUE(br, &absDeltaRpsMinus1)) return false; int deltaRps = (1 - 2 * static_cast(deltaRpsSign)) * (static_cast(absDeltaRpsMinus1) + 1); const StRefPicSet& refSet = allRefPicSets[refRpsIdx]; uint32_t useDeltaFlag[kMaxShortTermRefPicSets]; // useDeltaFlag defaults to 1 if not present. std::fill_n(useDeltaFlag, kMaxShortTermRefPicSets, 1); for (int j = 0; j <= refSet.numDeltaPocs; j++) { uint32_t usedByCurrPicFlag; if (!br->getBitsGraceful(1, &usedByCurrPicFlag)) return false; if (!usedByCurrPicFlag) if (!br->getBitsGraceful(1, &useDeltaFlag[j])) return false; } int i = 0; for (int j = refSet.numPositivePics - 1; j >= 0; --j) { int dPoc = refSet.deltaPocS1[j] + deltaRps; if (dPoc < 0 && useDeltaFlag[refSet.numNegativePics + j]) currRefPicSet->deltaPocS0[i++] = dPoc; } if (deltaRps < 0 && useDeltaFlag[refSet.numDeltaPocs]) { currRefPicSet->deltaPocS0[i++] = deltaRps; } for (int j = 0; j < refSet.numNegativePics; ++j) { int dPoc = refSet.deltaPocS0[j] + deltaRps; if (dPoc < 0 && useDeltaFlag[j]) currRefPicSet->deltaPocS0[i++] = dPoc; } currRefPicSet->numNegativePics = i; i = 0; for (int j = refSet.numNegativePics - 1; j >= 0; --j) { int dPoc = refSet.deltaPocS0[j] + deltaRps; if (dPoc > 0 && useDeltaFlag[j]) currRefPicSet->deltaPocS1[i++] = dPoc; } if (deltaRps > 0 && useDeltaFlag[refSet.numDeltaPocs]) currRefPicSet->deltaPocS1[i++] = deltaRps; for (int j = 0; j < refSet.numPositivePics; ++j) { int dPoc = refSet.deltaPocS1[j] + deltaRps; if (dPoc > 0 && useDeltaFlag[refSet.numNegativePics + j]) currRefPicSet->deltaPocS1[i++] = dPoc; } currRefPicSet->numPositivePics = i; } else { uint32_t uintForRead; if (!NalParser::parseUE(br, &uintForRead)) return false; currRefPicSet->numNegativePics = static_cast(uintForRead); if (!NalParser::parseUE(br, &uintForRead)) return false; currRefPicSet->numPositivePics = static_cast(uintForRead); if (currRefPicSet->numNegativePics > kMaxShortTermRefPicSets || currRefPicSet->numPositivePics > kMaxShortTermRefPicSets) { ALOGW("num_negative_pics or num_positive_pics is out of range"); return false; } for (int i = 0; i < currRefPicSet->numNegativePics; ++i) { uint32_t deltaPocS0Minus1; if (!NalParser::parseUE(br, &deltaPocS0Minus1)) return false; if (i == 0) { currRefPicSet->deltaPocS0[i] = -(static_cast(deltaPocS0Minus1) + 1); } else { currRefPicSet->deltaPocS0[i] = currRefPicSet->deltaPocS0[i - 1] - (static_cast(deltaPocS0Minus1) + 1); } br->skipBits(1); // used_by_curr_pic_s0 } for (int i = 0; i < currRefPicSet->numPositivePics; ++i) { uint32_t deltaPocS1Minus1; if (!NalParser::parseUE(br, &deltaPocS1Minus1)) return false; if (i == 0) { currRefPicSet->deltaPocS1[i] = static_cast(deltaPocS1Minus1) + 1; } else { currRefPicSet->deltaPocS1[i] = currRefPicSet->deltaPocS1[i - 1] + static_cast(deltaPocS1Minus1) + 1; } br->skipBits(1); // used_by_curr_pic_s1 } } currRefPicSet->numDeltaPocs = currRefPicSet->numNegativePics + currRefPicSet->numPositivePics; if (currRefPicSet->numDeltaPocs > kMaxShortTermRefPicSets) { ALOGW("numDeltaPocs is out of range"); return false; } return true; } } // namespace HEVCNalParser::HEVCNalParser(const uint8_t* data, size_t length) : NalParser(data, length) {} bool HEVCNalParser::locateSPS() { while (locateNextNal()) { if (length() == 0) continue; if (type() != kSPSType) continue; return true; } return false; } bool HEVCNalParser::locateIDR() { while (locateNextNal()) { if (length() == 0) continue; if (type() != kIDRType) continue; return true; } return false; } uint8_t HEVCNalParser::type() const { // First bit is forbidden_zero_bit, next 6 are nal_unit_type constexpr uint8_t kNALTypeMask = 0x7e; return (*mCurrNalDataPos & kNALTypeMask) >> 1; } bool HEVCNalParser::findCodedColorAspects(ColorAspects* colorAspects) { ALOG_ASSERT(colorAspects); ALOG_ASSERT(type() == kSPSType); // Unfortunately we can't directly jump to the Video Usability Information (VUI) parameters that // contain the color aspects. We need to parse the entire SPS header up until the values we // need. // Skip first 2 bytes for the NALU header. if (length() <= 2) return false; NALBitReader br(mCurrNalDataPos + 2, length() - 2); br.skipBits(4); // sps_video_parameter_set_id uint32_t spsMaxSublayersMinus1; if (!br.getBitsGraceful(3, &spsMaxSublayersMinus1)) return false; br.skipBits(1); // sps_temporal_id_nesting_flag if (!skipProfileTierLevel(&br, spsMaxSublayersMinus1)) return false; uint32_t unused; parseUE(&br, &unused); // sps_seq_parameter_set_id uint32_t chromaFormatIdc; if (!parseUE(&br, &chromaFormatIdc)) return false; if (chromaFormatIdc == 3) br.skipBits(1); // separate_colour_plane_flag parseUE(&br, &unused); // pic_width_in_luma_samples parseUE(&br, &unused); // pic_height_in_luma_samples uint32_t conformanceWindowFlag; if (!br.getBitsGraceful(1, &conformanceWindowFlag)) return false; if (conformanceWindowFlag) { parseUE(&br, &unused); // conf_win_left_offset parseUE(&br, &unused); // conf_win_right_offset parseUE(&br, &unused); // conf_win_top_offset parseUE(&br, &unused); // conf_win_bottom_offset } parseUE(&br, &unused); // bit_depth_luma_minus8 parseUE(&br, &unused); // bit_depth_chroma_minus8 uint32_t log2MaxPicOrderCntLsbMinus4; if (!parseUE(&br, &log2MaxPicOrderCntLsbMinus4)) return false; uint32_t spsSubLayerOrderingInfoPresentFlag; if (!br.getBitsGraceful(1, &spsSubLayerOrderingInfoPresentFlag)) return false; for (uint32_t i = spsSubLayerOrderingInfoPresentFlag ? 0 : spsMaxSublayersMinus1; i <= spsMaxSublayersMinus1; ++i) { parseUE(&br, &unused); // sps_max_dec_pic_buffering_minus1 parseUE(&br, &unused); // sps_max_num_reorder_pics parseUE(&br, &unused); // sps_max_latency_increase_plus1 } parseUE(&br, &unused); // log2_min_luma_coding_block_size_minus3 parseUE(&br, &unused); // log2_diff_max_min_luma_coding_block_size parseUE(&br, &unused); // log2_min_luma_transform_block_size_minus2 parseUE(&br, &unused); // log2_diff_max_min_luma_transform_block_size parseUE(&br, &unused); // max_transform_hierarchy_depth_inter parseUE(&br, &unused); // max_transform_hierarchy_depth_intra uint32_t scalingListEnabledFlag; if (!br.getBitsGraceful(1, &scalingListEnabledFlag)) return false; if (scalingListEnabledFlag) { uint32_t spsScalingListDataPresentFlag; if (!br.getBitsGraceful(1, &spsScalingListDataPresentFlag)) return false; if (spsScalingListDataPresentFlag) { if (!skipScalingListData(&br)) return false; } } br.skipBits(2); // amp_enabled_flag(1), sample_adaptive_offset_enabled_flag(1) uint32_t pcmEnabledFlag; if (!br.getBitsGraceful(1, &pcmEnabledFlag)) return false; if (pcmEnabledFlag) { // pcm_sample_bit_depth_luma_minus1(4), pcm_sample_bit_depth_chroma_minus1(4) br.skipBits(8); parseUE(&br, &unused); // log2_min_pcm_luma_coding_block_size_minus3 parseUE(&br, &unused); // log2_diff_max_min_pcm_luma_coding_block_size br.skipBits(1); // pcm_loop_filter_disabled_flag } uint32_t numShortTermRefPicSets; if (!parseUE(&br, &numShortTermRefPicSets)) return false; if (numShortTermRefPicSets > kMaxShortTermRefPicSets) { ALOGW("numShortTermRefPicSets out of range"); return false; } StRefPicSet allRefPicSets[kMaxShortTermRefPicSets]; memset(allRefPicSets, 0, sizeof(StRefPicSet) * kMaxShortTermRefPicSets); for (uint32_t i = 0; i < numShortTermRefPicSets; ++i) { if (!skipStRefPicSet(&br, i, numShortTermRefPicSets, allRefPicSets, &allRefPicSets[i])) return false; } uint32_t longTermRefPicsPresentFlag; if (!br.getBitsGraceful(1, &longTermRefPicsPresentFlag)) return false; if (longTermRefPicsPresentFlag) { uint32_t numLongTermRefPicsSps; if (!parseUE(&br, &numLongTermRefPicsSps)) return false; for (uint32_t i = 0; i < numLongTermRefPicsSps; ++i) { // lt_ref_pic_poc_lsb_sps if (!br.getBitsGraceful(log2MaxPicOrderCntLsbMinus4 + 4, &unused)) return false; if (!br.getBitsGraceful(1, &unused)) return false; // used_by_curr_pic_lt_sps_flag } } // sps_temporal_mvp_enabled_flag(1), strong_intra_smoothing_enabled_flag(1) br.skipBits(2); uint32_t vuiParametersPresentFlag; if (!br.getBitsGraceful(1, &vuiParametersPresentFlag)) return false; if (vuiParametersPresentFlag) { uint32_t aspectRatioInfoPresentFlag; if (!br.getBitsGraceful(1, &aspectRatioInfoPresentFlag)) return false; // VUI aspect_ratio_info_present_flag if (aspectRatioInfoPresentFlag) { uint32_t aspectRatioIdc; if (!br.getBitsGraceful(8, &aspectRatioIdc)) return false; // VUI aspect_ratio_idc if (aspectRatioIdc == 255) { // VUI aspect_ratio_idc == extended sample aspect ratio br.skipBits(32); // VUI sar_width + sar_height } } uint32_t overscanInfoPresentFlag; if (!br.getBitsGraceful(1, &overscanInfoPresentFlag)) return false; // VUI overscan_info_present_flag if (overscanInfoPresentFlag) br.skipBits(1); // VUI overscan_appropriate_flag uint32_t videoSignalTypePresentFlag; if (!br.getBitsGraceful(1, &videoSignalTypePresentFlag)) return false; // VUI video_signal_type_present_flag if (videoSignalTypePresentFlag) { br.skipBits(3); // VUI video_format uint32_t videoFullRangeFlag; if (!br.getBitsGraceful(1, &videoFullRangeFlag)) return false; // VUI videoFullRangeFlag colorAspects->fullRange = videoFullRangeFlag; uint32_t color_description_present_flag; if (!br.getBitsGraceful(1, &color_description_present_flag)) return false; // VUI color_description_present_flag if (color_description_present_flag) { if (!br.getBitsGraceful(8, &colorAspects->primaries)) return false; // VUI colour_primaries if (!br.getBitsGraceful(8, &colorAspects->transfer)) return false; // VUI transfer_characteristics if (!br.getBitsGraceful(8, &colorAspects->coeffs)) return false; // VUI matrix_coefficients return true; } } } return false; // The NAL unit doesn't contain color aspects info. } } // namespace android