// Copyright 2016 Google LLC. All rights reserved. // // Use of this source code is governed by a BSD-style // license that can be found in the LICENSE file or at // https://developers.google.com/open-source/licenses/bsd #include "packager/media/codecs/h265_parser.h" #include #include #include "glog/logging.h" #include "packager/media/base/macros.h" #include "packager/media/codecs/nalu_reader.h" #define TRUE_OR_RETURN(a) \ do { \ if (!(a)) { \ DVLOG(1) << "Failure while processing " << #a; \ return kInvalidStream; \ } \ } while (0) #define OK_OR_RETURN(a) \ do { \ Result status = (a); \ if (status != kOk) \ return status; \ } while (false) #define READ_LONG_OR_RETURN(out) \ do { \ int _top_half, _bottom_half; \ if (!br->ReadBits(16, &_top_half)) { \ DVLOG(1) \ << "Error in stream: unexpected EOS while trying to read " #out; \ return kInvalidStream; \ } \ if (!br->ReadBits(16, &_bottom_half)) { \ DVLOG(1) \ << "Error in stream: unexpected EOS while trying to read " #out; \ return kInvalidStream; \ } \ *(out) = ((long)_top_half) << 16 | _bottom_half; \ } while (false) namespace shaka { namespace media { namespace { int GetNumPicTotalCurr(const H265SliceHeader& slice_header, const H265Sps& sps) { int num_pic_total_curr = 0; const H265ReferencePictureSet& ref_pic_set = slice_header.short_term_ref_pic_set_sps_flag ? sps.st_ref_pic_sets[slice_header.short_term_ref_pic_set_idx] : slice_header.st_ref_pic_set; for (int i = 0; i < ref_pic_set.num_negative_pics; i++) { if (ref_pic_set.used_by_curr_pic_s0[i]) num_pic_total_curr++; } for (int i = 0; i < ref_pic_set.num_positive_pics; i++) { if (ref_pic_set.used_by_curr_pic_s1[i]) num_pic_total_curr++; } return num_pic_total_curr + slice_header.used_by_curr_pic_lt; } void GetAspectRatioInfo(const H265Sps& sps, uint32_t* pixel_width, uint32_t* pixel_height) { // The default value is 0; so if this is not in the SPS, it will correctly // assume unspecified. int aspect_ratio_idc = sps.vui_parameters.aspect_ratio_idc; // Table E.1 switch (aspect_ratio_idc) { case 1: *pixel_width = 1; *pixel_height = 1; break; case 2: *pixel_width = 12; *pixel_height = 11; break; case 3: *pixel_width = 10; *pixel_height = 11; break; case 4: *pixel_width = 16; *pixel_height = 11; break; case 5: *pixel_width = 40; *pixel_height = 33; break; case 6: *pixel_width = 24; *pixel_height = 11; break; case 7: *pixel_width = 20; *pixel_height = 11; break; case 8: *pixel_width = 32; *pixel_height = 11; break; case 9: *pixel_width = 80; *pixel_height = 33; break; case 10: *pixel_width = 18; *pixel_height = 11; break; case 11: *pixel_width = 15; *pixel_height = 11; break; case 12: *pixel_width = 64; *pixel_height = 33; break; case 13: *pixel_width = 160; *pixel_height = 99; break; case 14: *pixel_width = 4; *pixel_height = 3; break; case 15: *pixel_width = 3; *pixel_height = 2; break; case 16: *pixel_width = 2; *pixel_height = 1; break; case 255: *pixel_width = sps.vui_parameters.sar_width; *pixel_height = sps.vui_parameters.sar_height; break; default: // Section E.3.1 specifies that other values should be interpreted as 0. LOG(WARNING) << "Unknown aspect_ratio_idc " << aspect_ratio_idc; FALLTHROUGH_INTENDED; case 0: // Unlike the spec, assume 1:1 if not specified. *pixel_width = 1; *pixel_height = 1; break; } } } // namespace bool ExtractResolutionFromSps(const H265Sps& sps, uint32_t* coded_width, uint32_t* coded_height, uint32_t* pixel_width, uint32_t* pixel_height) { int crop_x = 0; int crop_y = 0; if (sps.conformance_window_flag) { int sub_width_c = 0; int sub_height_c = 0; // Table 6-1 switch (sps.chroma_format_idc) { case 0: // Monochrome sub_width_c = 1; sub_height_c = 1; break; case 1: // 4:2:0 sub_width_c = 2; sub_height_c = 2; break; case 2: // 4:2:2 sub_width_c = 2; sub_height_c = 1; break; case 3: // 4:4:4 sub_width_c = 1; sub_height_c = 1; break; default: LOG(ERROR) << "Unexpected chroma_format_idc " << sps.chroma_format_idc; return false; } // Formula D-28, D-29 crop_x = sub_width_c * (sps.conf_win_right_offset + sps.conf_win_left_offset); crop_y = sub_height_c * (sps.conf_win_bottom_offset + sps.conf_win_top_offset); } // Formula D-28, D-29 *coded_width = sps.pic_width_in_luma_samples - crop_x; *coded_height = sps.pic_height_in_luma_samples - crop_y; GetAspectRatioInfo(sps, pixel_width, pixel_height); return true; } H265Pps::H265Pps() {} H265Pps::~H265Pps() {} H265Sps::H265Sps() {} H265Sps::~H265Sps() {} int H265Sps::GetPicSizeInCtbsY() const { int min_cb_log2_size_y = log2_min_luma_coding_block_size_minus3 + 3; int ctb_log2_size_y = min_cb_log2_size_y + log2_diff_max_min_luma_coding_block_size; int ctb_size_y = 1 << ctb_log2_size_y; // Round-up division. int pic_width_in_ctbs_y = (pic_width_in_luma_samples - 1) / ctb_size_y + 1; int pic_height_in_ctbs_y = (pic_height_in_luma_samples - 1) / ctb_size_y + 1; return pic_width_in_ctbs_y * pic_height_in_ctbs_y; } int H265Sps::GetChromaArrayType() const { if (!separate_colour_plane_flag) return chroma_format_idc; else return 0; } H265ReferencePictureListModifications::H265ReferencePictureListModifications() { } H265ReferencePictureListModifications:: ~H265ReferencePictureListModifications() {} H265SliceHeader::H265SliceHeader() {} H265SliceHeader::~H265SliceHeader() {} H265Parser::H265Parser() {} H265Parser::~H265Parser() {} H265Parser::Result H265Parser::ParseSliceHeader(const Nalu& nalu, H265SliceHeader* slice_header) { DCHECK(nalu.is_video_slice()); *slice_header = H265SliceHeader(); // Parses whole element. H26xBitReader reader; reader.Initialize(nalu.data() + nalu.header_size(), nalu.payload_size()); H26xBitReader* br = &reader; TRUE_OR_RETURN(br->ReadBool(&slice_header->first_slice_segment_in_pic_flag)); if (nalu.type() >= Nalu::H265_BLA_W_LP && nalu.type() <= Nalu::H265_RSV_IRAP_VCL23) { TRUE_OR_RETURN(br->ReadBool(&slice_header->no_output_of_prior_pics_flag)); } TRUE_OR_RETURN(br->ReadUE(&slice_header->pic_parameter_set_id)); const H265Pps* pps = GetPps(slice_header->pic_parameter_set_id); TRUE_OR_RETURN(pps); const H265Sps* sps = GetSps(pps->seq_parameter_set_id); TRUE_OR_RETURN(sps); if (!slice_header->first_slice_segment_in_pic_flag) { if (pps->dependent_slice_segments_enabled_flag) { TRUE_OR_RETURN(br->ReadBool(&slice_header->dependent_slice_segment_flag)); } const int bit_length = ceil(log2(sps->GetPicSizeInCtbsY())); TRUE_OR_RETURN(br->ReadBits(bit_length, &slice_header->segment_address)); } if (!slice_header->dependent_slice_segment_flag) { TRUE_OR_RETURN(br->SkipBits(pps->num_extra_slice_header_bits)); TRUE_OR_RETURN(br->ReadUE(&slice_header->slice_type)); if (pps->output_flag_present_flag) { TRUE_OR_RETURN(br->ReadBool(&slice_header->pic_output_flag)); } if (sps->separate_colour_plane_flag) { TRUE_OR_RETURN(br->ReadBits(2, &slice_header->colour_plane_id)); } if (nalu.type() != Nalu::H265_IDR_W_RADL && nalu.type() != Nalu::H265_IDR_N_LP) { TRUE_OR_RETURN(br->ReadBits(sps->log2_max_pic_order_cnt_lsb_minus4 + 4, &slice_header->slice_pic_order_cnt_lsb)); TRUE_OR_RETURN( br->ReadBool(&slice_header->short_term_ref_pic_set_sps_flag)); if (!slice_header->short_term_ref_pic_set_sps_flag) { OK_OR_RETURN(ParseReferencePictureSet( sps->num_short_term_ref_pic_sets, sps->num_short_term_ref_pic_sets, sps->st_ref_pic_sets, br, &slice_header->st_ref_pic_set)); } else if (sps->num_short_term_ref_pic_sets > 1) { TRUE_OR_RETURN( br->ReadBits(ceil(log2(sps->num_short_term_ref_pic_sets)), &slice_header->short_term_ref_pic_set_idx)); TRUE_OR_RETURN(slice_header->short_term_ref_pic_set_idx < sps->num_short_term_ref_pic_sets); } if (sps->long_term_ref_pic_present_flag) { if (sps->num_long_term_ref_pics > 0) { TRUE_OR_RETURN(br->ReadUE(&slice_header->num_long_term_sps)); } TRUE_OR_RETURN(br->ReadUE(&slice_header->num_long_term_pics)); const int pic_count = slice_header->num_long_term_sps + slice_header->num_long_term_pics; slice_header->long_term_pics_info.resize(pic_count); for (int i = 0; i < pic_count; i++) { if (i < slice_header->num_long_term_sps) { int lt_idx_sps = 0; if (sps->num_long_term_ref_pics > 1) { TRUE_OR_RETURN(br->ReadBits( ceil(log2(sps->num_long_term_ref_pics)), <_idx_sps)); } if (sps->used_by_curr_pic_lt_flag[lt_idx_sps]) slice_header->used_by_curr_pic_lt++; } else { TRUE_OR_RETURN(br->SkipBits(sps->log2_max_pic_order_cnt_lsb_minus4 + 4)); // poc_lsb_lt bool used_by_curr_pic_lt_flag; TRUE_OR_RETURN(br->ReadBool(&used_by_curr_pic_lt_flag)); if (used_by_curr_pic_lt_flag) slice_header->used_by_curr_pic_lt++; } TRUE_OR_RETURN(br->ReadBool(&slice_header->long_term_pics_info[i] .delta_poc_msb_present_flag)); if (slice_header->long_term_pics_info[i].delta_poc_msb_present_flag) { TRUE_OR_RETURN(br->ReadUE( &slice_header->long_term_pics_info[i].delta_poc_msb_cycle_lt)); } } } if (sps->temporal_mvp_enabled_flag) { TRUE_OR_RETURN( br->ReadBool(&slice_header->slice_temporal_mvp_enabled_flag)); } } if (nalu.nuh_layer_id() != 0) { NOTIMPLEMENTED() << "Multi-layer streams are not supported."; return kUnsupportedStream; } if (sps->sample_adaptive_offset_enabled_flag) { TRUE_OR_RETURN(br->ReadBool(&slice_header->slice_sao_luma_flag)); if (sps->GetChromaArrayType() != 0) { TRUE_OR_RETURN(br->ReadBool(&slice_header->slice_sao_chroma_flag)); } } slice_header->num_ref_idx_l0_active_minus1 = pps->num_ref_idx_l0_default_active_minus1; slice_header->num_ref_idx_l1_active_minus1 = pps->num_ref_idx_l1_default_active_minus1; if (slice_header->slice_type == kPSlice || slice_header->slice_type == kBSlice) { TRUE_OR_RETURN( br->ReadBool(&slice_header->num_ref_idx_active_override_flag)); if (slice_header->num_ref_idx_active_override_flag) { TRUE_OR_RETURN(br->ReadUE(&slice_header->num_ref_idx_l0_active_minus1)); if (slice_header->slice_type == kBSlice) { TRUE_OR_RETURN( br->ReadUE(&slice_header->num_ref_idx_l1_active_minus1)); } } const int num_pic_total_curr = GetNumPicTotalCurr(*slice_header, *sps); if (pps->lists_modification_present_flag && num_pic_total_curr > 1) { OK_OR_RETURN(SkipReferencePictureListModification( *slice_header, *pps, num_pic_total_curr, br)); } if (slice_header->slice_type == kBSlice) { TRUE_OR_RETURN(br->ReadBool(&slice_header->mvd_l1_zero_flag)); } if (pps->cabac_init_present_flag) { TRUE_OR_RETURN(br->ReadBool(&slice_header->cabac_init_flag)); } if (slice_header->slice_temporal_mvp_enabled_flag) { if (slice_header->slice_type == kBSlice) { TRUE_OR_RETURN(br->ReadBool(&slice_header->collocated_from_l0)); } bool l0_greater_than_0 = slice_header->num_ref_idx_l0_active_minus1 > 0; bool l1_greater_than_0 = slice_header->num_ref_idx_l1_active_minus1 > 0; if (slice_header->collocated_from_l0 ? l0_greater_than_0 : l1_greater_than_0) { TRUE_OR_RETURN(br->ReadUE(&slice_header->collocated_ref_idx)); } } if ((pps->weighted_pred_flag && slice_header->slice_type == kPSlice) || (pps->weighted_bipred_flag && slice_header->slice_type == kBSlice)) { OK_OR_RETURN(SkipPredictionWeightTable( slice_header->slice_type == kBSlice, *sps, *slice_header, br)); } TRUE_OR_RETURN(br->ReadUE(&slice_header->five_minus_max_num_merge_cand)); } TRUE_OR_RETURN(br->ReadSE(&slice_header->slice_qp_delta)); if (pps->slice_chroma_qp_offsets_present_flag) { TRUE_OR_RETURN(br->ReadSE(&slice_header->slice_cb_qp_offset)); TRUE_OR_RETURN(br->ReadSE(&slice_header->slice_cr_qp_offset)); } if (pps->chroma_qp_offset_list_enabled_flag) { TRUE_OR_RETURN( br->ReadBool(&slice_header->cu_chroma_qp_offset_enabled_flag)); } if (pps->deblocking_filter_override_enabled_flag) { TRUE_OR_RETURN( br->ReadBool(&slice_header->deblocking_filter_override_flag)); } if (slice_header->deblocking_filter_override_flag) { TRUE_OR_RETURN( br->ReadBool(&slice_header->slice_deblocking_filter_disabled_flag)); if (!slice_header->slice_deblocking_filter_disabled_flag) { TRUE_OR_RETURN(br->ReadSE(&slice_header->slice_beta_offset_div2)); TRUE_OR_RETURN(br->ReadSE(&slice_header->slice_tc_offset_div2)); } } if (pps->loop_filter_across_slices_enabled_flag && (slice_header->slice_sao_luma_flag || slice_header->slice_sao_chroma_flag || !slice_header->slice_deblocking_filter_disabled_flag)) { TRUE_OR_RETURN(br->ReadBool( &slice_header->slice_loop_filter_across_slices_enabled_flag)); } } if (pps->tiles_enabled_flag || pps->entropy_coding_sync_enabled_flag) { TRUE_OR_RETURN(br->ReadUE(&slice_header->num_entry_point_offsets)); if (slice_header->num_entry_point_offsets > 0) { TRUE_OR_RETURN(br->ReadUE(&slice_header->offset_len_minus1)); slice_header->entry_point_offset_minus1.resize( slice_header->num_entry_point_offsets); for (int i = 0; i < slice_header->num_entry_point_offsets; i++) { TRUE_OR_RETURN( br->ReadBits(slice_header->offset_len_minus1 + 1, &slice_header->entry_point_offset_minus1[i])); } } } if (pps->slice_segment_header_extension_present_flag) { int extension_length; TRUE_OR_RETURN(br->ReadUE(&extension_length)); TRUE_OR_RETURN(br->SkipBits(extension_length * 8)); } OK_OR_RETURN(ByteAlignment(br)); slice_header->header_bit_size = nalu.payload_size() * 8 - br->NumBitsLeft(); return kOk; } H265Parser::Result H265Parser::ParsePps(const Nalu& nalu, int* pps_id) { DCHECK_EQ(Nalu::H265_PPS, nalu.type()); // Reads most of the element, not reading the extension data. H26xBitReader reader; reader.Initialize(nalu.data() + nalu.header_size(), nalu.payload_size()); H26xBitReader* br = &reader; *pps_id = -1; std::unique_ptr pps(new H265Pps); TRUE_OR_RETURN(br->ReadUE(&pps->pic_parameter_set_id)); TRUE_OR_RETURN(br->ReadUE(&pps->seq_parameter_set_id)); TRUE_OR_RETURN(br->ReadBool(&pps->dependent_slice_segments_enabled_flag)); TRUE_OR_RETURN(br->ReadBool(&pps->output_flag_present_flag)); TRUE_OR_RETURN(br->ReadBits(3, &pps->num_extra_slice_header_bits)); TRUE_OR_RETURN(br->ReadBool(&pps->sign_data_hiding_enabled_flag)); TRUE_OR_RETURN(br->ReadBool(&pps->cabac_init_present_flag)); TRUE_OR_RETURN(br->ReadUE(&pps->num_ref_idx_l0_default_active_minus1)); TRUE_OR_RETURN(br->ReadUE(&pps->num_ref_idx_l1_default_active_minus1)); TRUE_OR_RETURN(br->ReadSE(&pps->init_qp_minus26)); TRUE_OR_RETURN(br->ReadBool(&pps->constrained_intra_pred_flag)); TRUE_OR_RETURN(br->ReadBool(&pps->transform_skip_enabled_flag)); TRUE_OR_RETURN(br->ReadBool(&pps->cu_qp_delta_enabled_flag)); if (pps->cu_qp_delta_enabled_flag) TRUE_OR_RETURN(br->ReadUE(&pps->diff_cu_qp_delta_depth)); TRUE_OR_RETURN(br->ReadSE(&pps->cb_qp_offset)); TRUE_OR_RETURN(br->ReadSE(&pps->cr_qp_offset)); TRUE_OR_RETURN(br->ReadBool(&pps->slice_chroma_qp_offsets_present_flag)); TRUE_OR_RETURN(br->ReadBool(&pps->weighted_pred_flag)); TRUE_OR_RETURN(br->ReadBool(&pps->weighted_bipred_flag)); TRUE_OR_RETURN(br->ReadBool(&pps->transquant_bypass_enabled_flag)); TRUE_OR_RETURN(br->ReadBool(&pps->tiles_enabled_flag)); TRUE_OR_RETURN(br->ReadBool(&pps->entropy_coding_sync_enabled_flag)); if (pps->tiles_enabled_flag) { TRUE_OR_RETURN(br->ReadUE(&pps->num_tile_columns_minus1)); TRUE_OR_RETURN(br->ReadUE(&pps->num_tile_rows_minus1)); TRUE_OR_RETURN(br->ReadBool(&pps->uniform_spacing_flag)); if (!pps->uniform_spacing_flag) { pps->column_width_minus1.resize(pps->num_tile_columns_minus1); for (int i = 0; i < pps->num_tile_columns_minus1; i++) { TRUE_OR_RETURN(br->ReadUE(&pps->column_width_minus1[i])); } pps->row_height_minus1.resize(pps->num_tile_rows_minus1); for (int i = 0; i < pps->num_tile_rows_minus1; i++) { TRUE_OR_RETURN(br->ReadUE(&pps->row_height_minus1[i])); } } TRUE_OR_RETURN(br->ReadBool(&pps->loop_filter_across_tiles_enabled_flag)); } TRUE_OR_RETURN(br->ReadBool(&pps->loop_filter_across_slices_enabled_flag)); TRUE_OR_RETURN(br->ReadBool(&pps->deblocking_filter_control_present_flag)); if (pps->deblocking_filter_control_present_flag) { TRUE_OR_RETURN(br->ReadBool(&pps->deblocking_filter_override_enabled_flag)); TRUE_OR_RETURN(br->ReadBool(&pps->deblocking_filter_disabled_flag)); if (!pps->deblocking_filter_disabled_flag) { TRUE_OR_RETURN(br->ReadSE(&pps->beta_offset_div2)); TRUE_OR_RETURN(br->ReadSE(&pps->tc_offset_div2)); } } TRUE_OR_RETURN(br->ReadBool(&pps->scaling_list_data_present_flag)); if (pps->scaling_list_data_present_flag) { OK_OR_RETURN(SkipScalingListData(br)); } TRUE_OR_RETURN(br->ReadBool(&pps->lists_modification_present_flag)); TRUE_OR_RETURN(br->ReadUE(&pps->log2_parallel_merge_level_minus2)); TRUE_OR_RETURN( br->ReadBool(&pps->slice_segment_header_extension_present_flag)); bool pps_extension_present_flag; bool pps_range_extension_flag = false; TRUE_OR_RETURN(br->ReadBool(&pps_extension_present_flag)); if (pps_extension_present_flag) { TRUE_OR_RETURN(br->ReadBool(&pps_range_extension_flag)); // pps_multilayer_extension_flag, pps_3d_extension_flag, pps_extension_5bits TRUE_OR_RETURN(br->SkipBits(1 + 1 + 5)); } if (pps_range_extension_flag) { if (pps->transform_skip_enabled_flag) { // log2_max_transform_skip_block_size_minus2 int ignored; TRUE_OR_RETURN(br->ReadUE(&ignored)); } TRUE_OR_RETURN(br->SkipBits(1)); // cross_component_prediction_enabled_flag TRUE_OR_RETURN(br->ReadBool(&pps->chroma_qp_offset_list_enabled_flag)); // Incomplete } // Ignore remaining extension data. // This will replace any existing PPS instance. *pps_id = pps->pic_parameter_set_id; active_ppses_[*pps_id] = std::move(pps); return kOk; } H265Parser::Result H265Parser::ParseSps(const Nalu& nalu, int* sps_id) { DCHECK_EQ(Nalu::H265_SPS, nalu.type()); // Reads most of the element, not reading the extension data. H26xBitReader reader; reader.Initialize(nalu.data() + nalu.header_size(), nalu.payload_size()); H26xBitReader* br = &reader; *sps_id = -1; std::unique_ptr sps(new H265Sps); TRUE_OR_RETURN(br->ReadBits(4, &sps->video_parameter_set_id)); TRUE_OR_RETURN(br->ReadBits(3, &sps->max_sub_layers_minus1)); TRUE_OR_RETURN(br->ReadBool(&sps->temporal_id_nesting_flag)); OK_OR_RETURN( ReadProfileTierLevel(true, sps->max_sub_layers_minus1, br, sps.get())); TRUE_OR_RETURN(br->ReadUE(&sps->seq_parameter_set_id)); TRUE_OR_RETURN(br->ReadUE(&sps->chroma_format_idc)); if (sps->chroma_format_idc == 3) { TRUE_OR_RETURN(br->ReadBool(&sps->separate_colour_plane_flag)); } TRUE_OR_RETURN(br->ReadUE(&sps->pic_width_in_luma_samples)); TRUE_OR_RETURN(br->ReadUE(&sps->pic_height_in_luma_samples)); TRUE_OR_RETURN(br->ReadBool(&sps->conformance_window_flag)); if (sps->conformance_window_flag) { TRUE_OR_RETURN(br->ReadUE(&sps->conf_win_left_offset)); TRUE_OR_RETURN(br->ReadUE(&sps->conf_win_right_offset)); TRUE_OR_RETURN(br->ReadUE(&sps->conf_win_top_offset)); TRUE_OR_RETURN(br->ReadUE(&sps->conf_win_bottom_offset)); } TRUE_OR_RETURN(br->ReadUE(&sps->bit_depth_luma_minus8)); TRUE_OR_RETURN(br->ReadUE(&sps->bit_depth_chroma_minus8)); TRUE_OR_RETURN(br->ReadUE(&sps->log2_max_pic_order_cnt_lsb_minus4)); TRUE_OR_RETURN(br->ReadBool(&sps->sub_layer_ordering_info_present_flag)); int start = sps->sub_layer_ordering_info_present_flag ? 0 : sps->max_sub_layers_minus1; for (int i = start; i <= sps->max_sub_layers_minus1; i++) { TRUE_OR_RETURN(br->ReadUE(&sps->max_dec_pic_buffering_minus1[i])); TRUE_OR_RETURN(br->ReadUE(&sps->max_num_reorder_pics[i])); TRUE_OR_RETURN(br->ReadUE(&sps->max_latency_increase_plus1[i])); } TRUE_OR_RETURN(br->ReadUE(&sps->log2_min_luma_coding_block_size_minus3)); TRUE_OR_RETURN(br->ReadUE(&sps->log2_diff_max_min_luma_coding_block_size)); TRUE_OR_RETURN(br->ReadUE(&sps->log2_min_luma_transform_block_size_minus2)); TRUE_OR_RETURN(br->ReadUE(&sps->log2_diff_max_min_luma_transform_block_size)); TRUE_OR_RETURN(br->ReadUE(&sps->max_transform_hierarchy_depth_inter)); TRUE_OR_RETURN(br->ReadUE(&sps->max_transform_hierarchy_depth_intra)); TRUE_OR_RETURN(br->ReadBool(&sps->scaling_list_enabled_flag)); if (sps->scaling_list_enabled_flag) { TRUE_OR_RETURN(br->ReadBool(&sps->scaling_list_data_present_flag)); if (sps->scaling_list_data_present_flag) { OK_OR_RETURN(SkipScalingListData(br)); } } TRUE_OR_RETURN(br->ReadBool(&sps->amp_enabled_flag)); TRUE_OR_RETURN(br->ReadBool(&sps->sample_adaptive_offset_enabled_flag)); TRUE_OR_RETURN(br->ReadBool(&sps->pcm_enabled_flag)); if (sps->pcm_enabled_flag) { TRUE_OR_RETURN(br->ReadBits(4, &sps->pcm_sample_bit_depth_luma_minus1)); TRUE_OR_RETURN(br->ReadBits(4, &sps->pcm_sample_bit_depth_chroma_minus1)); TRUE_OR_RETURN( br->ReadUE(&sps->log2_min_pcm_luma_coding_block_size_minus3)); TRUE_OR_RETURN( br->ReadUE(&sps->log2_diff_max_min_pcm_luma_coding_block_size)); TRUE_OR_RETURN(br->ReadBool(&sps->pcm_loop_filter_disabled_flag)); } TRUE_OR_RETURN(br->ReadUE(&sps->num_short_term_ref_pic_sets)); sps->st_ref_pic_sets.resize(sps->num_short_term_ref_pic_sets); for (int i = 0; i < sps->num_short_term_ref_pic_sets; i++) { OK_OR_RETURN(ParseReferencePictureSet(sps->num_short_term_ref_pic_sets, i, sps->st_ref_pic_sets, br, &sps->st_ref_pic_sets[i])); } TRUE_OR_RETURN(br->ReadBool(&sps->long_term_ref_pic_present_flag)); if (sps->long_term_ref_pic_present_flag) { TRUE_OR_RETURN(br->ReadUE(&sps->num_long_term_ref_pics)); sps->lt_ref_pic_poc_lsb.resize(sps->num_long_term_ref_pics); sps->used_by_curr_pic_lt_flag.resize(sps->num_long_term_ref_pics); for (int i = 0; i < sps->num_long_term_ref_pics; i++) { TRUE_OR_RETURN(br->ReadBits(sps->log2_max_pic_order_cnt_lsb_minus4 + 4, &sps->lt_ref_pic_poc_lsb[i])); bool temp; TRUE_OR_RETURN(br->ReadBool(&temp)); sps->used_by_curr_pic_lt_flag[i] = temp; } } TRUE_OR_RETURN(br->ReadBool(&sps->temporal_mvp_enabled_flag)); TRUE_OR_RETURN(br->ReadBool(&sps->strong_intra_smoothing_enabled_flag)); TRUE_OR_RETURN(br->ReadBool(&sps->vui_parameters_present)); if (sps->vui_parameters_present) { OK_OR_RETURN(ParseVuiParameters(sps->max_sub_layers_minus1, br, &sps->vui_parameters)); } // Ignore remaining extension data. // This will replace any existing SPS instance. *sps_id = sps->seq_parameter_set_id; active_spses_[*sps_id] = std::move(sps); return kOk; } const H265Pps* H265Parser::GetPps(int pps_id) { return active_ppses_[pps_id].get(); } const H265Sps* H265Parser::GetSps(int sps_id) { return active_spses_[sps_id].get(); } H265Parser::Result H265Parser::ParseVuiParameters(int max_num_sub_layers_minus1, H26xBitReader* br, H265VuiParameters* vui) { // Reads whole element but ignores most of it. int ignored; TRUE_OR_RETURN(br->ReadBool(&vui->aspect_ratio_info_present_flag)); if (vui->aspect_ratio_info_present_flag) { TRUE_OR_RETURN(br->ReadBits(8, &vui->aspect_ratio_idc)); if (vui->aspect_ratio_idc == H265VuiParameters::kExtendedSar) { TRUE_OR_RETURN(br->ReadBits(16, &vui->sar_width)); TRUE_OR_RETURN(br->ReadBits(16, &vui->sar_height)); } } bool overscan_info_present_flag; TRUE_OR_RETURN(br->ReadBool(&overscan_info_present_flag)); if (overscan_info_present_flag) { TRUE_OR_RETURN(br->SkipBits(1)); // overscan_appropriate_flag } bool video_signal_type_present_flag; TRUE_OR_RETURN(br->ReadBool(&video_signal_type_present_flag)); if (video_signal_type_present_flag) { TRUE_OR_RETURN(br->SkipBits(3)); // video_format TRUE_OR_RETURN(br->SkipBits(1)); // video_full_range_flag bool colour_description_present_flag; TRUE_OR_RETURN(br->ReadBool(&colour_description_present_flag)); if (colour_description_present_flag) { TRUE_OR_RETURN(br->SkipBits(8)); // colour_primaries TRUE_OR_RETURN(br->ReadBits(8, &vui->transfer_characteristics)); TRUE_OR_RETURN(br->SkipBits(8)); // matrix_coeffs } } bool chroma_loc_info_present_flag; TRUE_OR_RETURN(br->ReadBool(&chroma_loc_info_present_flag)); if (chroma_loc_info_present_flag) { // chroma_sample_log_type_top_field, chroma_sample_log_type_bottom_field TRUE_OR_RETURN(br->ReadUE(&ignored)); TRUE_OR_RETURN(br->ReadUE(&ignored)); } // neutral_chroma_indication_flag, field_seq_flag, // frame_field_info_present_flag. TRUE_OR_RETURN(br->SkipBits(3)); bool default_display_window_flag; TRUE_OR_RETURN(br->ReadBool(&default_display_window_flag)); if (default_display_window_flag) { TRUE_OR_RETURN(br->ReadUE(&ignored)); // def_disp_win_left_offset TRUE_OR_RETURN(br->ReadUE(&ignored)); // def_disp_win_right_offset TRUE_OR_RETURN(br->ReadUE(&ignored)); // def_disp_win_top_offset TRUE_OR_RETURN(br->ReadUE(&ignored)); // def_disp_win_bottom_offset } TRUE_OR_RETURN(br->ReadBool(&vui->vui_timing_info_present_flag)); if (vui->vui_timing_info_present_flag) { READ_LONG_OR_RETURN(&vui->vui_num_units_in_tick); READ_LONG_OR_RETURN(&vui->vui_time_scale); bool vui_poc_proportional_to_timing_flag; TRUE_OR_RETURN(br->ReadBool(&vui_poc_proportional_to_timing_flag)); if (vui_poc_proportional_to_timing_flag) { // vui_num_ticks_poc_diff_one_minus1 TRUE_OR_RETURN(br->ReadUE(&ignored)); } bool vui_hdr_parameters_present_flag; TRUE_OR_RETURN(br->ReadBool(&vui_hdr_parameters_present_flag)); if (vui_hdr_parameters_present_flag) { OK_OR_RETURN(SkipHrdParameters(max_num_sub_layers_minus1, br)); } } TRUE_OR_RETURN(br->ReadBool(&vui->bitstream_restriction_flag)); if (vui->bitstream_restriction_flag) { // tiles_fixed_structure_flag, motion_vectors_over_pic_boundaries_flag, // restricted_ref_pic_lists_flag. TRUE_OR_RETURN(br->SkipBits(3)); TRUE_OR_RETURN(br->ReadUE(&vui->min_spatial_segmentation_idc)); TRUE_OR_RETURN(br->ReadUE(&ignored)); // max_bytes_per_pic_denom TRUE_OR_RETURN(br->ReadUE(&ignored)); // max_bits_per_min_cu_denum TRUE_OR_RETURN(br->ReadUE(&ignored)); // log2_max_mv_length_horizontal TRUE_OR_RETURN(br->ReadUE(&ignored)); // log2_max_mv_length_vertical } return kOk; } H265Parser::Result H265Parser::ParseReferencePictureSet( int num_short_term_ref_pic_sets, int st_rps_idx, const std::vector& ref_pic_sets, H26xBitReader* br, H265ReferencePictureSet* out_ref_pic_set) { // Parses and processess a short-term reference picture set. This needs to // be done since the size of this element may be dependent on previous // reference picture sets. bool inter_ref_pic_set_prediction = false; if (st_rps_idx != 0) { TRUE_OR_RETURN(br->ReadBool(&inter_ref_pic_set_prediction)); } if (inter_ref_pic_set_prediction) { int delta_idx = 1; if (st_rps_idx == num_short_term_ref_pic_sets) { TRUE_OR_RETURN(br->ReadUE(&delta_idx)); delta_idx++; TRUE_OR_RETURN(delta_idx <= st_rps_idx); } int ref_rps_idx = st_rps_idx - delta_idx; DCHECK_LE(0, ref_rps_idx); DCHECK_LT(ref_rps_idx, st_rps_idx); bool delta_rps_sign; int abs_delta_rps_minus1; TRUE_OR_RETURN(br->ReadBool(&delta_rps_sign)); TRUE_OR_RETURN(br->ReadUE(&abs_delta_rps_minus1)); int delta_rps = delta_rps_sign ? -(abs_delta_rps_minus1 + 1) : abs_delta_rps_minus1 + 1; int ref_num_delta_pocs = ref_pic_sets[ref_rps_idx].num_delta_pocs; std::vector used_by_curr_pic(ref_num_delta_pocs + 1); std::vector use_delta(ref_num_delta_pocs + 1); for (int j = 0; j <= ref_num_delta_pocs; j++) { bool temp; TRUE_OR_RETURN(br->ReadBool(&temp)); used_by_curr_pic[j] = temp; if (!used_by_curr_pic[j]) { TRUE_OR_RETURN(br->ReadBool(&temp)); use_delta[j] = temp; } else { use_delta[j] = true; } } int ref_num_positive_pics = ref_pic_sets[ref_rps_idx].num_positive_pics; int ref_num_negative_pics = ref_pic_sets[ref_rps_idx].num_negative_pics; int i; // Update list 0. { i = 0; for (int j = ref_num_positive_pics - 1; j >= 0; j--) { int d_poc = ref_pic_sets[ref_rps_idx].delta_poc_s1[j] + delta_rps; if (d_poc < 0 && use_delta[ref_num_negative_pics + j]) { out_ref_pic_set->delta_poc_s0[i] = d_poc; out_ref_pic_set->used_by_curr_pic_s0[i] = used_by_curr_pic[ref_num_negative_pics + j]; i++; } } if (delta_rps < 0 && use_delta[ref_num_delta_pocs]) { out_ref_pic_set->delta_poc_s0[i] = delta_rps; out_ref_pic_set->used_by_curr_pic_s0[i] = used_by_curr_pic[ref_num_delta_pocs]; i++; } for (int j = 0; j < ref_num_negative_pics; j++) { int d_poc = ref_pic_sets[ref_rps_idx].delta_poc_s0[j] + delta_rps; if (d_poc < 0 && use_delta[j]) { out_ref_pic_set->delta_poc_s0[i] = d_poc; out_ref_pic_set->used_by_curr_pic_s0[i] = used_by_curr_pic[j]; i++; } } out_ref_pic_set->num_negative_pics = i; } // Update list 1. { i = 0; for (int j = ref_num_negative_pics - 1; j >= 0; j--) { int d_poc = ref_pic_sets[ref_rps_idx].delta_poc_s0[j] + delta_rps; if (d_poc > 0 && use_delta[j]) { out_ref_pic_set->delta_poc_s1[i] = d_poc; out_ref_pic_set->used_by_curr_pic_s1[i] = used_by_curr_pic[j]; i++; } } if (delta_rps > 0 && use_delta[ref_num_delta_pocs]) { out_ref_pic_set->delta_poc_s1[i] = delta_rps; out_ref_pic_set->used_by_curr_pic_s1[i] = used_by_curr_pic[ref_num_delta_pocs]; i++; } for (int j = 0; j < ref_num_positive_pics; j++) { int d_poc = ref_pic_sets[ref_rps_idx].delta_poc_s1[j] + delta_rps; if (d_poc > 0 && use_delta[ref_num_negative_pics + j]) { out_ref_pic_set->delta_poc_s1[i] = d_poc; out_ref_pic_set->used_by_curr_pic_s1[i] = used_by_curr_pic[ref_num_negative_pics + j]; i++; } } out_ref_pic_set->num_positive_pics = i; } } else { TRUE_OR_RETURN(br->ReadUE(&out_ref_pic_set->num_negative_pics)); TRUE_OR_RETURN(out_ref_pic_set->num_negative_pics <= kMaxRefPicSetCount); TRUE_OR_RETURN(br->ReadUE(&out_ref_pic_set->num_positive_pics)); TRUE_OR_RETURN(out_ref_pic_set->num_positive_pics <= kMaxRefPicSetCount); int prev_poc = 0; for (int i = 0; i < out_ref_pic_set->num_negative_pics; i++) { int delta_poc_s0_minus1; TRUE_OR_RETURN(br->ReadUE(&delta_poc_s0_minus1)); out_ref_pic_set->delta_poc_s0[i] = prev_poc - (delta_poc_s0_minus1 + 1); prev_poc = out_ref_pic_set->delta_poc_s0[i]; TRUE_OR_RETURN(br->ReadBool(&out_ref_pic_set->used_by_curr_pic_s0[i])); } prev_poc = 0; for (int i = 0; i < out_ref_pic_set->num_positive_pics; i++) { int delta_poc_s1_minus1; TRUE_OR_RETURN(br->ReadUE(&delta_poc_s1_minus1)); out_ref_pic_set->delta_poc_s1[i] = prev_poc + delta_poc_s1_minus1 + 1; prev_poc = out_ref_pic_set->delta_poc_s1[i]; TRUE_OR_RETURN(br->ReadBool(&out_ref_pic_set->used_by_curr_pic_s1[i])); } } out_ref_pic_set->num_delta_pocs = out_ref_pic_set->num_positive_pics + out_ref_pic_set->num_negative_pics; return kOk; } H265Parser::Result H265Parser::SkipReferencePictureListModification( const H265SliceHeader& slice_header, const H265Pps&, int num_pic_total_curr, H26xBitReader* br) { // Reads whole element but ignores it all. bool ref_pic_list_modification_flag_l0; TRUE_OR_RETURN(br->ReadBool(&ref_pic_list_modification_flag_l0)); if (ref_pic_list_modification_flag_l0) { for (int i = 0; i <= slice_header.num_ref_idx_l0_active_minus1; i++) { TRUE_OR_RETURN(br->SkipBits(ceil(log2(num_pic_total_curr)))); } } if (slice_header.slice_type == kBSlice) { bool ref_pic_list_modification_flag_l1; TRUE_OR_RETURN(br->ReadBool(&ref_pic_list_modification_flag_l1)); if (ref_pic_list_modification_flag_l1) { for (int i = 0; i <= slice_header.num_ref_idx_l1_active_minus1; i++) { TRUE_OR_RETURN(br->SkipBits(ceil(log2(num_pic_total_curr)))); } } } return kOk; } H265Parser::Result H265Parser::SkipPredictionWeightTablePart( int num_ref_idx_minus1, int chroma_array_type, H26xBitReader* br) { // Reads whole element, ignores it. int ignored; std::vector luma_weight_flag(num_ref_idx_minus1 + 1); std::vector chroma_weight_flag(num_ref_idx_minus1 + 1); for (int i = 0; i <= num_ref_idx_minus1; i++) { bool temp; TRUE_OR_RETURN(br->ReadBool(&temp)); luma_weight_flag[i] = temp; } if (chroma_array_type != 0) { for (int i = 0; i <= num_ref_idx_minus1; i++) { bool temp; TRUE_OR_RETURN(br->ReadBool(&temp)); chroma_weight_flag[i] = temp; } } for (int i = 0; i <= num_ref_idx_minus1; i++) { if (luma_weight_flag[i]) { TRUE_OR_RETURN(br->ReadSE(&ignored)); // delta_luma_weight_l# TRUE_OR_RETURN(br->ReadSE(&ignored)); // luma_offset_l# } if (chroma_weight_flag[i]) { for (int j = 0; j < 2; j++) { TRUE_OR_RETURN(br->ReadSE(&ignored)); // delta_chroma_weight_l# TRUE_OR_RETURN(br->ReadSE(&ignored)); // delta_chroma_offset_l# } } } return kOk; } H265Parser::Result H265Parser::SkipPredictionWeightTable( bool is_b_slice, const H265Sps& sps, const H265SliceHeader& slice_header, H26xBitReader* br) { // Reads whole element, ignores it. int ignored; int chroma_array_type = sps.GetChromaArrayType(); TRUE_OR_RETURN(br->ReadUE(&ignored)); // luma_log2_weight_denom if (chroma_array_type != 0) { TRUE_OR_RETURN(br->ReadSE(&ignored)); // delta_chroma_log2_weight_denom } OK_OR_RETURN(SkipPredictionWeightTablePart( slice_header.num_ref_idx_l0_active_minus1, chroma_array_type, br)); if (is_b_slice) { OK_OR_RETURN(SkipPredictionWeightTablePart( slice_header.num_ref_idx_l1_active_minus1, chroma_array_type, br)); } return kOk; } H265Parser::Result H265Parser::ReadProfileTierLevel( bool profile_present, int max_num_sub_layers_minus1, H26xBitReader* br, H265Sps* sps) { // Reads whole element, ignores it. if (profile_present) { // 11 bytes of general_profile_tier flags: // general_profile_space, general_tier_flag, general_profile_idc // general_profile_compativility_flag // general_progressive_source_flag // general_interlaced_source_flag // general_non_packed_constraint_flag // general_frame_only_constraint_flag // 44-bits of other flags for (int i = 0; i < 11; i++) TRUE_OR_RETURN(br->ReadBits(8, &sps->general_profile_tier_level_data[i])); } // general_level_idc TRUE_OR_RETURN(br->ReadBits(8, &sps->general_profile_tier_level_data[11])); std::vector sub_layer_profile_present(max_num_sub_layers_minus1); std::vector sub_layer_level_present(max_num_sub_layers_minus1); for (int i = 0; i < max_num_sub_layers_minus1; i++) { bool profile, level; TRUE_OR_RETURN(br->ReadBool(&profile)); TRUE_OR_RETURN(br->ReadBool(&level)); sub_layer_profile_present[i] = profile; sub_layer_level_present[i] = level; } if (max_num_sub_layers_minus1 > 0) { for (int i = max_num_sub_layers_minus1; i < 8; i++) TRUE_OR_RETURN(br->SkipBits(2)); // reserved_zero_2bits } for (int i = 0; i < max_num_sub_layers_minus1; i++) { if (sub_layer_profile_present[i]) { // sub_layer_profile_space, sub_layer_tier_flag, sub_layer_profile_idc // sub_layer_profile_compatibility // sub_layer_reserved_zero_43bits // sub_layer_reserved_zero_bit TRUE_OR_RETURN(br->SkipBits(2 + 1 + 5 + 32 + 4 + 43 + 1)); } if (sub_layer_level_present[i]) { TRUE_OR_RETURN(br->SkipBits(8)); } } return kOk; } H265Parser::Result H265Parser::SkipScalingListData(H26xBitReader* br) { // Reads whole element, ignores it. int ignored; for (int size_id = 0; size_id < 4; size_id++) { for (int matrix_id = 0; matrix_id < 6; matrix_id += ((size_id == 3) ? 3 : 1)) { bool scaling_list_pred_mode; TRUE_OR_RETURN(br->ReadBool(&scaling_list_pred_mode)); if (!scaling_list_pred_mode) { // scaling_list_pred_matrix_id_delta TRUE_OR_RETURN(br->ReadUE(&ignored)); } else { int coefNum = std::min(64, (1 << (4 + (size_id << 1)))); if (size_id > 1) { TRUE_OR_RETURN(br->ReadSE(&ignored)); // scaling_list_dc_coef_minus8 } for (int i = 0; i < coefNum; i++) { TRUE_OR_RETURN(br->ReadSE(&ignored)); // scaling_list_delta_coef } } } } return kOk; } H265Parser::Result H265Parser::SkipHrdParameters(int max_num_sub_layers_minus1, H26xBitReader* br) { // common_inf_present_flag is always 1 when parsing vui_parameters. const bool common_inf_present_flag = true; int ignored; bool nal_hdr_parameters_present_flag; bool vcl_hdr_parameters_present_flag; bool sub_pic_hdr_params_present_flag = false; if (common_inf_present_flag) { TRUE_OR_RETURN(br->ReadBool(&nal_hdr_parameters_present_flag)); TRUE_OR_RETURN(br->ReadBool(&vcl_hdr_parameters_present_flag)); if (nal_hdr_parameters_present_flag || vcl_hdr_parameters_present_flag) { TRUE_OR_RETURN(br->ReadBool(&sub_pic_hdr_params_present_flag)); if (sub_pic_hdr_params_present_flag) { // tick_divisor_minus2, du_cpb_removal_delay_increment_length_minus1, // sub_pic_cpb_params_in_pic_timing_sei_flag // dpb_output_delay_du_length_minus1 TRUE_OR_RETURN(br->SkipBits(8 + 5 + 1 + 5)); } // bit_rate_scale, cpb_size_scale TRUE_OR_RETURN(br->SkipBits(4 + 4)); if (sub_pic_hdr_params_present_flag) TRUE_OR_RETURN(br->SkipBits(4)); // cpb_size_du_scale // initial_cpb_removal_delay_length_minus1, // au_cpb_removal_delay_length_minus1, dpb_output_delay_length_minus1 TRUE_OR_RETURN(br->SkipBits(5 + 5 + 5)); } } for (int i = 0; i <= max_num_sub_layers_minus1; i++) { bool fixed_pic_rate_general_flag; bool fixed_pic_rate_within_cvs_flag = true; bool low_delay_hdr_flag = false; int cpb_cnt_minus1 = 0; TRUE_OR_RETURN(br->ReadBool(&fixed_pic_rate_general_flag)); if (!fixed_pic_rate_general_flag) TRUE_OR_RETURN(br->ReadBool(&fixed_pic_rate_within_cvs_flag)); if (fixed_pic_rate_within_cvs_flag) TRUE_OR_RETURN(br->ReadUE(&ignored)); // elemental_duration_ic_tc_minus1 else TRUE_OR_RETURN(br->ReadBool(&low_delay_hdr_flag)); if (!low_delay_hdr_flag) TRUE_OR_RETURN(br->ReadUE(&cpb_cnt_minus1)); if (nal_hdr_parameters_present_flag) { OK_OR_RETURN(SkipSubLayerHrdParameters( cpb_cnt_minus1, sub_pic_hdr_params_present_flag, br)); } if (vcl_hdr_parameters_present_flag) { OK_OR_RETURN(SkipSubLayerHrdParameters( cpb_cnt_minus1, sub_pic_hdr_params_present_flag, br)); } } return kOk; } H265Parser::Result H265Parser::SkipSubLayerHrdParameters( int cpb_cnt_minus1, bool sub_pic_hdr_params_present_flag, H26xBitReader* br) { int ignored; for (int i = 0; i <= cpb_cnt_minus1; i++) { TRUE_OR_RETURN(br->ReadUE(&ignored)); // bit_rate_value_minus1 TRUE_OR_RETURN(br->ReadUE(&ignored)); // cpb_size_value_minus1 if (sub_pic_hdr_params_present_flag) { TRUE_OR_RETURN(br->ReadUE(&ignored)); // cpb_size_du_value_minus1 TRUE_OR_RETURN(br->ReadUE(&ignored)); // bit_rate_du_value_minus1 } TRUE_OR_RETURN(br->SkipBits(1)); // cbr_flag } return kOk; } H265Parser::Result H265Parser::ByteAlignment(H26xBitReader* br) { TRUE_OR_RETURN(br->SkipBits(1)); TRUE_OR_RETURN(br->SkipBits(br->NumBitsLeft() % 8)); return kOk; } } // namespace media } // namespace shaka