st/va: add VAAPI HEVC decode support
authorBoyuan Zhang <boyuan.zhang@amd.com>
Fri, 23 Oct 2015 17:37:48 +0000 (13:37 -0400)
committerLeo Liu <leo.liu@amd.com>
Tue, 27 Oct 2015 23:09:55 +0000 (19:09 -0400)
Signed-off-by: Boyuan Zhang <boyuan.zhang@amd.com>
Reviewed-by: Christian König <christian.koenig@amd.com>
Reviewed-by: Leo Liu <leo.liu@amd.com>
configure.ac
src/gallium/state_trackers/va/config.c
src/gallium/state_trackers/va/context.c
src/gallium/state_trackers/va/picture.c
src/gallium/state_trackers/va/va_private.h

index 5aa19a5a6de842bdb16745e24ead540bedc486d1..3f15881a18ef401fd4fa34a3cd438e02f06b0e94 100644 (file)
@@ -81,7 +81,7 @@ PRESENTPROTO_REQUIRED=1.0
 LIBUDEV_REQUIRED=151
 GLPROTO_REQUIRED=1.4.14
 LIBOMXIL_BELLAGIO_REQUIRED=0.0
-LIBVA_REQUIRED=0.35.0
+LIBVA_REQUIRED=0.38.0
 VDPAU_REQUIRED=1.1
 WAYLAND_REQUIRED=1.2.0
 XCB_REQUIRED=1.9.3
index cfb0b25b71f70225d8792703d013254de64c2e2f..5030f9e5d4338f9ede84f7a061992cc58d8092a7 100644 (file)
@@ -45,7 +45,7 @@ vlVaQueryConfigProfiles(VADriverContextP ctx, VAProfile *profile_list, int *num_
    *num_profiles = 0;
 
    pscreen = VL_VA_PSCREEN(ctx);
-   for (p = PIPE_VIDEO_PROFILE_MPEG2_SIMPLE; p <= PIPE_VIDEO_PROFILE_MPEG4_AVC_HIGH; ++p)
+   for (p = PIPE_VIDEO_PROFILE_MPEG2_SIMPLE; p <= PIPE_VIDEO_PROFILE_HEVC_MAIN_444; ++p)
       if (pscreen->get_video_param(pscreen, p, PIPE_VIDEO_ENTRYPOINT_BITSTREAM, PIPE_VIDEO_CAP_SUPPORTED)) {
          vap = PipeToProfile(p);
          if (vap != VAProfileNone)
index 8b003aedaece4f9eb46e7b203703b30bf2358463..5adbe768532b2de892d5d731458d9894627ff728 100644 (file)
@@ -194,6 +194,21 @@ vlVaCreateContext(VADriverContextP ctx, VAConfigID config_id, int picture_width,
       }
    }
 
+   if (u_reduce_video_profile(context->decoder->profile) ==
+         PIPE_VIDEO_FORMAT_HEVC) {
+      context->desc.h265.pps = CALLOC_STRUCT(pipe_h265_pps);
+      if (!context->desc.h265.pps) {
+         FREE(context);
+         return VA_STATUS_ERROR_ALLOCATION_FAILED;
+      }
+      context->desc.h265.pps->sps = CALLOC_STRUCT(pipe_h265_sps);
+      if (!context->desc.h265.pps->sps) {
+         FREE(context->desc.h265.pps);
+         FREE(context);
+         return VA_STATUS_ERROR_ALLOCATION_FAILED;
+      }
+   }
+
    context->desc.base.profile = config_id;
    *context_id = handle_table_add(drv->htab, context);
 
@@ -216,6 +231,11 @@ vlVaDestroyContext(VADriverContextP ctx, VAContextID context_id)
       FREE(context->desc.h264.pps->sps);
       FREE(context->desc.h264.pps);
    }
+   if (u_reduce_video_profile(context->decoder->profile) ==
+         PIPE_VIDEO_FORMAT_HEVC) {
+      FREE(context->desc.h265.pps->sps);
+      FREE(context->desc.h265.pps);
+   }
    context->decoder->destroy(context->decoder);
    FREE(context);
    handle_table_remove(drv->htab, context_id);
index a0d530bb797698396f8fae41c0bec579377e1711..9cd496f6417fc2c6109ee54ad889459230acaab9 100644 (file)
@@ -81,6 +81,7 @@ handlePictureParameterBuffer(vlVaDriver *drv, vlVaContext *context, vlVaBuffer *
    VAPictureParameterBufferH264 *h264;
    VAPictureParameterBufferVC1 * vc1;
    VAPictureParameterBufferMPEG4 *mpeg4;
+   VAPictureParameterBufferHEVC *hevc;
    vlVaSurface *surf_forward;
    vlVaSurface *surf_backward;
    unsigned int i;
@@ -286,6 +287,157 @@ handlePictureParameterBuffer(vlVaDriver *drv, vlVaContext *context, vlVaBuffer *
 
       break;
 
+  case PIPE_VIDEO_FORMAT_HEVC:
+      assert(buf->size >= sizeof(VAPictureParameterBufferHEVC) && buf->num_elements == 1);
+      hevc = buf->data;
+      context->desc.h265.pps->sps->chroma_format_idc = hevc->pic_fields.bits.chroma_format_idc;
+      context->desc.h265.pps->sps->separate_colour_plane_flag =
+         hevc->pic_fields.bits.separate_colour_plane_flag;
+      context->desc.h265.pps->sps->pic_width_in_luma_samples = hevc->pic_width_in_luma_samples;
+      context->desc.h265.pps->sps->pic_height_in_luma_samples = hevc->pic_height_in_luma_samples;
+      context->desc.h265.pps->sps->bit_depth_luma_minus8 = hevc->bit_depth_luma_minus8;
+      context->desc.h265.pps->sps->bit_depth_chroma_minus8 = hevc->bit_depth_chroma_minus8;
+      context->desc.h265.pps->sps->log2_max_pic_order_cnt_lsb_minus4 =
+         hevc->log2_max_pic_order_cnt_lsb_minus4;
+      context->desc.h265.pps->sps->sps_max_dec_pic_buffering_minus1 =
+         hevc->sps_max_dec_pic_buffering_minus1;
+      context->desc.h265.pps->sps->log2_min_luma_coding_block_size_minus3 =
+         hevc->log2_min_luma_coding_block_size_minus3;
+      context->desc.h265.pps->sps->log2_diff_max_min_luma_coding_block_size =
+         hevc->log2_diff_max_min_luma_coding_block_size;
+      context->desc.h265.pps->sps->log2_min_transform_block_size_minus2 =
+         hevc->log2_min_transform_block_size_minus2;
+      context->desc.h265.pps->sps->log2_diff_max_min_transform_block_size =
+         hevc->log2_diff_max_min_transform_block_size;
+      context->desc.h265.pps->sps->max_transform_hierarchy_depth_inter =
+         hevc->max_transform_hierarchy_depth_inter;
+      context->desc.h265.pps->sps->max_transform_hierarchy_depth_intra =
+         hevc->max_transform_hierarchy_depth_intra;
+      context->desc.h265.pps->sps->scaling_list_enabled_flag =
+         hevc->pic_fields.bits.scaling_list_enabled_flag;
+      context->desc.h265.pps->sps->amp_enabled_flag = hevc->pic_fields.bits.amp_enabled_flag;
+      context->desc.h265.pps->sps->sample_adaptive_offset_enabled_flag =
+         hevc->slice_parsing_fields.bits.sample_adaptive_offset_enabled_flag;
+      context->desc.h265.pps->sps->pcm_enabled_flag = hevc->pic_fields.bits.pcm_enabled_flag;
+      if (hevc->pic_fields.bits.pcm_enabled_flag == 1) {
+         context->desc.h265.pps->sps->pcm_sample_bit_depth_luma_minus1 =
+            hevc->pcm_sample_bit_depth_luma_minus1;
+         context->desc.h265.pps->sps->pcm_sample_bit_depth_chroma_minus1 =
+            hevc->pcm_sample_bit_depth_chroma_minus1;
+         context->desc.h265.pps->sps->log2_min_pcm_luma_coding_block_size_minus3 =
+            hevc->log2_min_pcm_luma_coding_block_size_minus3;
+         context->desc.h265.pps->sps->log2_diff_max_min_pcm_luma_coding_block_size =
+            hevc->log2_diff_max_min_pcm_luma_coding_block_size;
+         context->desc.h265.pps->sps->pcm_loop_filter_disabled_flag =
+            hevc->pic_fields.bits.pcm_loop_filter_disabled_flag;
+      }
+      context->desc.h265.pps->sps->num_short_term_ref_pic_sets = hevc->num_short_term_ref_pic_sets;
+      context->desc.h265.pps->sps->long_term_ref_pics_present_flag =
+         hevc->slice_parsing_fields.bits.long_term_ref_pics_present_flag;
+      context->desc.h265.pps->sps->num_long_term_ref_pics_sps = hevc->num_long_term_ref_pic_sps;
+      context->desc.h265.pps->sps->sps_temporal_mvp_enabled_flag =
+         hevc->slice_parsing_fields.bits.sps_temporal_mvp_enabled_flag;
+      context->desc.h265.pps->sps->strong_intra_smoothing_enabled_flag =
+         hevc->pic_fields.bits.strong_intra_smoothing_enabled_flag;
+
+      context->desc.h265.pps->dependent_slice_segments_enabled_flag =
+         hevc->slice_parsing_fields.bits.dependent_slice_segments_enabled_flag;
+      context->desc.h265.pps->output_flag_present_flag =
+         hevc->slice_parsing_fields.bits.output_flag_present_flag;
+      context->desc.h265.pps->num_extra_slice_header_bits = hevc->num_extra_slice_header_bits;
+      context->desc.h265.pps->sign_data_hiding_enabled_flag =
+         hevc->pic_fields.bits.sign_data_hiding_enabled_flag;
+      context->desc.h265.pps->cabac_init_present_flag =
+         hevc->slice_parsing_fields.bits.cabac_init_present_flag;
+      context->desc.h265.pps->num_ref_idx_l0_default_active_minus1 =
+         hevc->num_ref_idx_l0_default_active_minus1;
+      context->desc.h265.pps->num_ref_idx_l1_default_active_minus1 =
+         hevc->num_ref_idx_l1_default_active_minus1;
+      context->desc.h265.pps->init_qp_minus26 = hevc->init_qp_minus26;
+      context->desc.h265.pps->constrained_intra_pred_flag =
+         hevc->pic_fields.bits.constrained_intra_pred_flag;
+      context->desc.h265.pps->transform_skip_enabled_flag =
+         hevc->pic_fields.bits.transform_skip_enabled_flag;
+      context->desc.h265.pps->cu_qp_delta_enabled_flag =
+         hevc->pic_fields.bits.cu_qp_delta_enabled_flag;
+      context->desc.h265.pps->diff_cu_qp_delta_depth = hevc->diff_cu_qp_delta_depth;
+      context->desc.h265.pps->pps_cb_qp_offset = hevc->pps_cb_qp_offset;
+      context->desc.h265.pps->pps_cr_qp_offset = hevc->pps_cr_qp_offset;
+      context->desc.h265.pps->pps_slice_chroma_qp_offsets_present_flag =
+         hevc->slice_parsing_fields.bits.pps_slice_chroma_qp_offsets_present_flag;
+      context->desc.h265.pps->weighted_pred_flag = hevc->pic_fields.bits.weighted_pred_flag;
+      context->desc.h265.pps->weighted_bipred_flag = hevc->pic_fields.bits.weighted_bipred_flag;
+      context->desc.h265.pps->transquant_bypass_enabled_flag =
+         hevc->pic_fields.bits.transquant_bypass_enabled_flag;
+      context->desc.h265.pps->tiles_enabled_flag = hevc->pic_fields.bits.tiles_enabled_flag;
+      context->desc.h265.pps->entropy_coding_sync_enabled_flag =
+         hevc->pic_fields.bits.entropy_coding_sync_enabled_flag;
+      if (hevc->pic_fields.bits.tiles_enabled_flag == 1) {
+         context->desc.h265.pps->num_tile_columns_minus1 = hevc->num_tile_columns_minus1;
+         context->desc.h265.pps->num_tile_rows_minus1 = hevc->num_tile_rows_minus1;
+         for (i = 0 ; i < 19 ; i++)
+            context->desc.h265.pps->column_width_minus1[i] = hevc->column_width_minus1[i];
+         for (i = 0 ; i < 21 ; i++)
+            context->desc.h265.pps->row_height_minus1[i] = hevc->row_height_minus1[i];
+         context->desc.h265.pps->loop_filter_across_tiles_enabled_flag =
+            hevc->pic_fields.bits.loop_filter_across_tiles_enabled_flag;
+      }
+      context->desc.h265.pps->pps_loop_filter_across_slices_enabled_flag =
+         hevc->pic_fields.bits.pps_loop_filter_across_slices_enabled_flag;
+      context->desc.h265.pps->deblocking_filter_override_enabled_flag =
+         hevc->slice_parsing_fields.bits.deblocking_filter_override_enabled_flag;
+      context->desc.h265.pps->pps_deblocking_filter_disabled_flag =
+         hevc->slice_parsing_fields.bits.pps_disable_deblocking_filter_flag;
+      context->desc.h265.pps->pps_beta_offset_div2 = hevc->pps_beta_offset_div2;
+      context->desc.h265.pps->pps_tc_offset_div2 = hevc->pps_tc_offset_div2;
+      context->desc.h265.pps->lists_modification_present_flag =
+         hevc->slice_parsing_fields.bits.lists_modification_present_flag;
+      context->desc.h265.pps->log2_parallel_merge_level_minus2 =
+         hevc->log2_parallel_merge_level_minus2;
+      context->desc.h265.pps->slice_segment_header_extension_present_flag =
+         hevc->slice_parsing_fields.bits.slice_segment_header_extension_present_flag;
+
+      context->desc.h265.IDRPicFlag = hevc->slice_parsing_fields.bits.IdrPicFlag;
+      context->desc.h265.RAPPicFlag = hevc->slice_parsing_fields.bits.RapPicFlag;
+
+      context->desc.h265.CurrPicOrderCntVal = hevc->CurrPic.pic_order_cnt;
+
+      for (i = 0 ; i < 8 ; i++) {
+         context->desc.h265.RefPicSetStCurrBefore[i] = 0xFF;
+         context->desc.h265.RefPicSetStCurrAfter[i] = 0xFF;
+         context->desc.h265.RefPicSetLtCurr[i] = 0xFF;
+      }
+      context->desc.h265.NumPocStCurrBefore = 0;
+      context->desc.h265.NumPocStCurrAfter = 0;
+      context->desc.h265.NumPocLtCurr = 0;
+      unsigned int iBefore = 0;
+      unsigned int iAfter = 0;
+      unsigned int iCurr = 0;
+      for (i = 0 ; i < 15 ; i++) {
+         context->desc.h265.PicOrderCntVal[i] = hevc->ReferenceFrames[i].pic_order_cnt;
+
+         unsigned int index = hevc->ReferenceFrames[i].picture_id & 0x7F;
+
+         if (index == 0x7F)
+            continue;
+
+         getReferenceFrame(drv, hevc->ReferenceFrames[i].picture_id, &context->desc.h265.ref[i]);
+
+         if ((hevc->ReferenceFrames[i].flags & VA_PICTURE_HEVC_RPS_ST_CURR_BEFORE) && (iBefore < 8)) {
+            context->desc.h265.RefPicSetStCurrBefore[iBefore++] = i;
+            context->desc.h265.NumPocStCurrBefore++;
+         }
+         if ((hevc->ReferenceFrames[i].flags & VA_PICTURE_HEVC_RPS_ST_CURR_AFTER) && (iAfter < 8)) {
+            context->desc.h265.RefPicSetStCurrAfter[iAfter++] = i;
+            context->desc.h265.NumPocStCurrAfter++;
+         }
+         if ((hevc->ReferenceFrames[i].flags & VA_PICTURE_HEVC_RPS_LT_CURR) && (iCurr < 8)) {
+            context->desc.h265.RefPicSetLtCurr[iCurr++] = i;
+            context->desc.h265.NumPocLtCurr++;
+         }
+      }
+      break;
+
    default:
       break;
    }
@@ -297,6 +449,7 @@ handleIQMatrixBuffer(vlVaContext *context, vlVaBuffer *buf)
    VAIQMatrixBufferMPEG2 *mpeg2;
    VAIQMatrixBufferH264 *h264;
    VAIQMatrixBufferMPEG4 *mpeg4;
+   VAIQMatrixBufferHEVC *h265;
 
    switch (u_reduce_video_profile(context->decoder->profile)) {
    case PIPE_VIDEO_FORMAT_MPEG12:
@@ -320,6 +473,17 @@ handleIQMatrixBuffer(vlVaContext *context, vlVaBuffer *buf)
       memcpy(&context->desc.h264.pps->ScalingList8x8, h264->ScalingList8x8, 2 * 64);
       break;
 
+   case PIPE_VIDEO_FORMAT_HEVC:
+      assert(buf->size >= sizeof(VAIQMatrixBufferH264) && buf->num_elements == 1);
+      h265 = buf->data;
+      memcpy(&context->desc.h265.pps->sps->ScalingList4x4, h265->ScalingList4x4, 6 * 16);
+      memcpy(&context->desc.h265.pps->sps->ScalingList8x8, h265->ScalingList8x8, 6 * 64);
+      memcpy(&context->desc.h265.pps->sps->ScalingList16x16, h265->ScalingList16x16, 6 * 64);
+      memcpy(&context->desc.h265.pps->sps->ScalingList32x32, h265->ScalingList32x32, 2 * 64);
+      memcpy(&context->desc.h265.pps->sps->ScalingListDCCoeff16x16, h265->ScalingListDC16x16, 6);
+      memcpy(&context->desc.h265.pps->sps->ScalingListDCCoeff32x32, h265->ScalingListDC32x32, 2);
+      break;
+
    case PIPE_VIDEO_FORMAT_MPEG4:
       assert(buf->size >= sizeof(VAIQMatrixBufferMPEG4) && buf->num_elements == 1);
       mpeg4 = buf->data;
@@ -345,6 +509,7 @@ handleSliceParameterBuffer(vlVaContext *context, vlVaBuffer *buf)
 {
    VASliceParameterBufferH264 *h264;
    VASliceParameterBufferMPEG4 *mpeg4;
+   VASliceParameterBufferHEVC *h265;
 
    switch (u_reduce_video_profile(context->decoder->profile)) {
    case PIPE_VIDEO_FORMAT_MPEG4_AVC:
@@ -361,6 +526,15 @@ handleSliceParameterBuffer(vlVaContext *context, vlVaBuffer *buf)
 
       context->mpeg4.quant_scale = mpeg4->quant_scale;
       break;
+   case PIPE_VIDEO_FORMAT_HEVC:
+      assert(buf->size >= sizeof(VASliceParameterBufferHEVC) && buf->num_elements == 1);
+      h265 = buf->data;
+      for (int i = 0 ; i < 2 ; i++) {
+         for (int j = 0 ; j < 15 ; j++)
+            context->desc.h265.RefPicList[i][j] = h265->RefPicList[i][j];
+      }
+      context->desc.h265.UseRefPicList = true;
+      break;
    default:
       break;
    }
@@ -483,6 +657,7 @@ handleVASliceDataBufferType(vlVaContext *context, vlVaBuffer *buf)
    void * const *buffers[2];
    unsigned sizes[2];
    static const uint8_t start_code_h264[] = { 0x00, 0x00, 0x01 };
+   static const uint8_t start_code_h265[] = { 0x00, 0x00, 0x01 };
    static const uint8_t start_code_vc1[] = { 0x00, 0x00, 0x01, 0x0d };
 
    format = u_reduce_video_profile(context->decoder->profile);
@@ -494,6 +669,13 @@ handleVASliceDataBufferType(vlVaContext *context, vlVaBuffer *buf)
          buffers[num_buffers] = (void *const)&start_code_h264;
          sizes[num_buffers++] = sizeof(start_code_h264);
       break;
+   case PIPE_VIDEO_FORMAT_HEVC:
+      if (bufHasStartcode(buf, 0x000001, 24))
+         break;
+
+         buffers[num_buffers] = (void *const)&start_code_h265;
+         sizes[num_buffers++] = sizeof(start_code_h265);
+         break;
    case PIPE_VIDEO_FORMAT_VC1:
       if (bufHasStartcode(buf, 0x0000010d, 32) ||
           bufHasStartcode(buf, 0x0000010c, 32) ||
index 1ea7be79aa3fb9cc9815bc329ebbb84f1b11b1c0..93af1be19a7fc96e13442c5773d1938808ee0561 100644 (file)
@@ -112,6 +112,8 @@ PipeToProfile(enum pipe_video_profile profile)
       return VAProfileH264High;
    case PIPE_VIDEO_PROFILE_MPEG4_AVC_EXTENDED:
        return VAProfileNone;
+   case PIPE_VIDEO_PROFILE_HEVC_MAIN:
+      return VAProfileHEVCMain;
    default:
       assert(0);
       return -1;
@@ -142,6 +144,8 @@ ProfileToPipe(VAProfile profile)
       return PIPE_VIDEO_PROFILE_MPEG4_AVC_MAIN;
    case VAProfileH264High:
       return PIPE_VIDEO_PROFILE_MPEG4_AVC_HIGH;
+   case VAProfileHEVCMain:
+      return PIPE_VIDEO_PROFILE_HEVC_MAIN;
    default:
       return PIPE_VIDEO_PROFILE_UNKNOWN;
    }
@@ -174,6 +178,7 @@ typedef struct {
       struct pipe_mpeg4_picture_desc mpeg4;
       struct pipe_vc1_picture_desc vc1;
       struct pipe_h264_picture_desc h264;
+      struct pipe_h265_picture_desc h265;
    } desc;
 
    struct {