yading@10: /* yading@10: * Video Decode and Presentation API for UNIX (VDPAU) is used for yading@10: * HW decode acceleration for MPEG-1/2, MPEG-4 ASP, H.264 and VC-1. yading@10: * yading@10: * Copyright (c) 2008 NVIDIA yading@10: * yading@10: * This file is part of FFmpeg. yading@10: * yading@10: * FFmpeg is free software; you can redistribute it and/or yading@10: * modify it under the terms of the GNU Lesser General Public yading@10: * License as published by the Free Software Foundation; either yading@10: * version 2.1 of the License, or (at your option) any later version. yading@10: * yading@10: * FFmpeg is distributed in the hope that it will be useful, yading@10: * but WITHOUT ANY WARRANTY; without even the implied warranty of yading@10: * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU yading@10: * Lesser General Public License for more details. yading@10: * yading@10: * You should have received a copy of the GNU Lesser General Public yading@10: * License along with FFmpeg; if not, write to the Free Software yading@10: * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA yading@10: */ yading@10: yading@10: #include yading@10: #include "avcodec.h" yading@10: #include "h264.h" yading@10: #include "vc1.h" yading@10: yading@10: #undef NDEBUG yading@10: #include yading@10: yading@10: #include "vdpau.h" yading@10: #include "vdpau_internal.h" yading@10: yading@10: /** yading@10: * @addtogroup VDPAU_Decoding yading@10: * yading@10: * @{ yading@10: */ yading@10: yading@10: int ff_vdpau_common_start_frame(AVCodecContext *avctx, yading@10: av_unused const uint8_t *buffer, yading@10: av_unused uint32_t size) yading@10: { yading@10: AVVDPAUContext *hwctx = avctx->hwaccel_context; yading@10: yading@10: hwctx->bitstream_buffers_used = 0; yading@10: return 0; yading@10: } yading@10: yading@10: #if CONFIG_H263_VDPAU_HWACCEL || CONFIG_MPEG1_VDPAU_HWACCEL || \ yading@10: CONFIG_MPEG2_VDPAU_HWACCEL || CONFIG_MPEG4_VDPAU_HWACCEL || \ yading@10: CONFIG_VC1_VDPAU_HWACCEL || CONFIG_WMV3_VDPAU_HWACCEL yading@10: int ff_vdpau_mpeg_end_frame(AVCodecContext *avctx) yading@10: { yading@10: AVVDPAUContext *hwctx = avctx->hwaccel_context; yading@10: MpegEncContext *s = avctx->priv_data; yading@10: VdpVideoSurface surf = ff_vdpau_get_surface_id(s->current_picture_ptr); yading@10: yading@10: hwctx->render(hwctx->decoder, surf, (void *)&hwctx->info, yading@10: hwctx->bitstream_buffers_used, hwctx->bitstream_buffers); yading@10: yading@10: ff_mpeg_draw_horiz_band(s, 0, s->avctx->height); yading@10: hwctx->bitstream_buffers_used = 0; yading@10: yading@10: return 0; yading@10: } yading@10: #endif yading@10: yading@10: int ff_vdpau_add_buffer(AVCodecContext *avctx, yading@10: const uint8_t *buf, uint32_t size) yading@10: { yading@10: AVVDPAUContext *hwctx = avctx->hwaccel_context; yading@10: VdpBitstreamBuffer *buffers = hwctx->bitstream_buffers; yading@10: yading@10: buffers = av_fast_realloc(buffers, &hwctx->bitstream_buffers_allocated, yading@10: (hwctx->bitstream_buffers_used + 1) * sizeof(*buffers)); yading@10: if (!buffers) yading@10: return AVERROR(ENOMEM); yading@10: yading@10: hwctx->bitstream_buffers = buffers; yading@10: buffers += hwctx->bitstream_buffers_used++; yading@10: yading@10: buffers->struct_version = VDP_BITSTREAM_BUFFER_VERSION; yading@10: buffers->bitstream = buf; yading@10: buffers->bitstream_bytes = size; yading@10: return 0; yading@10: } yading@10: yading@10: /* Obsolete non-hwaccel VDPAU support below... */ yading@10: yading@10: void ff_vdpau_h264_set_reference_frames(H264Context *h) yading@10: { yading@10: struct vdpau_render_state *render, *render_ref; yading@10: VdpReferenceFrameH264 *rf, *rf2; yading@10: Picture *pic; yading@10: int i, list, pic_frame_idx; yading@10: yading@10: render = (struct vdpau_render_state *)h->cur_pic_ptr->f.data[0]; yading@10: assert(render); yading@10: yading@10: rf = &render->info.h264.referenceFrames[0]; yading@10: #define H264_RF_COUNT FF_ARRAY_ELEMS(render->info.h264.referenceFrames) yading@10: yading@10: for (list = 0; list < 2; ++list) { yading@10: Picture **lp = list ? h->long_ref : h->short_ref; yading@10: int ls = list ? 16 : h->short_ref_count; yading@10: yading@10: for (i = 0; i < ls; ++i) { yading@10: pic = lp[i]; yading@10: if (!pic || !pic->reference) yading@10: continue; yading@10: pic_frame_idx = pic->long_ref ? pic->pic_id : pic->frame_num; yading@10: yading@10: render_ref = (struct vdpau_render_state *)pic->f.data[0]; yading@10: assert(render_ref); yading@10: yading@10: rf2 = &render->info.h264.referenceFrames[0]; yading@10: while (rf2 != rf) { yading@10: if ( yading@10: (rf2->surface == render_ref->surface) yading@10: && (rf2->is_long_term == pic->long_ref) yading@10: && (rf2->frame_idx == pic_frame_idx) yading@10: ) yading@10: break; yading@10: ++rf2; yading@10: } yading@10: if (rf2 != rf) { yading@10: rf2->top_is_reference |= (pic->reference & PICT_TOP_FIELD) ? VDP_TRUE : VDP_FALSE; yading@10: rf2->bottom_is_reference |= (pic->reference & PICT_BOTTOM_FIELD) ? VDP_TRUE : VDP_FALSE; yading@10: continue; yading@10: } yading@10: yading@10: if (rf >= &render->info.h264.referenceFrames[H264_RF_COUNT]) yading@10: continue; yading@10: yading@10: rf->surface = render_ref->surface; yading@10: rf->is_long_term = pic->long_ref; yading@10: rf->top_is_reference = (pic->reference & PICT_TOP_FIELD) ? VDP_TRUE : VDP_FALSE; yading@10: rf->bottom_is_reference = (pic->reference & PICT_BOTTOM_FIELD) ? VDP_TRUE : VDP_FALSE; yading@10: rf->field_order_cnt[0] = pic->field_poc[0]; yading@10: rf->field_order_cnt[1] = pic->field_poc[1]; yading@10: rf->frame_idx = pic_frame_idx; yading@10: yading@10: ++rf; yading@10: } yading@10: } yading@10: yading@10: for (; rf < &render->info.h264.referenceFrames[H264_RF_COUNT]; ++rf) { yading@10: rf->surface = VDP_INVALID_HANDLE; yading@10: rf->is_long_term = 0; yading@10: rf->top_is_reference = 0; yading@10: rf->bottom_is_reference = 0; yading@10: rf->field_order_cnt[0] = 0; yading@10: rf->field_order_cnt[1] = 0; yading@10: rf->frame_idx = 0; yading@10: } yading@10: } yading@10: yading@10: void ff_vdpau_add_data_chunk(uint8_t *data, const uint8_t *buf, int buf_size) yading@10: { yading@10: struct vdpau_render_state *render = (struct vdpau_render_state*)data; yading@10: assert(render); yading@10: yading@10: render->bitstream_buffers= av_fast_realloc( yading@10: render->bitstream_buffers, yading@10: &render->bitstream_buffers_allocated, yading@10: sizeof(*render->bitstream_buffers)*(render->bitstream_buffers_used + 1) yading@10: ); yading@10: yading@10: render->bitstream_buffers[render->bitstream_buffers_used].struct_version = VDP_BITSTREAM_BUFFER_VERSION; yading@10: render->bitstream_buffers[render->bitstream_buffers_used].bitstream = buf; yading@10: render->bitstream_buffers[render->bitstream_buffers_used].bitstream_bytes = buf_size; yading@10: render->bitstream_buffers_used++; yading@10: } yading@10: yading@10: #if CONFIG_H264_VDPAU_DECODER yading@10: void ff_vdpau_h264_picture_start(H264Context *h) yading@10: { yading@10: struct vdpau_render_state *render; yading@10: int i; yading@10: yading@10: render = (struct vdpau_render_state *)h->cur_pic_ptr->f.data[0]; yading@10: assert(render); yading@10: yading@10: for (i = 0; i < 2; ++i) { yading@10: int foc = h->cur_pic_ptr->field_poc[i]; yading@10: if (foc == INT_MAX) yading@10: foc = 0; yading@10: render->info.h264.field_order_cnt[i] = foc; yading@10: } yading@10: yading@10: render->info.h264.frame_num = h->frame_num; yading@10: } yading@10: yading@10: void ff_vdpau_h264_picture_complete(H264Context *h) yading@10: { yading@10: struct vdpau_render_state *render; yading@10: yading@10: render = (struct vdpau_render_state *)h->cur_pic_ptr->f.data[0]; yading@10: assert(render); yading@10: yading@10: render->info.h264.slice_count = h->slice_num; yading@10: if (render->info.h264.slice_count < 1) yading@10: return; yading@10: yading@10: render->info.h264.is_reference = (h->cur_pic_ptr->reference & 3) ? VDP_TRUE : VDP_FALSE; yading@10: render->info.h264.field_pic_flag = h->picture_structure != PICT_FRAME; yading@10: render->info.h264.bottom_field_flag = h->picture_structure == PICT_BOTTOM_FIELD; yading@10: render->info.h264.num_ref_frames = h->sps.ref_frame_count; yading@10: render->info.h264.mb_adaptive_frame_field_flag = h->sps.mb_aff && !render->info.h264.field_pic_flag; yading@10: render->info.h264.constrained_intra_pred_flag = h->pps.constrained_intra_pred; yading@10: render->info.h264.weighted_pred_flag = h->pps.weighted_pred; yading@10: render->info.h264.weighted_bipred_idc = h->pps.weighted_bipred_idc; yading@10: render->info.h264.frame_mbs_only_flag = h->sps.frame_mbs_only_flag; yading@10: render->info.h264.transform_8x8_mode_flag = h->pps.transform_8x8_mode; yading@10: render->info.h264.chroma_qp_index_offset = h->pps.chroma_qp_index_offset[0]; yading@10: render->info.h264.second_chroma_qp_index_offset = h->pps.chroma_qp_index_offset[1]; yading@10: render->info.h264.pic_init_qp_minus26 = h->pps.init_qp - 26; yading@10: render->info.h264.num_ref_idx_l0_active_minus1 = h->pps.ref_count[0] - 1; yading@10: render->info.h264.num_ref_idx_l1_active_minus1 = h->pps.ref_count[1] - 1; yading@10: render->info.h264.log2_max_frame_num_minus4 = h->sps.log2_max_frame_num - 4; yading@10: render->info.h264.pic_order_cnt_type = h->sps.poc_type; yading@10: render->info.h264.log2_max_pic_order_cnt_lsb_minus4 = h->sps.poc_type ? 0 : h->sps.log2_max_poc_lsb - 4; yading@10: render->info.h264.delta_pic_order_always_zero_flag = h->sps.delta_pic_order_always_zero_flag; yading@10: render->info.h264.direct_8x8_inference_flag = h->sps.direct_8x8_inference_flag; yading@10: render->info.h264.entropy_coding_mode_flag = h->pps.cabac; yading@10: render->info.h264.pic_order_present_flag = h->pps.pic_order_present; yading@10: render->info.h264.deblocking_filter_control_present_flag = h->pps.deblocking_filter_parameters_present; yading@10: render->info.h264.redundant_pic_cnt_present_flag = h->pps.redundant_pic_cnt_present; yading@10: memcpy(render->info.h264.scaling_lists_4x4, h->pps.scaling_matrix4, sizeof(render->info.h264.scaling_lists_4x4)); yading@10: memcpy(render->info.h264.scaling_lists_8x8[0], h->pps.scaling_matrix8[0], sizeof(render->info.h264.scaling_lists_8x8[0])); yading@10: memcpy(render->info.h264.scaling_lists_8x8[1], h->pps.scaling_matrix8[3], sizeof(render->info.h264.scaling_lists_8x8[0])); yading@10: yading@10: ff_h264_draw_horiz_band(h, 0, h->avctx->height); yading@10: render->bitstream_buffers_used = 0; yading@10: } yading@10: #endif /* CONFIG_H264_VDPAU_DECODER */ yading@10: yading@10: #if CONFIG_MPEG_VDPAU_DECODER || CONFIG_MPEG1_VDPAU_DECODER yading@10: void ff_vdpau_mpeg_picture_complete(MpegEncContext *s, const uint8_t *buf, yading@10: int buf_size, int slice_count) yading@10: { yading@10: struct vdpau_render_state *render, *last, *next; yading@10: int i; yading@10: yading@10: if (!s->current_picture_ptr) return; yading@10: yading@10: render = (struct vdpau_render_state *)s->current_picture_ptr->f.data[0]; yading@10: assert(render); yading@10: yading@10: /* fill VdpPictureInfoMPEG1Or2 struct */ yading@10: render->info.mpeg.picture_structure = s->picture_structure; yading@10: render->info.mpeg.picture_coding_type = s->pict_type; yading@10: render->info.mpeg.intra_dc_precision = s->intra_dc_precision; yading@10: render->info.mpeg.frame_pred_frame_dct = s->frame_pred_frame_dct; yading@10: render->info.mpeg.concealment_motion_vectors = s->concealment_motion_vectors; yading@10: render->info.mpeg.intra_vlc_format = s->intra_vlc_format; yading@10: render->info.mpeg.alternate_scan = s->alternate_scan; yading@10: render->info.mpeg.q_scale_type = s->q_scale_type; yading@10: render->info.mpeg.top_field_first = s->top_field_first; yading@10: render->info.mpeg.full_pel_forward_vector = s->full_pel[0]; // MPEG-1 only. Set 0 for MPEG-2 yading@10: render->info.mpeg.full_pel_backward_vector = s->full_pel[1]; // MPEG-1 only. Set 0 for MPEG-2 yading@10: render->info.mpeg.f_code[0][0] = s->mpeg_f_code[0][0]; // For MPEG-1 fill both horiz. & vert. yading@10: render->info.mpeg.f_code[0][1] = s->mpeg_f_code[0][1]; yading@10: render->info.mpeg.f_code[1][0] = s->mpeg_f_code[1][0]; yading@10: render->info.mpeg.f_code[1][1] = s->mpeg_f_code[1][1]; yading@10: for (i = 0; i < 64; ++i) { yading@10: render->info.mpeg.intra_quantizer_matrix[i] = s->intra_matrix[i]; yading@10: render->info.mpeg.non_intra_quantizer_matrix[i] = s->inter_matrix[i]; yading@10: } yading@10: yading@10: render->info.mpeg.forward_reference = VDP_INVALID_HANDLE; yading@10: render->info.mpeg.backward_reference = VDP_INVALID_HANDLE; yading@10: yading@10: switch(s->pict_type){ yading@10: case AV_PICTURE_TYPE_B: yading@10: next = (struct vdpau_render_state *)s->next_picture.f.data[0]; yading@10: assert(next); yading@10: render->info.mpeg.backward_reference = next->surface; yading@10: // no return here, going to set forward prediction yading@10: case AV_PICTURE_TYPE_P: yading@10: last = (struct vdpau_render_state *)s->last_picture.f.data[0]; yading@10: if (!last) // FIXME: Does this test make sense? yading@10: last = render; // predict second field from the first yading@10: render->info.mpeg.forward_reference = last->surface; yading@10: } yading@10: yading@10: ff_vdpau_add_data_chunk(s->current_picture_ptr->f.data[0], buf, buf_size); yading@10: yading@10: render->info.mpeg.slice_count = slice_count; yading@10: yading@10: if (slice_count) yading@10: ff_mpeg_draw_horiz_band(s, 0, s->avctx->height); yading@10: render->bitstream_buffers_used = 0; yading@10: } yading@10: #endif /* CONFIG_MPEG_VDPAU_DECODER || CONFIG_MPEG1_VDPAU_DECODER */ yading@10: yading@10: #if CONFIG_VC1_VDPAU_DECODER yading@10: void ff_vdpau_vc1_decode_picture(MpegEncContext *s, const uint8_t *buf, yading@10: int buf_size) yading@10: { yading@10: VC1Context *v = s->avctx->priv_data; yading@10: struct vdpau_render_state *render, *last, *next; yading@10: yading@10: render = (struct vdpau_render_state *)s->current_picture.f.data[0]; yading@10: assert(render); yading@10: yading@10: /* fill LvPictureInfoVC1 struct */ yading@10: render->info.vc1.frame_coding_mode = v->fcm; yading@10: render->info.vc1.postprocflag = v->postprocflag; yading@10: render->info.vc1.pulldown = v->broadcast; yading@10: render->info.vc1.interlace = v->interlace; yading@10: render->info.vc1.tfcntrflag = v->tfcntrflag; yading@10: render->info.vc1.finterpflag = v->finterpflag; yading@10: render->info.vc1.psf = v->psf; yading@10: render->info.vc1.dquant = v->dquant; yading@10: render->info.vc1.panscan_flag = v->panscanflag; yading@10: render->info.vc1.refdist_flag = v->refdist_flag; yading@10: render->info.vc1.quantizer = v->quantizer_mode; yading@10: render->info.vc1.extended_mv = v->extended_mv; yading@10: render->info.vc1.extended_dmv = v->extended_dmv; yading@10: render->info.vc1.overlap = v->overlap; yading@10: render->info.vc1.vstransform = v->vstransform; yading@10: render->info.vc1.loopfilter = v->s.loop_filter; yading@10: render->info.vc1.fastuvmc = v->fastuvmc; yading@10: render->info.vc1.range_mapy_flag = v->range_mapy_flag; yading@10: render->info.vc1.range_mapy = v->range_mapy; yading@10: render->info.vc1.range_mapuv_flag = v->range_mapuv_flag; yading@10: render->info.vc1.range_mapuv = v->range_mapuv; yading@10: /* Specific to simple/main profile only */ yading@10: render->info.vc1.multires = v->multires; yading@10: render->info.vc1.syncmarker = v->s.resync_marker; yading@10: render->info.vc1.rangered = v->rangered | (v->rangeredfrm << 1); yading@10: render->info.vc1.maxbframes = v->s.max_b_frames; yading@10: yading@10: render->info.vc1.deblockEnable = v->postprocflag & 1; yading@10: render->info.vc1.pquant = v->pq; yading@10: yading@10: render->info.vc1.forward_reference = VDP_INVALID_HANDLE; yading@10: render->info.vc1.backward_reference = VDP_INVALID_HANDLE; yading@10: yading@10: if (v->bi_type) yading@10: render->info.vc1.picture_type = 4; yading@10: else yading@10: render->info.vc1.picture_type = s->pict_type - 1 + s->pict_type / 3; yading@10: yading@10: switch(s->pict_type){ yading@10: case AV_PICTURE_TYPE_B: yading@10: next = (struct vdpau_render_state *)s->next_picture.f.data[0]; yading@10: assert(next); yading@10: render->info.vc1.backward_reference = next->surface; yading@10: // no break here, going to set forward prediction yading@10: case AV_PICTURE_TYPE_P: yading@10: last = (struct vdpau_render_state *)s->last_picture.f.data[0]; yading@10: if (!last) // FIXME: Does this test make sense? yading@10: last = render; // predict second field from the first yading@10: render->info.vc1.forward_reference = last->surface; yading@10: } yading@10: yading@10: ff_vdpau_add_data_chunk(s->current_picture_ptr->f.data[0], buf, buf_size); yading@10: yading@10: render->info.vc1.slice_count = 1; yading@10: yading@10: ff_mpeg_draw_horiz_band(s, 0, s->avctx->height); yading@10: render->bitstream_buffers_used = 0; yading@10: } yading@10: #endif /* (CONFIG_VC1_VDPAU_DECODER */ yading@10: yading@10: #if CONFIG_MPEG4_VDPAU_DECODER yading@10: void ff_vdpau_mpeg4_decode_picture(MpegEncContext *s, const uint8_t *buf, yading@10: int buf_size) yading@10: { yading@10: struct vdpau_render_state *render, *last, *next; yading@10: int i; yading@10: yading@10: if (!s->current_picture_ptr) return; yading@10: yading@10: render = (struct vdpau_render_state *)s->current_picture_ptr->f.data[0]; yading@10: assert(render); yading@10: yading@10: /* fill VdpPictureInfoMPEG4Part2 struct */ yading@10: render->info.mpeg4.trd[0] = s->pp_time; yading@10: render->info.mpeg4.trb[0] = s->pb_time; yading@10: render->info.mpeg4.trd[1] = s->pp_field_time >> 1; yading@10: render->info.mpeg4.trb[1] = s->pb_field_time >> 1; yading@10: render->info.mpeg4.vop_time_increment_resolution = s->avctx->time_base.den; yading@10: render->info.mpeg4.vop_coding_type = 0; yading@10: render->info.mpeg4.vop_fcode_forward = s->f_code; yading@10: render->info.mpeg4.vop_fcode_backward = s->b_code; yading@10: render->info.mpeg4.resync_marker_disable = !s->resync_marker; yading@10: render->info.mpeg4.interlaced = !s->progressive_sequence; yading@10: render->info.mpeg4.quant_type = s->mpeg_quant; yading@10: render->info.mpeg4.quarter_sample = s->quarter_sample; yading@10: render->info.mpeg4.short_video_header = s->avctx->codec->id == AV_CODEC_ID_H263; yading@10: render->info.mpeg4.rounding_control = s->no_rounding; yading@10: render->info.mpeg4.alternate_vertical_scan_flag = s->alternate_scan; yading@10: render->info.mpeg4.top_field_first = s->top_field_first; yading@10: for (i = 0; i < 64; ++i) { yading@10: render->info.mpeg4.intra_quantizer_matrix[i] = s->intra_matrix[i]; yading@10: render->info.mpeg4.non_intra_quantizer_matrix[i] = s->inter_matrix[i]; yading@10: } yading@10: render->info.mpeg4.forward_reference = VDP_INVALID_HANDLE; yading@10: render->info.mpeg4.backward_reference = VDP_INVALID_HANDLE; yading@10: yading@10: switch (s->pict_type) { yading@10: case AV_PICTURE_TYPE_B: yading@10: next = (struct vdpau_render_state *)s->next_picture.f.data[0]; yading@10: assert(next); yading@10: render->info.mpeg4.backward_reference = next->surface; yading@10: render->info.mpeg4.vop_coding_type = 2; yading@10: // no break here, going to set forward prediction yading@10: case AV_PICTURE_TYPE_P: yading@10: last = (struct vdpau_render_state *)s->last_picture.f.data[0]; yading@10: assert(last); yading@10: render->info.mpeg4.forward_reference = last->surface; yading@10: } yading@10: yading@10: ff_vdpau_add_data_chunk(s->current_picture_ptr->f.data[0], buf, buf_size); yading@10: yading@10: ff_mpeg_draw_horiz_band(s, 0, s->avctx->height); yading@10: render->bitstream_buffers_used = 0; yading@10: } yading@10: #endif /* CONFIG_MPEG4_VDPAU_DECODER */ yading@10: yading@10: /* @}*/