Add VDPAU hardware accelerated decoding for H264 which can be used by
[libav.git] / libavcodec / vdpauvideo.c
CommitLineData
369122dd
NC
1/*
2 * Video Decode and Presentation API for UNIX (VDPAU) is used for
3 * HW decode acceleration for MPEG-1/2, H.264 and VC-1.
4 *
5 * Copyright (c) 2008 NVIDIA.
6 *
7 * This file is part of FFmpeg.
8 *
9 * FFmpeg is free software; you can redistribute it and/or
10 * modify it under the terms of the GNU Lesser General Public
11 * License as published by the Free Software Foundation; either
12 * version 2.1 of the License, or (at your option) any later version.
13 *
14 * FFmpeg is distributed in the hope that it will be useful,
15 * but WITHOUT ANY WARRANTY; without even the implied warranty of
16 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
17 * Lesser General Public License for more details.
18 *
19 * You should have received a copy of the GNU Lesser General Public
20 * License along with FFmpeg; if not, write to the Free Software
21 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
22 */
23
24#include <limits.h>
25#include "avcodec.h"
26#include "h264.h"
27
28#undef NDEBUG
29#include <assert.h>
30
31#include "vdpau_render.h"
32#include "vdpau_internal.h"
33
34/**
35 * \addtogroup VDPAU_Decoding
36 *
37 * @{
38 */
39
40static void VDPAU_h264_set_reference_frames(H264Context *h)
41{
42 MpegEncContext * s = &h->s;
43 struct vdpau_render_state * render, * render_ref;
44 VdpReferenceFrameH264 * rf, * rf2;
45 Picture * pic;
46 int i, list, pic_frame_idx;
47
48 render = (struct vdpau_render_state*)s->current_picture_ptr->data[0];
49 assert(render);
50
51 rf = &render->info.h264.referenceFrames[0];
52#define H264_RF_COUNT FF_ARRAY_ELEMS(render->info.h264.referenceFrames)
53
54 for (list = 0; list < 2; ++list) {
55 Picture **lp = list ? h->long_ref : h->short_ref;
56 int ls = list ? h->long_ref_count : h->short_ref_count;
57
58 for (i = 0; i < ls; ++i) {
59 pic = lp[i];
60 if (!pic || !pic->reference)
61 continue;
62 pic_frame_idx = pic->long_ref ? pic->pic_id : pic->frame_num;
63
64 render_ref = (struct vdpau_render_state*)pic->data[0];
65 assert(render_ref);
66
67 rf2 = &render->info.h264.referenceFrames[0];
68 while (rf2 != rf) {
69 if (
70 (rf2->surface == render_ref->surface)
71 && (rf2->is_long_term == pic->long_ref)
72 && (rf2->frame_idx == pic_frame_idx)
73 )
74 break;
75 ++rf2;
76 }
77 if (rf2 != rf) {
78 rf2->top_is_reference |= (pic->reference & PICT_TOP_FIELD) ? VDP_TRUE : VDP_FALSE;
79 rf2->bottom_is_reference |= (pic->reference & PICT_BOTTOM_FIELD) ? VDP_TRUE : VDP_FALSE;
80 continue;
81 }
82
83 if (rf >= &render->info.h264.referenceFrames[H264_RF_COUNT])
84 continue;
85
86 rf->surface = render_ref->surface;
87 rf->is_long_term = pic->long_ref;
88 rf->top_is_reference = (pic->reference & PICT_TOP_FIELD) ? VDP_TRUE : VDP_FALSE;
89 rf->bottom_is_reference = (pic->reference & PICT_BOTTOM_FIELD) ? VDP_TRUE : VDP_FALSE;
90 rf->field_order_cnt[0] = pic->field_poc[0];
91 rf->field_order_cnt[1] = pic->field_poc[1];
92 rf->frame_idx = pic_frame_idx;
93
94 ++rf;
95 }
96 }
97
98 for (; rf < &render->info.h264.referenceFrames[H264_RF_COUNT]; ++rf) {
99 rf->surface = VDP_INVALID_HANDLE;
100 rf->is_long_term = 0;
101 rf->top_is_reference = 0;
102 rf->bottom_is_reference = 0;
103 rf->field_order_cnt[0] = 0;
104 rf->field_order_cnt[1] = 0;
105 rf->frame_idx = 0;
106 }
107}
108
109void ff_VDPAU_h264_add_data_chunk(H264Context *h, const uint8_t *buf, int buf_size)
110{
111 MpegEncContext * s = &h->s;
112 struct vdpau_render_state * render;
113
114 render = (struct vdpau_render_state*)s->current_picture_ptr->data[0];
115 assert(render);
116
117 if (!render->bitstreamBuffersUsed)
118 VDPAU_h264_set_reference_frames(h);
119
120 render->bitstreamBuffers= av_fast_realloc(
121 render->bitstreamBuffers,
122 &render->bitstreamBuffersAlloced,
123 sizeof(*render->bitstreamBuffers)*(render->bitstreamBuffersUsed + 1)
124 );
125
126 render->bitstreamBuffers[render->bitstreamBuffersUsed].struct_version = VDP_BITSTREAM_BUFFER_VERSION;
127 render->bitstreamBuffers[render->bitstreamBuffersUsed].bitstream = buf;
128 render->bitstreamBuffers[render->bitstreamBuffersUsed].bitstream_bytes = buf_size;
129 render->bitstreamBuffersUsed++;
130}
131
132void ff_VDPAU_h264_picture_complete(H264Context *h)
133{
134 MpegEncContext * s = &h->s;
135 struct vdpau_render_state * render;
136
137 render = (struct vdpau_render_state*)s->current_picture_ptr->data[0];
138 assert(render);
139
140 render->info.h264.slice_count = h->slice_num;
141 if (render->info.h264.slice_count < 1)
142 return;
143
144 for (int i = 0; i < 2; ++i) {
145 int foc = s->current_picture_ptr->field_poc[i];
146 if (foc == INT_MAX)
147 foc = 0;
148 render->info.h264.field_order_cnt[i] = foc;
149 }
150
151 render->info.h264.is_reference = s->current_picture_ptr->reference ? VDP_TRUE : VDP_FALSE;
152 render->info.h264.frame_num = h->frame_num;
153 render->info.h264.field_pic_flag = s->picture_structure != PICT_FRAME;
154 render->info.h264.bottom_field_flag = s->picture_structure == PICT_BOTTOM_FIELD;
155 render->info.h264.num_ref_frames = h->sps.ref_frame_count;
156 render->info.h264.mb_adaptive_frame_field_flag = h->sps.mb_aff;
157 render->info.h264.constrained_intra_pred_flag = h->pps.constrained_intra_pred;
158 render->info.h264.weighted_pred_flag = h->pps.weighted_pred;
159 render->info.h264.weighted_bipred_idc = h->pps.weighted_bipred_idc;
160 render->info.h264.frame_mbs_only_flag = h->sps.frame_mbs_only_flag;
161 render->info.h264.transform_8x8_mode_flag = h->pps.transform_8x8_mode;
162 render->info.h264.chroma_qp_index_offset = h->pps.chroma_qp_index_offset[0];
163 render->info.h264.second_chroma_qp_index_offset = h->pps.chroma_qp_index_offset[1];
164 render->info.h264.pic_init_qp_minus26 = h->pps.init_qp - 26;
165 render->info.h264.num_ref_idx_l0_active_minus1 = h->pps.ref_count[0] - 1;
166 render->info.h264.num_ref_idx_l1_active_minus1 = h->pps.ref_count[1] - 1;
167 render->info.h264.log2_max_frame_num_minus4 = h->sps.log2_max_frame_num - 4;
168 render->info.h264.pic_order_cnt_type = h->sps.poc_type;
169 render->info.h264.log2_max_pic_order_cnt_lsb_minus4 = h->sps.log2_max_poc_lsb - 4;
170 render->info.h264.delta_pic_order_always_zero_flag = h->sps.delta_pic_order_always_zero_flag;
171 render->info.h264.direct_8x8_inference_flag = h->sps.direct_8x8_inference_flag;
172 render->info.h264.entropy_coding_mode_flag = h->pps.cabac;
173 render->info.h264.pic_order_present_flag = h->pps.pic_order_present;
174 render->info.h264.deblocking_filter_control_present_flag = h->pps.deblocking_filter_parameters_present;
175 render->info.h264.redundant_pic_cnt_present_flag = h->pps.redundant_pic_cnt_present;
176 memcpy(render->info.h264.scaling_lists_4x4, h->pps.scaling_matrix4, sizeof(render->info.h264.scaling_lists_4x4));
177 memcpy(render->info.h264.scaling_lists_8x8, h->pps.scaling_matrix8, sizeof(render->info.h264.scaling_lists_8x8));
178
179 ff_draw_horiz_band(s, 0, s->avctx->height);
180 render->bitstreamBuffersUsed = 0;
181}
182
183/* @}*/