/*
 * This file is part of Libav.
 *
 * Libav is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * Libav is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with Libav; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */
19 #include "libavutil/avassert.h"
20 #include "libavutil/common.h"
21 #include "libavutil/pixdesc.h"
25 #include "vaapi_decode.h"
28 int ff_vaapi_decode_make_param_buffer(AVCodecContext
*avctx
,
29 VAAPIDecodePicture
*pic
,
34 VAAPIDecodeContext
*ctx
= avctx
->internal
->hwaccel_priv_data
;
38 av_assert0(pic
->nb_param_buffers
+ 1 <= MAX_PARAM_BUFFERS
);
40 vas
= vaCreateBuffer(ctx
->hwctx
->display
, ctx
->va_context
,
41 type
, size
, 1, (void*)data
, &buffer
);
42 if (vas
!= VA_STATUS_SUCCESS
) {
43 av_log(avctx
, AV_LOG_ERROR
, "Failed to create parameter "
44 "buffer (type %d): %d (%s).\n",
45 type
, vas
, vaErrorStr(vas
));
49 pic
->param_buffers
[pic
->nb_param_buffers
++] = buffer
;
51 av_log(avctx
, AV_LOG_DEBUG
, "Param buffer (type %d, %zu bytes) "
52 "is %#x.\n", type
, size
, buffer
);
57 int ff_vaapi_decode_make_slice_buffer(AVCodecContext
*avctx
,
58 VAAPIDecodePicture
*pic
,
59 const void *params_data
,
61 const void *slice_data
,
64 VAAPIDecodeContext
*ctx
= avctx
->internal
->hwaccel_priv_data
;
68 av_assert0(pic
->nb_slices
<= pic
->slices_allocated
);
69 if (pic
->nb_slices
== pic
->slices_allocated
) {
70 if (pic
->slices_allocated
> 0)
71 pic
->slices_allocated
*= 2;
73 pic
->slices_allocated
= 64;
76 av_realloc_array(pic
->slice_buffers
,
77 pic
->slices_allocated
,
78 2 * sizeof(*pic
->slice_buffers
));
79 if (!pic
->slice_buffers
)
80 return AVERROR(ENOMEM
);
82 av_assert0(pic
->nb_slices
+ 1 <= pic
->slices_allocated
);
84 index
= 2 * pic
->nb_slices
;
86 vas
= vaCreateBuffer(ctx
->hwctx
->display
, ctx
->va_context
,
87 VASliceParameterBufferType
,
88 params_size
, 1, (void*)params_data
,
89 &pic
->slice_buffers
[index
]);
90 if (vas
!= VA_STATUS_SUCCESS
) {
91 av_log(avctx
, AV_LOG_ERROR
, "Failed to create slice "
92 "parameter buffer: %d (%s).\n", vas
, vaErrorStr(vas
));
96 av_log(avctx
, AV_LOG_DEBUG
, "Slice %d param buffer (%zu bytes) "
97 "is %#x.\n", pic
->nb_slices
, params_size
,
98 pic
->slice_buffers
[index
]);
100 vas
= vaCreateBuffer(ctx
->hwctx
->display
, ctx
->va_context
,
101 VASliceDataBufferType
,
102 slice_size
, 1, (void*)slice_data
,
103 &pic
->slice_buffers
[index
+ 1]);
104 if (vas
!= VA_STATUS_SUCCESS
) {
105 av_log(avctx
, AV_LOG_ERROR
, "Failed to create slice "
106 "data buffer (size %zu): %d (%s).\n",
107 slice_size
, vas
, vaErrorStr(vas
));
108 vaDestroyBuffer(ctx
->hwctx
->display
,
109 pic
->slice_buffers
[index
]);
113 av_log(avctx
, AV_LOG_DEBUG
, "Slice %d data buffer (%zu bytes) "
114 "is %#x.\n", pic
->nb_slices
, slice_size
,
115 pic
->slice_buffers
[index
+ 1]);
121 static void ff_vaapi_decode_destroy_buffers(AVCodecContext
*avctx
,
122 VAAPIDecodePicture
*pic
)
124 VAAPIDecodeContext
*ctx
= avctx
->internal
->hwaccel_priv_data
;
128 for (i
= 0; i
< pic
->nb_param_buffers
; i
++) {
129 vas
= vaDestroyBuffer(ctx
->hwctx
->display
,
130 pic
->param_buffers
[i
]);
131 if (vas
!= VA_STATUS_SUCCESS
) {
132 av_log(avctx
, AV_LOG_ERROR
, "Failed to destroy "
133 "parameter buffer %#x: %d (%s).\n",
134 pic
->param_buffers
[i
], vas
, vaErrorStr(vas
));
138 for (i
= 0; i
< 2 * pic
->nb_slices
; i
++) {
139 vas
= vaDestroyBuffer(ctx
->hwctx
->display
,
140 pic
->slice_buffers
[i
]);
141 if (vas
!= VA_STATUS_SUCCESS
) {
142 av_log(avctx
, AV_LOG_ERROR
, "Failed to destroy slice "
143 "slice buffer %#x: %d (%s).\n",
144 pic
->slice_buffers
[i
], vas
, vaErrorStr(vas
));
149 int ff_vaapi_decode_issue(AVCodecContext
*avctx
,
150 VAAPIDecodePicture
*pic
)
152 VAAPIDecodeContext
*ctx
= avctx
->internal
->hwaccel_priv_data
;
156 av_log(avctx
, AV_LOG_DEBUG
, "Decode to surface %#x.\n",
157 pic
->output_surface
);
159 vas
= vaBeginPicture(ctx
->hwctx
->display
, ctx
->va_context
,
160 pic
->output_surface
);
161 if (vas
!= VA_STATUS_SUCCESS
) {
162 av_log(avctx
, AV_LOG_ERROR
, "Failed to begin picture decode "
163 "issue: %d (%s).\n", vas
, vaErrorStr(vas
));
165 goto fail_with_picture
;
168 vas
= vaRenderPicture(ctx
->hwctx
->display
, ctx
->va_context
,
169 pic
->param_buffers
, pic
->nb_param_buffers
);
170 if (vas
!= VA_STATUS_SUCCESS
) {
171 av_log(avctx
, AV_LOG_ERROR
, "Failed to upload decode "
172 "parameters: %d (%s).\n", vas
, vaErrorStr(vas
));
174 goto fail_with_picture
;
177 vas
= vaRenderPicture(ctx
->hwctx
->display
, ctx
->va_context
,
178 pic
->slice_buffers
, 2 * pic
->nb_slices
);
179 if (vas
!= VA_STATUS_SUCCESS
) {
180 av_log(avctx
, AV_LOG_ERROR
, "Failed to upload slices: "
181 "%d (%s).\n", vas
, vaErrorStr(vas
));
183 goto fail_with_picture
;
186 vas
= vaEndPicture(ctx
->hwctx
->display
, ctx
->va_context
);
187 if (vas
!= VA_STATUS_SUCCESS
) {
188 av_log(avctx
, AV_LOG_ERROR
, "Failed to end picture decode "
189 "issue: %d (%s).\n", vas
, vaErrorStr(vas
));
191 if (ctx
->hwctx
->driver_quirks
&
192 AV_VAAPI_DRIVER_QUIRK_RENDER_PARAM_BUFFERS
)
198 if (ctx
->hwctx
->driver_quirks
&
199 AV_VAAPI_DRIVER_QUIRK_RENDER_PARAM_BUFFERS
)
200 ff_vaapi_decode_destroy_buffers(avctx
, pic
);
202 pic
->nb_param_buffers
= 0;
204 pic
->slices_allocated
= 0;
205 av_freep(&pic
->slice_buffers
);
210 vas
= vaEndPicture(ctx
->hwctx
->display
, ctx
->va_context
);
211 if (vas
!= VA_STATUS_SUCCESS
) {
212 av_log(avctx
, AV_LOG_ERROR
, "Failed to end picture decode "
213 "after error: %d (%s).\n", vas
, vaErrorStr(vas
));
216 ff_vaapi_decode_destroy_buffers(avctx
, pic
);
221 int ff_vaapi_decode_cancel(AVCodecContext
*avctx
,
222 VAAPIDecodePicture
*pic
)
224 ff_vaapi_decode_destroy_buffers(avctx
, pic
);
226 pic
->nb_param_buffers
= 0;
228 pic
->slices_allocated
= 0;
229 av_freep(&pic
->slice_buffers
);
234 static const struct {
235 enum AVCodecID codec_id
;
237 VAProfile va_profile
;
238 } vaapi_profile_map
[] = {
239 #define MAP(c, p, v) { AV_CODEC_ID_ ## c, FF_PROFILE_ ## p, VAProfile ## v }
240 MAP(MPEG2VIDEO
, MPEG2_SIMPLE
, MPEG2Simple
),
241 MAP(MPEG2VIDEO
, MPEG2_MAIN
, MPEG2Main
),
242 MAP(H263
, UNKNOWN
, H263Baseline
),
243 MAP(MPEG4
, MPEG4_SIMPLE
, MPEG4Simple
),
244 MAP(MPEG4
, MPEG4_ADVANCED_SIMPLE
,
245 MPEG4AdvancedSimple
),
246 MAP(MPEG4
, MPEG4_MAIN
, MPEG4Main
),
247 MAP(H264
, H264_CONSTRAINED_BASELINE
,
248 H264ConstrainedBaseline
),
249 MAP(H264
, H264_BASELINE
, H264Baseline
),
250 MAP(H264
, H264_MAIN
, H264Main
),
251 MAP(H264
, H264_HIGH
, H264High
),
252 #if VA_CHECK_VERSION(0, 37, 0)
253 MAP(HEVC
, HEVC_MAIN
, HEVCMain
),
254 MAP(HEVC
, HEVC_MAIN_10
, HEVCMain10
),
256 MAP(WMV3
, VC1_SIMPLE
, VC1Simple
),
257 MAP(WMV3
, VC1_MAIN
, VC1Main
),
258 MAP(WMV3
, VC1_COMPLEX
, VC1Advanced
),
259 MAP(WMV3
, VC1_ADVANCED
, VC1Advanced
),
260 MAP(VC1
, VC1_SIMPLE
, VC1Simple
),
261 MAP(VC1
, VC1_MAIN
, VC1Main
),
262 MAP(VC1
, VC1_COMPLEX
, VC1Advanced
),
263 MAP(VC1
, VC1_ADVANCED
, VC1Advanced
),
264 #if VA_CHECK_VERSION(0, 35, 0)
265 MAP(VP8
, UNKNOWN
, VP8Version0_3
),
267 #if VA_CHECK_VERSION(0, 38, 0)
268 MAP(VP9
, VP9_0
, VP9Profile0
),
273 static int vaapi_decode_make_config(AVCodecContext
*avctx
)
275 VAAPIDecodeContext
*ctx
= avctx
->internal
->hwaccel_priv_data
;
277 AVVAAPIHWConfig
*hwconfig
= NULL
;
278 AVHWFramesConstraints
*constraints
= NULL
;
281 const AVCodecDescriptor
*codec_desc
;
282 VAProfile profile
, *profile_list
= NULL
;
283 int profile_count
, exact_match
, alt_profile
;
284 const AVPixFmtDescriptor
*sw_desc
, *desc
;
286 codec_desc
= avcodec_descriptor_get(avctx
->codec_id
);
288 err
= AVERROR(EINVAL
);
292 profile_count
= vaMaxNumProfiles(ctx
->hwctx
->display
);
293 profile_list
= av_malloc_array(profile_count
,
296 err
= AVERROR(ENOMEM
);
300 vas
= vaQueryConfigProfiles(ctx
->hwctx
->display
,
301 profile_list
, &profile_count
);
302 if (vas
!= VA_STATUS_SUCCESS
) {
303 av_log(avctx
, AV_LOG_ERROR
, "Failed to query profiles: "
304 "%d (%s).\n", vas
, vaErrorStr(vas
));
305 err
= AVERROR(ENOSYS
);
309 profile
= VAProfileNone
;
312 for (i
= 0; i
< FF_ARRAY_ELEMS(vaapi_profile_map
); i
++) {
313 int profile_match
= 0;
314 if (avctx
->codec_id
!= vaapi_profile_map
[i
].codec_id
)
316 if (avctx
->profile
== vaapi_profile_map
[i
].codec_profile
||
317 vaapi_profile_map
[i
].codec_profile
== FF_PROFILE_UNKNOWN
)
319 profile
= vaapi_profile_map
[i
].va_profile
;
320 for (j
= 0; j
< profile_count
; j
++) {
321 if (profile
== profile_list
[j
]) {
322 exact_match
= profile_match
;
326 if (j
< profile_count
) {
329 alt_profile
= vaapi_profile_map
[i
].codec_profile
;
332 av_freep(&profile_list
);
334 if (profile
== VAProfileNone
) {
335 av_log(avctx
, AV_LOG_ERROR
, "No support for codec %s "
336 "profile %d.\n", codec_desc
->name
, avctx
->profile
);
337 err
= AVERROR(ENOSYS
);
341 if (avctx
->hwaccel_flags
&
342 AV_HWACCEL_FLAG_ALLOW_PROFILE_MISMATCH
) {
343 av_log(avctx
, AV_LOG_VERBOSE
, "Codec %s profile %d not "
344 "supported for hardware decode.\n",
345 codec_desc
->name
, avctx
->profile
);
346 av_log(avctx
, AV_LOG_WARNING
, "Using possibly-"
347 "incompatible profile %d instead.\n",
350 av_log(avctx
, AV_LOG_VERBOSE
, "Codec %s profile %d not "
351 "supported for hardware decode.\n",
352 codec_desc
->name
, avctx
->profile
);
353 err
= AVERROR(EINVAL
);
358 ctx
->va_profile
= profile
;
359 ctx
->va_entrypoint
= VAEntrypointVLD
;
361 vas
= vaCreateConfig(ctx
->hwctx
->display
, ctx
->va_profile
,
362 ctx
->va_entrypoint
, NULL
, 0,
364 if (vas
!= VA_STATUS_SUCCESS
) {
365 av_log(avctx
, AV_LOG_ERROR
, "Failed to create decode "
366 "configuration: %d (%s).\n", vas
, vaErrorStr(vas
));
371 hwconfig
= av_hwdevice_hwconfig_alloc(avctx
->hw_device_ctx ?
372 avctx
->hw_device_ctx
:
373 ctx
->frames
->device_ref
);
375 err
= AVERROR(ENOMEM
);
378 hwconfig
->config_id
= ctx
->va_config
;
381 av_hwdevice_get_hwframe_constraints(avctx
->hw_device_ctx ?
382 avctx
->hw_device_ctx
:
383 ctx
->frames
->device_ref
,
386 err
= AVERROR(ENOMEM
);
390 if (avctx
->coded_width
< constraints
->min_width
||
391 avctx
->coded_height
< constraints
->min_height
||
392 avctx
->coded_width
> constraints
->max_width
||
393 avctx
->coded_height
> constraints
->max_height
) {
394 av_log(avctx
, AV_LOG_ERROR
, "Hardware does not support image "
395 "size %dx%d (constraints: width %d-%d height %d-%d).\n",
396 avctx
->coded_width
, avctx
->coded_height
,
397 constraints
->min_width
, constraints
->max_width
,
398 constraints
->min_height
, constraints
->max_height
);
399 err
= AVERROR(EINVAL
);
402 if (!constraints
->valid_sw_formats
||
403 constraints
->valid_sw_formats
[0] == AV_PIX_FMT_NONE
) {
404 av_log(avctx
, AV_LOG_ERROR
, "Hardware does not offer any "
405 "usable surface formats.\n");
406 err
= AVERROR(EINVAL
);
410 // Find the first format in the list which matches the expected
411 // bit depth and subsampling. If none are found (this can happen
412 // when 10-bit streams are decoded to 8-bit surfaces, for example)
413 // then just take the first format on the list.
414 ctx
->surface_format
= constraints
->valid_sw_formats
[0];
415 sw_desc
= av_pix_fmt_desc_get(avctx
->sw_pix_fmt
);
416 for (i
= 0; constraints
->valid_sw_formats
[i
] != AV_PIX_FMT_NONE
; i
++) {
417 desc
= av_pix_fmt_desc_get(constraints
->valid_sw_formats
[i
]);
418 if (desc
->nb_components
!= sw_desc
->nb_components
||
419 desc
->log2_chroma_w
!= sw_desc
->log2_chroma_w
||
420 desc
->log2_chroma_h
!= sw_desc
->log2_chroma_h
)
422 for (j
= 0; j
< desc
->nb_components
; j
++) {
423 if (desc
->comp
[j
].depth
!= sw_desc
->comp
[j
].depth
)
426 if (j
< desc
->nb_components
)
428 ctx
->surface_format
= constraints
->valid_sw_formats
[i
];
432 // Start with at least four surfaces.
433 ctx
->surface_count
= 4;
434 // Add per-codec number of surfaces used for storing reference frames.
435 switch (avctx
->codec_id
) {
436 case AV_CODEC_ID_H264
:
437 case AV_CODEC_ID_HEVC
:
438 ctx
->surface_count
+= 16;
440 case AV_CODEC_ID_VP9
:
441 ctx
->surface_count
+= 8;
443 case AV_CODEC_ID_VP8
:
444 ctx
->surface_count
+= 3;
447 ctx
->surface_count
+= 2;
449 // Add an additional surface per thread is frame threading is enabled.
450 if (avctx
->active_thread_type
& FF_THREAD_FRAME
)
451 ctx
->surface_count
+= avctx
->thread_count
;
453 av_hwframe_constraints_free(&constraints
);
459 av_hwframe_constraints_free(&constraints
);
461 if (ctx
->va_config
!= VA_INVALID_ID
) {
462 vaDestroyConfig(ctx
->hwctx
->display
, ctx
->va_config
);
463 ctx
->va_config
= VA_INVALID_ID
;
465 av_freep(&profile_list
);
469 int ff_vaapi_decode_init(AVCodecContext
*avctx
)
471 VAAPIDecodeContext
*ctx
= avctx
->internal
->hwaccel_priv_data
;
475 ctx
->va_config
= VA_INVALID_ID
;
476 ctx
->va_context
= VA_INVALID_ID
;
478 #if FF_API_VAAPI_CONTEXT
479 if (avctx
->hwaccel_context
) {
480 av_log(avctx
, AV_LOG_WARNING
, "Using deprecated struct "
481 "vaapi_context in decode.\n");
483 ctx
->have_old_context
= 1;
484 ctx
->old_context
= avctx
->hwaccel_context
;
486 // Really we only want the VAAPI device context, but this
487 // allocates a whole generic device context because we don't
488 // have any other way to determine how big it should be.
490 av_hwdevice_ctx_alloc(AV_HWDEVICE_TYPE_VAAPI
);
491 if (!ctx
->device_ref
) {
492 err
= AVERROR(ENOMEM
);
495 ctx
->device
= (AVHWDeviceContext
*)ctx
->device_ref
->data
;
496 ctx
->hwctx
= ctx
->device
->hwctx
;
498 ctx
->hwctx
->display
= ctx
->old_context
->display
;
500 // The old VAAPI decode setup assumed this quirk was always
501 // present, so set it here to avoid the behaviour changing.
502 ctx
->hwctx
->driver_quirks
=
503 AV_VAAPI_DRIVER_QUIRK_RENDER_PARAM_BUFFERS
;
507 if (avctx
->hw_frames_ctx
) {
508 // This structure has a shorter lifetime than the enclosing
509 // AVCodecContext, so we inherit the references from there
510 // and do not need to make separate ones.
512 ctx
->frames
= (AVHWFramesContext
*)avctx
->hw_frames_ctx
->data
;
513 ctx
->hwfc
= ctx
->frames
->hwctx
;
514 ctx
->device
= ctx
->frames
->device_ctx
;
515 ctx
->hwctx
= ctx
->device
->hwctx
;
517 } else if (avctx
->hw_device_ctx
) {
518 ctx
->device
= (AVHWDeviceContext
*)avctx
->hw_device_ctx
->data
;
519 ctx
->hwctx
= ctx
->device
->hwctx
;
521 if (ctx
->device
->type
!= AV_HWDEVICE_TYPE_VAAPI
) {
522 av_log(avctx
, AV_LOG_ERROR
, "Device supplied for VAAPI "
523 "decoding must be a VAAPI device (not %d).\n",
525 err
= AVERROR(EINVAL
);
530 av_log(avctx
, AV_LOG_ERROR
, "A hardware device or frames context "
531 "is required for VAAPI decoding.\n");
532 err
= AVERROR(EINVAL
);
536 #if FF_API_VAAPI_CONTEXT
537 if (ctx
->have_old_context
) {
538 ctx
->va_config
= ctx
->old_context
->config_id
;
539 ctx
->va_context
= ctx
->old_context
->context_id
;
541 av_log(avctx
, AV_LOG_DEBUG
, "Using user-supplied decoder "
542 "context: %#x/%#x.\n", ctx
->va_config
, ctx
->va_context
);
546 err
= vaapi_decode_make_config(avctx
);
550 if (!avctx
->hw_frames_ctx
) {
551 avctx
->hw_frames_ctx
= av_hwframe_ctx_alloc(avctx
->hw_device_ctx
);
552 if (!avctx
->hw_frames_ctx
) {
553 err
= AVERROR(ENOMEM
);
556 ctx
->frames
= (AVHWFramesContext
*)avctx
->hw_frames_ctx
->data
;
558 ctx
->frames
->format
= AV_PIX_FMT_VAAPI
;
559 ctx
->frames
->width
= avctx
->coded_width
;
560 ctx
->frames
->height
= avctx
->coded_height
;
562 ctx
->frames
->sw_format
= ctx
->surface_format
;
563 ctx
->frames
->initial_pool_size
= ctx
->surface_count
;
565 err
= av_hwframe_ctx_init(avctx
->hw_frames_ctx
);
567 av_log(avctx
, AV_LOG_ERROR
, "Failed to initialise internal "
568 "frames context: %d.\n", err
);
572 ctx
->hwfc
= ctx
->frames
->hwctx
;
575 vas
= vaCreateContext(ctx
->hwctx
->display
, ctx
->va_config
,
576 avctx
->coded_width
, avctx
->coded_height
,
578 ctx
->hwfc
->surface_ids
,
579 ctx
->hwfc
->nb_surfaces
,
581 if (vas
!= VA_STATUS_SUCCESS
) {
582 av_log(avctx
, AV_LOG_ERROR
, "Failed to create decode "
583 "context: %d (%s).\n", vas
, vaErrorStr(vas
));
588 av_log(avctx
, AV_LOG_DEBUG
, "Decode context initialised: "
589 "%#x/%#x.\n", ctx
->va_config
, ctx
->va_context
);
590 #if FF_API_VAAPI_CONTEXT
597 ff_vaapi_decode_uninit(avctx
);
601 int ff_vaapi_decode_uninit(AVCodecContext
*avctx
)
603 VAAPIDecodeContext
*ctx
= avctx
->internal
->hwaccel_priv_data
;
606 #if FF_API_VAAPI_CONTEXT
607 if (ctx
->have_old_context
) {
608 av_buffer_unref(&ctx
->device_ref
);
612 if (ctx
->va_context
!= VA_INVALID_ID
) {
613 vas
= vaDestroyContext(ctx
->hwctx
->display
, ctx
->va_context
);
614 if (vas
!= VA_STATUS_SUCCESS
) {
615 av_log(avctx
, AV_LOG_ERROR
, "Failed to destroy decode "
616 "context %#x: %d (%s).\n",
617 ctx
->va_context
, vas
, vaErrorStr(vas
));
620 if (ctx
->va_config
!= VA_INVALID_ID
) {
621 vas
= vaDestroyConfig(ctx
->hwctx
->display
, ctx
->va_config
);
622 if (vas
!= VA_STATUS_SUCCESS
) {
623 av_log(avctx
, AV_LOG_ERROR
, "Failed to destroy decode "
624 "configuration %#x: %d (%s).\n",
625 ctx
->va_config
, vas
, vaErrorStr(vas
));
629 #if FF_API_VAAPI_CONTEXT