lavc: Add new VDA hwaccel
[libav.git] / libavcodec / vda_h264.c
CommitLineData
ac3dbb4d
SZ
1/*
2 * VDA H.264 hardware acceleration
3 *
4 * copyright (c) 2011 Sebastien Zwickert
5 *
6 * This file is part of Libav.
7 *
8 * Libav is free software; you can redistribute it and/or
9 * modify it under the terms of the GNU Lesser General Public
10 * License as published by the Free Software Foundation; either
11 * version 2.1 of the License, or (at your option) any later version.
12 *
13 * Libav is distributed in the hope that it will be useful,
14 * but WITHOUT ANY WARRANTY; without even the implied warranty of
15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16 * Lesser General Public License for more details.
17 *
18 * You should have received a copy of the GNU Lesser General Public
19 * License along with Libav; if not, write to the Free Software
20 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
21 */
22
dc87ac55
SZ
23#include <CoreFoundation/CFNumber.h>
24#include <CoreFoundation/CFData.h>
25#include <CoreFoundation/CFString.h>
26
27#include "libavutil/avutil.h"
ac3dbb4d 28#include "h264.h"
67afcefb 29#include "internal.h"
dc87ac55 30#include "vda.h"
67afcefb 31#include "vda_internal.h"
dc87ac55 32
31a46750
AK
33typedef struct VDAContext {
34 // The current bitstream buffer.
35 uint8_t *bitstream;
36
37 // The current size of the bitstream.
38 int bitstream_size;
39
40 // The reference size used for fast reallocation.
41 int allocated_size;
67afcefb
AK
42
43 CVImageBufferRef frame;
31a46750
AK
44} VDAContext;
45
dc87ac55
SZ
46/* Decoder callback that adds the VDA frame to the queue in display order. */
47static void vda_decoder_callback(void *vda_hw_ctx,
48 CFDictionaryRef user_info,
49 OSStatus status,
50 uint32_t infoFlags,
51 CVImageBufferRef image_buffer)
52{
53 struct vda_context *vda_ctx = vda_hw_ctx;
54
55 if (!image_buffer)
56 return;
57
58 if (vda_ctx->cv_pix_fmt_type != CVPixelBufferGetPixelFormatType(image_buffer))
59 return;
60
202c2acc 61 vda_ctx->cv_buffer = CVPixelBufferRetain(image_buffer);
dc87ac55
SZ
62}
63
31a46750 64static int vda_sync_decode(VDAContext *ctx, struct vda_context *vda_ctx)
dc87ac55
SZ
65{
66 OSStatus status;
67 CFDataRef coded_frame;
68 uint32_t flush_flags = 1 << 0; ///< kVDADecoderFlush_emitFrames
69
70 coded_frame = CFDataCreate(kCFAllocatorDefault,
31a46750
AK
71 ctx->bitstream,
72 ctx->bitstream_size);
dc87ac55
SZ
73
74 status = VDADecoderDecode(vda_ctx->decoder, 0, coded_frame, NULL);
75
76 if (kVDADecoderNoErr == status)
77 status = VDADecoderFlush(vda_ctx->decoder, flush_flags);
78
79 CFRelease(coded_frame);
80
81 return status;
82}
83
ac3dbb4d 84
67afcefb 85static int vda_old_h264_start_frame(AVCodecContext *avctx,
c57a5936
DB
86 av_unused const uint8_t *buffer,
87 av_unused uint32_t size)
ac3dbb4d 88{
31a46750 89 VDAContext *vda = avctx->internal->hwaccel_priv_data;
ac3dbb4d 90 struct vda_context *vda_ctx = avctx->hwaccel_context;
ac3dbb4d
SZ
91
92 if (!vda_ctx->decoder)
93 return -1;
94
31a46750 95 vda->bitstream_size = 0;
ac3dbb4d
SZ
96
97 return 0;
98}
99
67afcefb 100static int vda_old_h264_decode_slice(AVCodecContext *avctx,
c57a5936
DB
101 const uint8_t *buffer,
102 uint32_t size)
ac3dbb4d 103{
31a46750 104 VDAContext *vda = avctx->internal->hwaccel_priv_data;
ac3dbb4d 105 struct vda_context *vda_ctx = avctx->hwaccel_context;
ac3dbb4d
SZ
106 void *tmp;
107
108 if (!vda_ctx->decoder)
109 return -1;
110
31a46750
AK
111 tmp = av_fast_realloc(vda->bitstream,
112 &vda->allocated_size,
113 vda->bitstream_size + size + 4);
ac3dbb4d
SZ
114 if (!tmp)
115 return AVERROR(ENOMEM);
116
31a46750 117 vda->bitstream = tmp;
ac3dbb4d 118
31a46750
AK
119 AV_WB32(vda->bitstream + vda->bitstream_size, size);
120 memcpy(vda->bitstream + vda->bitstream_size + 4, buffer, size);
ac3dbb4d 121
31a46750 122 vda->bitstream_size += size + 4;
ac3dbb4d
SZ
123
124 return 0;
125}
126
67afcefb 127static int vda_old_h264_end_frame(AVCodecContext *avctx)
ac3dbb4d
SZ
128{
129 H264Context *h = avctx->priv_data;
31a46750 130 VDAContext *vda = avctx->internal->hwaccel_priv_data;
ac3dbb4d 131 struct vda_context *vda_ctx = avctx->hwaccel_context;
2c541554 132 AVFrame *frame = &h->cur_pic_ptr->f;
ac3dbb4d
SZ
133 int status;
134
31a46750 135 if (!vda_ctx->decoder || !vda->bitstream)
ac3dbb4d
SZ
136 return -1;
137
31a46750 138 status = vda_sync_decode(vda, vda_ctx);
202c2acc 139 frame->data[3] = (void*)vda_ctx->cv_buffer;
ac3dbb4d
SZ
140
141 if (status)
142 av_log(avctx, AV_LOG_ERROR, "Failed to decode frame (%d)\n", status);
143
ac3dbb4d
SZ
144 return status;
145}
146
dc87ac55
SZ
147int ff_vda_create_decoder(struct vda_context *vda_ctx,
148 uint8_t *extradata,
149 int extradata_size)
150{
151 OSStatus status = kVDADecoderNoErr;
152 CFNumberRef height;
153 CFNumberRef width;
154 CFNumberRef format;
155 CFDataRef avc_data;
156 CFMutableDictionaryRef config_info;
157 CFMutableDictionaryRef buffer_attributes;
158 CFMutableDictionaryRef io_surface_properties;
159 CFNumberRef cv_pix_fmt;
160
dc87ac55 161 /* Each VCL NAL in the bistream sent to the decoder
511cf612 162 * is preceded by a 4 bytes length header.
dc87ac55
SZ
163 * Change the avcC atom header if needed, to signal headers of 4 bytes. */
164 if (extradata_size >= 4 && (extradata[4] & 0x03) != 0x03) {
165 uint8_t *rw_extradata;
166
167 if (!(rw_extradata = av_malloc(extradata_size)))
168 return AVERROR(ENOMEM);
169
170 memcpy(rw_extradata, extradata, extradata_size);
171
172 rw_extradata[4] |= 0x03;
173
174 avc_data = CFDataCreate(kCFAllocatorDefault, rw_extradata, extradata_size);
175
176 av_freep(&rw_extradata);
177 } else {
178 avc_data = CFDataCreate(kCFAllocatorDefault, extradata, extradata_size);
179 }
180
181 config_info = CFDictionaryCreateMutable(kCFAllocatorDefault,
182 4,
183 &kCFTypeDictionaryKeyCallBacks,
184 &kCFTypeDictionaryValueCallBacks);
185
186 height = CFNumberCreate(kCFAllocatorDefault, kCFNumberSInt32Type, &vda_ctx->height);
187 width = CFNumberCreate(kCFAllocatorDefault, kCFNumberSInt32Type, &vda_ctx->width);
188 format = CFNumberCreate(kCFAllocatorDefault, kCFNumberSInt32Type, &vda_ctx->format);
189
190 CFDictionarySetValue(config_info, kVDADecoderConfiguration_Height, height);
191 CFDictionarySetValue(config_info, kVDADecoderConfiguration_Width, width);
192 CFDictionarySetValue(config_info, kVDADecoderConfiguration_SourceFormat, format);
193 CFDictionarySetValue(config_info, kVDADecoderConfiguration_avcCData, avc_data);
194
195 buffer_attributes = CFDictionaryCreateMutable(kCFAllocatorDefault,
196 2,
197 &kCFTypeDictionaryKeyCallBacks,
198 &kCFTypeDictionaryValueCallBacks);
199 io_surface_properties = CFDictionaryCreateMutable(kCFAllocatorDefault,
200 0,
201 &kCFTypeDictionaryKeyCallBacks,
202 &kCFTypeDictionaryValueCallBacks);
203 cv_pix_fmt = CFNumberCreate(kCFAllocatorDefault,
204 kCFNumberSInt32Type,
205 &vda_ctx->cv_pix_fmt_type);
206 CFDictionarySetValue(buffer_attributes,
207 kCVPixelBufferPixelFormatTypeKey,
208 cv_pix_fmt);
209 CFDictionarySetValue(buffer_attributes,
210 kCVPixelBufferIOSurfacePropertiesKey,
211 io_surface_properties);
212
213 status = VDADecoderCreate(config_info,
214 buffer_attributes,
67afcefb 215 (VDADecoderOutputCallback *)vda_decoder_callback,
dc87ac55
SZ
216 vda_ctx,
217 &vda_ctx->decoder);
218
219 CFRelease(height);
220 CFRelease(width);
221 CFRelease(format);
222 CFRelease(avc_data);
223 CFRelease(config_info);
224 CFRelease(io_surface_properties);
225 CFRelease(cv_pix_fmt);
226 CFRelease(buffer_attributes);
227
228 return status;
229}
230
231int ff_vda_destroy_decoder(struct vda_context *vda_ctx)
232{
233 OSStatus status = kVDADecoderNoErr;
234
235 if (vda_ctx->decoder)
236 status = VDADecoderDestroy(vda_ctx->decoder);
237
dc87ac55
SZ
238 return status;
239}
240
67afcefb 241static int vda_h264_uninit(AVCodecContext *avctx)
31a46750 242{
67afcefb 243 VDAContext *vda = avctx->internal->hwaccel_priv_data;
31a46750 244 av_freep(&vda->bitstream);
67afcefb
AK
245 if (vda->frame)
246 CVPixelBufferRelease(vda->frame);
247 return 0;
31a46750
AK
248}
249
67afcefb 250AVHWAccel ff_h264_vda_old_hwaccel = {
ac3dbb4d
SZ
251 .name = "h264_vda",
252 .type = AVMEDIA_TYPE_VIDEO,
36ef5369 253 .id = AV_CODEC_ID_H264,
716d413c 254 .pix_fmt = AV_PIX_FMT_VDA_VLD,
67afcefb
AK
255 .start_frame = vda_old_h264_start_frame,
256 .decode_slice = vda_old_h264_decode_slice,
257 .end_frame = vda_old_h264_end_frame,
258 .uninit = vda_h264_uninit,
259 .priv_data_size = sizeof(VDAContext),
260};
261
262void ff_vda_output_callback(void *opaque,
263 CFDictionaryRef user_info,
264 OSStatus status,
265 uint32_t infoFlags,
266 CVImageBufferRef image_buffer)
267{
268 AVCodecContext *ctx = opaque;
269 VDAContext *vda = ctx->internal->hwaccel_priv_data;
270
271
272 if (vda->frame) {
273 CVPixelBufferRelease(vda->frame);
274 vda->frame = NULL;
275 }
276
277 if (!image_buffer)
278 return;
279
280 vda->frame = CVPixelBufferRetain(image_buffer);
281}
282
283static int vda_h264_start_frame(AVCodecContext *avctx,
284 const uint8_t *buffer,
285 uint32_t size)
286{
287 VDAContext *vda = avctx->internal->hwaccel_priv_data;
288
289 vda->bitstream_size = 0;
290
291 return 0;
292}
293
294static int vda_h264_decode_slice(AVCodecContext *avctx,
295 const uint8_t *buffer,
296 uint32_t size)
297{
298 VDAContext *vda = avctx->internal->hwaccel_priv_data;
299 void *tmp;
300
301 tmp = av_fast_realloc(vda->bitstream,
302 &vda->allocated_size,
303 vda->bitstream_size + size + 4);
304 if (!tmp)
305 return AVERROR(ENOMEM);
306
307 vda->bitstream = tmp;
308
309 AV_WB32(vda->bitstream + vda->bitstream_size, size);
310 memcpy(vda->bitstream + vda->bitstream_size + 4, buffer, size);
311
312 vda->bitstream_size += size + 4;
313
314 return 0;
315}
316
317static void release_buffer(void *opaque, uint8_t *data)
318{
319 CVImageBufferRef frame = (CVImageBufferRef)data;
320 CVPixelBufferRelease(frame);
321}
322
323static int vda_h264_end_frame(AVCodecContext *avctx)
324{
325 H264Context *h = avctx->priv_data;
326 VDAContext *vda = avctx->internal->hwaccel_priv_data;
327 AVVDAContext *vda_ctx = avctx->hwaccel_context;
328 AVFrame *frame = &h->cur_pic_ptr->f;
329 uint32_t flush_flags = 1 << 0; ///< kVDADecoderFlush_emitFrames
330 CFDataRef coded_frame;
331 OSStatus status;
332
333 if (!vda->bitstream_size)
334 return AVERROR_INVALIDDATA;
335
336
337 coded_frame = CFDataCreate(kCFAllocatorDefault,
338 vda->bitstream,
339 vda->bitstream_size);
340
341 status = VDADecoderDecode(vda_ctx->decoder, 0, coded_frame, NULL);
342
343 if (status == kVDADecoderNoErr)
344 status = VDADecoderFlush(vda_ctx->decoder, flush_flags);
345
346 CFRelease(coded_frame);
347
348 if (status != kVDADecoderNoErr) {
349 av_log(avctx, AV_LOG_ERROR, "Failed to decode frame (%d)\n", status);
350 return AVERROR_UNKNOWN;
351 }
352
353 if (vda->frame) {
354 av_buffer_unref(&frame->buf[0]);
355
356 frame->buf[0] = av_buffer_create((uint8_t*)vda->frame,
357 sizeof(vda->frame),
358 release_buffer, NULL,
359 AV_BUFFER_FLAG_READONLY);
360 if (!frame->buf)
361 return AVERROR(ENOMEM);
362
363 frame->data[3] = (uint8_t*)vda->frame;
364 vda->frame = NULL;
365 }
366
367 return 0;
368}
369
370int ff_vda_default_init(AVCodecContext *avctx)
371{
372 AVVDAContext *vda_ctx = avctx->hwaccel_context;
373 OSStatus status = kVDADecoderNoErr;
374 CFNumberRef height;
375 CFNumberRef width;
376 CFNumberRef format;
377 CFDataRef avc_data;
378 CFMutableDictionaryRef config_info;
379 CFMutableDictionaryRef buffer_attributes;
380 CFMutableDictionaryRef io_surface_properties;
381 CFNumberRef cv_pix_fmt;
382 int32_t fmt = 'avc1', pix_fmt = kCVPixelFormatType_422YpCbCr8;
383
384 // kCVPixelFormatType_420YpCbCr8Planar;
385
386 /* Each VCL NAL in the bistream sent to the decoder
387 * is preceded by a 4 bytes length header.
388 * Change the avcC atom header if needed, to signal headers of 4 bytes. */
389 if (avctx->extradata_size >= 4 && (avctx->extradata[4] & 0x03) != 0x03) {
390 uint8_t *rw_extradata;
391
392 if (!(rw_extradata = av_malloc(avctx->extradata_size)))
393 return AVERROR(ENOMEM);
394
395 memcpy(rw_extradata, avctx->extradata, avctx->extradata_size);
396
397 rw_extradata[4] |= 0x03;
398
399 avc_data = CFDataCreate(kCFAllocatorDefault, rw_extradata, avctx->extradata_size);
400
401 av_freep(&rw_extradata);
402 } else {
403 avc_data = CFDataCreate(kCFAllocatorDefault,
404 avctx->extradata, avctx->extradata_size);
405 }
406
407 config_info = CFDictionaryCreateMutable(kCFAllocatorDefault,
408 4,
409 &kCFTypeDictionaryKeyCallBacks,
410 &kCFTypeDictionaryValueCallBacks);
411
412 height = CFNumberCreate(kCFAllocatorDefault, kCFNumberSInt32Type, &avctx->height);
413 width = CFNumberCreate(kCFAllocatorDefault, kCFNumberSInt32Type, &avctx->width);
414 format = CFNumberCreate(kCFAllocatorDefault, kCFNumberSInt32Type, &fmt);
415 CFDictionarySetValue(config_info, kVDADecoderConfiguration_Height, height);
416 CFDictionarySetValue(config_info, kVDADecoderConfiguration_Width, width);
417 CFDictionarySetValue(config_info, kVDADecoderConfiguration_avcCData, avc_data);
418 CFDictionarySetValue(config_info, kVDADecoderConfiguration_SourceFormat, format);
419
420 buffer_attributes = CFDictionaryCreateMutable(kCFAllocatorDefault,
421 2,
422 &kCFTypeDictionaryKeyCallBacks,
423 &kCFTypeDictionaryValueCallBacks);
424 io_surface_properties = CFDictionaryCreateMutable(kCFAllocatorDefault,
425 0,
426 &kCFTypeDictionaryKeyCallBacks,
427 &kCFTypeDictionaryValueCallBacks);
428 cv_pix_fmt = CFNumberCreate(kCFAllocatorDefault,
429 kCFNumberSInt32Type,
430 &pix_fmt);
431
432 CFDictionarySetValue(buffer_attributes,
433 kCVPixelBufferPixelFormatTypeKey,
434 cv_pix_fmt);
435 CFDictionarySetValue(buffer_attributes,
436 kCVPixelBufferIOSurfacePropertiesKey,
437 io_surface_properties);
438
439 status = VDADecoderCreate(config_info,
440 buffer_attributes,
441 (VDADecoderOutputCallback *)ff_vda_output_callback,
442 avctx,
443 &vda_ctx->decoder);
444
445 CFRelease(format);
446 CFRelease(height);
447 CFRelease(width);
448 CFRelease(avc_data);
449 CFRelease(config_info);
450 CFRelease(cv_pix_fmt);
451 CFRelease(io_surface_properties);
452 CFRelease(buffer_attributes);
453
454 if (status != kVDADecoderNoErr) {
455 av_log(avctx, AV_LOG_ERROR, "Cannot initialize VDA %d\n", status);
456 }
457
458 switch (status) {
459 case kVDADecoderHardwareNotSupportedErr:
460 case kVDADecoderFormatNotSupportedErr:
461 return AVERROR(ENOSYS);
462 case kVDADecoderConfigurationError:
463 return AVERROR(EINVAL);
464 case kVDADecoderDecoderFailedErr:
465 return AVERROR_INVALIDDATA;
466 case kVDADecoderNoErr:
467 return 0;
468 default:
469 return AVERROR_UNKNOWN;
470 }
471}
472
473static int vda_h264_alloc_frame(AVCodecContext *avctx, AVFrame *frame)
474{
475 frame->width = avctx->width;
476 frame->height = avctx->height;
477 frame->format = avctx->pix_fmt;
478 frame->buf[0] = av_buffer_alloc(1);
479
480 if (!frame->buf[0])
481 return AVERROR(ENOMEM);
482 return 0;
483}
484
485AVHWAccel ff_h264_vda_hwaccel = {
486 .name = "h264_vda",
487 .type = AVMEDIA_TYPE_VIDEO,
488 .id = AV_CODEC_ID_H264,
489 .pix_fmt = AV_PIX_FMT_VDA,
490 .alloc_frame = vda_h264_alloc_frame,
c57a5936
DB
491 .start_frame = vda_h264_start_frame,
492 .decode_slice = vda_h264_decode_slice,
493 .end_frame = vda_h264_end_frame,
31a46750
AK
494 .uninit = vda_h264_uninit,
495 .priv_data_size = sizeof(VDAContext),
ac3dbb4d 496};