Check size_bmp more fully
[platform/upstream/libav.git] / avconv_dxva2.c
1 /*
2  * This file is part of Libav.
3  *
4  * Libav is free software; you can redistribute it and/or
5  * modify it under the terms of the GNU Lesser General Public
6  * License as published by the Free Software Foundation; either
7  * version 2.1 of the License, or (at your option) any later version.
8  *
9  * Libav is distributed in the hope that it will be useful,
10  * but WITHOUT ANY WARRANTY; without even the implied warranty of
11  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
12  * Lesser General Public License for more details.
13  *
14  * You should have received a copy of the GNU Lesser General Public
15  * License along with Libav; if not, write to the Free Software
16  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
17  */
18
19 #include <windows.h>
20
21 #ifdef _WIN32_WINNT
22 #undef _WIN32_WINNT
23 #endif
24 #define _WIN32_WINNT 0x0600
25 #define DXVA2API_USE_BITFIELDS
26 #define COBJMACROS
27
28 #include <stdint.h>
29
30 #include <d3d9.h>
31 #include <dxva2api.h>
32
33 #include "avconv.h"
34
35 #include "libavcodec/dxva2.h"
36
37 #include "libavutil/avassert.h"
38 #include "libavutil/buffer.h"
39 #include "libavutil/frame.h"
40 #include "libavutil/imgutils.h"
41 #include "libavutil/pixfmt.h"
42
43 #include "libavutil/hwcontext.h"
44 #include "libavutil/hwcontext_dxva2.h"
45
/* Define all the GUIDs used directly here, to avoid problems with
   inconsistent dxva2api.h versions in mingw-w64 and different MSVC versions. */
48 #include <initguid.h>
/* Interface ID requested from IDirect3DDeviceManager9_GetVideoService() in dxva2_alloc(). */
DEFINE_GUID(IID_IDirectXVideoDecoderService, 0xfc51a551,0xd5e7,0x11d9,0xaf,0x55,0x00,0x05,0x4e,0x43,0xff,0x02);

/* Decoder mode GUIDs; the dxva2_modes table maps each of them to a codec ID. */
DEFINE_GUID(DXVA2_ModeMPEG2_VLD,      0xee27417f, 0x5e28,0x4e65,0xbe,0xea,0x1d,0x26,0xb5,0x08,0xad,0xc9);
DEFINE_GUID(DXVA2_ModeMPEG2and1_VLD,  0x86695f12, 0x340e,0x4f04,0x9f,0xd3,0x92,0x53,0xdd,0x32,0x74,0x60);
DEFINE_GUID(DXVA2_ModeH264_E,         0x1b81be68, 0xa0c7,0x11d3,0xb9,0x84,0x00,0xc0,0x4f,0x2e,0x73,0xc5);
DEFINE_GUID(DXVA2_ModeH264_F,         0x1b81be69, 0xa0c7,0x11d3,0xb9,0x84,0x00,0xc0,0x4f,0x2e,0x73,0xc5);
DEFINE_GUID(DXVADDI_Intel_ModeH264_E, 0x604F8E68, 0x4951,0x4C54,0x88,0xFE,0xAB,0xD2,0x5C,0x15,0xB3,0xD6);
DEFINE_GUID(DXVA2_ModeVC1_D,          0x1b81beA3, 0xa0c7,0x11d3,0xb9,0x84,0x00,0xc0,0x4f,0x2e,0x73,0xc5);
DEFINE_GUID(DXVA2_ModeVC1_D2010,      0x1b81beA4, 0xa0c7,0x11d3,0xb9,0x84,0x00,0xc0,0x4f,0x2e,0x73,0xc5);
DEFINE_GUID(DXVA2_ModeHEVC_VLD_Main,  0x5b11d51b, 0x2f4c,0x4452,0xbc,0xc3,0x09,0xf2,0xa1,0x16,0x0c,0xc0);
DEFINE_GUID(DXVA2_ModeHEVC_VLD_Main10,0x107af0e0, 0xef1a,0x4d19,0xab,0xa8,0x67,0xa1,0x63,0x07,0x3d,0x13);
/* Compared against guidConfigBitstreamEncryption when decoder configurations are scored. */
DEFINE_GUID(DXVA2_NoEncrypt,          0x1b81beD0, 0xa0c7,0x11d3,0xb9,0x84,0x00,0xc0,0x4f,0x2e,0x73,0xc5);
/* All-zero GUID; dxva2_create_decoder() uses it as the "no decoder mode selected" value. */
DEFINE_GUID(GUID_NULL,                0x00000000, 0x0000,0x0000,0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00);
62
/* Associates one DXVA2 decoder mode GUID with the codec it is used for. */
typedef struct dxva2_mode {
  const GUID     *guid;   /* decoder mode GUID; NULL marks the end of the dxva2_modes table */
  enum AVCodecID codec;   /* compared against AVCodecContext.codec_id when picking a mode */
} dxva2_mode;
67
/*
 * Decoder modes this file knows how to use.
 *
 * dxva2_create_decoder() walks the table in array order and stops at the
 * first entry whose codec matches, whose GUID is reported by the device and
 * which offers the required render-target format, so earlier entries take
 * precedence over later ones. The table is terminated by an entry with a
 * NULL guid.
 */
static const dxva2_mode dxva2_modes[] = {
    /* MPEG-2 */
    { &DXVA2_ModeMPEG2_VLD,      AV_CODEC_ID_MPEG2VIDEO },
    { &DXVA2_ModeMPEG2and1_VLD,  AV_CODEC_ID_MPEG2VIDEO },

    /* H.264 */
    { &DXVA2_ModeH264_F,         AV_CODEC_ID_H264 },
    { &DXVA2_ModeH264_E,         AV_CODEC_ID_H264 },
    /* Intel specific H.264 mode */
    { &DXVADDI_Intel_ModeH264_E, AV_CODEC_ID_H264 },

    /* VC-1 / WMV3 */
    { &DXVA2_ModeVC1_D2010,      AV_CODEC_ID_VC1  },
    { &DXVA2_ModeVC1_D2010,      AV_CODEC_ID_WMV3 },
    { &DXVA2_ModeVC1_D,          AV_CODEC_ID_VC1  },
    { &DXVA2_ModeVC1_D,          AV_CODEC_ID_WMV3 },

    /* HEVC/H.265 */
    { &DXVA2_ModeHEVC_VLD_Main,  AV_CODEC_ID_HEVC },
    { &DXVA2_ModeHEVC_VLD_Main10, AV_CODEC_ID_HEVC },

    /* end-of-table sentinel */
    { NULL,                      0 },
};
91
/*
 * Per-input-stream DXVA2 state, stored in InputStream.hwaccel_ctx.
 * Allocated by dxva2_alloc() and freed by dxva2_uninit().
 */
typedef struct DXVA2Context {
    /* NOTE(review): not read or written by any function visible in this file section */
    IDirectXVideoDecoder        *decoder;

    /* mode GUID and configuration chosen by dxva2_create_decoder() on success;
       struct dxva_context.cfg is pointed at decoder_config */
    GUID                        decoder_guid;
    DXVA2_ConfigPictureDecode   decoder_config;
    /* obtained in dxva2_alloc(), released in dxva2_uninit() */
    IDirectXVideoDecoderService *decoder_service;

    /* destination of av_hwframe_transfer_data() in dxva2_retrieve_data() */
    AVFrame                     *tmp_frame;

    /* DXVA2 device context created in dxva2_alloc() */
    AVBufferRef                 *hw_device_ctx;
    /* frames context allocated by dxva2_create_decoder(); dropped at the start
       of every dxva2_init() call before the decoder is (re)created */
    AVBufferRef                 *hw_frames_ctx;
} DXVA2Context;
104
105 static void dxva2_uninit(AVCodecContext *s)
106 {
107     InputStream  *ist = s->opaque;
108     DXVA2Context *ctx = ist->hwaccel_ctx;
109
110     ist->hwaccel_uninit        = NULL;
111     ist->hwaccel_get_buffer    = NULL;
112     ist->hwaccel_retrieve_data = NULL;
113
114     if (ctx->decoder_service)
115         IDirectXVideoDecoderService_Release(ctx->decoder_service);
116
117     av_buffer_unref(&ctx->hw_frames_ctx);
118     av_buffer_unref(&ctx->hw_device_ctx);
119
120     av_frame_free(&ctx->tmp_frame);
121
122     av_freep(&ist->hwaccel_ctx);
123     av_freep(&s->hwaccel_context);
124 }
125
126 static int dxva2_get_buffer(AVCodecContext *s, AVFrame *frame, int flags)
127 {
128     InputStream  *ist = s->opaque;
129     DXVA2Context *ctx = ist->hwaccel_ctx;
130
131     return av_hwframe_get_buffer(ctx->hw_frames_ctx, frame, 0);
132 }
133
134 static int dxva2_retrieve_data(AVCodecContext *s, AVFrame *frame)
135 {
136     InputStream        *ist = s->opaque;
137     DXVA2Context       *ctx = ist->hwaccel_ctx;
138     int                ret;
139
140     ret = av_hwframe_transfer_data(ctx->tmp_frame, frame, 0);
141     if (ret < 0)
142         return ret;
143
144     ret = av_frame_copy_props(ctx->tmp_frame, frame);
145     if (ret < 0) {
146         av_frame_unref(ctx->tmp_frame);
147         return ret;
148     }
149
150     av_frame_unref(frame);
151     av_frame_move_ref(frame, ctx->tmp_frame);
152
153     return 0;
154 }
155
156 static int dxva2_alloc(AVCodecContext *s)
157 {
158     InputStream  *ist = s->opaque;
159     int loglevel = (ist->hwaccel_id == HWACCEL_AUTO) ? AV_LOG_VERBOSE : AV_LOG_ERROR;
160     DXVA2Context *ctx;
161     HANDLE device_handle;
162     HRESULT hr;
163
164     AVHWDeviceContext    *device_ctx;
165     AVDXVA2DeviceContext *device_hwctx;
166     int ret;
167
168     ctx = av_mallocz(sizeof(*ctx));
169     if (!ctx)
170         return AVERROR(ENOMEM);
171
172     ist->hwaccel_ctx           = ctx;
173     ist->hwaccel_uninit        = dxva2_uninit;
174     ist->hwaccel_get_buffer    = dxva2_get_buffer;
175     ist->hwaccel_retrieve_data = dxva2_retrieve_data;
176
177     ret = av_hwdevice_ctx_create(&ctx->hw_device_ctx, AV_HWDEVICE_TYPE_DXVA2,
178                                  ist->hwaccel_device, NULL, 0);
179     if (ret < 0)
180         goto fail;
181     device_ctx   = (AVHWDeviceContext*)ctx->hw_device_ctx->data;
182     device_hwctx = device_ctx->hwctx;
183
184     hr = IDirect3DDeviceManager9_OpenDeviceHandle(device_hwctx->devmgr,
185                                                   &device_handle);
186     if (FAILED(hr)) {
187         av_log(NULL, loglevel, "Failed to open a device handle\n");
188         goto fail;
189     }
190
191     hr = IDirect3DDeviceManager9_GetVideoService(device_hwctx->devmgr, device_handle,
192                                                  &IID_IDirectXVideoDecoderService,
193                                                  (void **)&ctx->decoder_service);
194     IDirect3DDeviceManager9_CloseDeviceHandle(device_hwctx->devmgr, device_handle);
195     if (FAILED(hr)) {
196         av_log(NULL, loglevel, "Failed to create IDirectXVideoDecoderService\n");
197         goto fail;
198     }
199
200     ctx->tmp_frame = av_frame_alloc();
201     if (!ctx->tmp_frame)
202         goto fail;
203
204     s->hwaccel_context = av_mallocz(sizeof(struct dxva_context));
205     if (!s->hwaccel_context)
206         goto fail;
207
208     return 0;
209 fail:
210     dxva2_uninit(s);
211     return AVERROR(EINVAL);
212 }
213
214 static int dxva2_get_decoder_configuration(AVCodecContext *s, const GUID *device_guid,
215                                            const DXVA2_VideoDesc *desc,
216                                            DXVA2_ConfigPictureDecode *config)
217 {
218     InputStream  *ist = s->opaque;
219     int loglevel = (ist->hwaccel_id == HWACCEL_AUTO) ? AV_LOG_VERBOSE : AV_LOG_ERROR;
220     DXVA2Context *ctx = ist->hwaccel_ctx;
221     unsigned cfg_count = 0, best_score = 0;
222     DXVA2_ConfigPictureDecode *cfg_list = NULL;
223     DXVA2_ConfigPictureDecode best_cfg = {{0}};
224     HRESULT hr;
225     int i;
226
227     hr = IDirectXVideoDecoderService_GetDecoderConfigurations(ctx->decoder_service, device_guid, desc, NULL, &cfg_count, &cfg_list);
228     if (FAILED(hr)) {
229         av_log(NULL, loglevel, "Unable to retrieve decoder configurations\n");
230         return AVERROR(EINVAL);
231     }
232
233     for (i = 0; i < cfg_count; i++) {
234         DXVA2_ConfigPictureDecode *cfg = &cfg_list[i];
235
236         unsigned score;
237         if (cfg->ConfigBitstreamRaw == 1)
238             score = 1;
239         else if (s->codec_id == AV_CODEC_ID_H264 && cfg->ConfigBitstreamRaw == 2)
240             score = 2;
241         else
242             continue;
243         if (IsEqualGUID(&cfg->guidConfigBitstreamEncryption, &DXVA2_NoEncrypt))
244             score += 16;
245         if (score > best_score) {
246             best_score = score;
247             best_cfg   = *cfg;
248         }
249     }
250     CoTaskMemFree(cfg_list);
251
252     if (!best_score) {
253         av_log(NULL, loglevel, "No valid decoder configuration available\n");
254         return AVERROR(EINVAL);
255     }
256
257     *config = best_cfg;
258     return 0;
259 }
260
261 static int dxva2_create_decoder(AVCodecContext *s)
262 {
263     InputStream  *ist = s->opaque;
264     int loglevel = (ist->hwaccel_id == HWACCEL_AUTO) ? AV_LOG_VERBOSE : AV_LOG_ERROR;
265     DXVA2Context *ctx = ist->hwaccel_ctx;
266     struct dxva_context *dxva_ctx = s->hwaccel_context;
267     GUID *guid_list = NULL;
268     unsigned guid_count = 0, i, j;
269     GUID device_guid = GUID_NULL;
270     const D3DFORMAT surface_format = s->sw_pix_fmt == AV_PIX_FMT_YUV420P10 ?
271                                      MKTAG('P', '0', '1', '0') : MKTAG('N', 'V', '1', '2');
272     D3DFORMAT target_format = 0;
273     DXVA2_VideoDesc desc = { 0 };
274     DXVA2_ConfigPictureDecode config;
275     HRESULT hr;
276     int surface_alignment, num_surfaces;
277     int ret;
278
279     AVDXVA2FramesContext *frames_hwctx;
280     AVHWFramesContext *frames_ctx;
281
282     hr = IDirectXVideoDecoderService_GetDecoderDeviceGuids(ctx->decoder_service, &guid_count, &guid_list);
283     if (FAILED(hr)) {
284         av_log(NULL, loglevel, "Failed to retrieve decoder device GUIDs\n");
285         goto fail;
286     }
287
288     for (i = 0; dxva2_modes[i].guid; i++) {
289         D3DFORMAT *target_list = NULL;
290         unsigned target_count = 0;
291         const dxva2_mode *mode = &dxva2_modes[i];
292         if (mode->codec != s->codec_id)
293             continue;
294
295         for (j = 0; j < guid_count; j++) {
296             if (IsEqualGUID(mode->guid, &guid_list[j]))
297                 break;
298         }
299         if (j == guid_count)
300             continue;
301
302         hr = IDirectXVideoDecoderService_GetDecoderRenderTargets(ctx->decoder_service, mode->guid, &target_count, &target_list);
303         if (FAILED(hr)) {
304             continue;
305         }
306         for (j = 0; j < target_count; j++) {
307             const D3DFORMAT format = target_list[j];
308             if (format == surface_format) {
309                 target_format = format;
310                 break;
311             }
312         }
313         CoTaskMemFree(target_list);
314         if (target_format) {
315             device_guid = *mode->guid;
316             break;
317         }
318     }
319     CoTaskMemFree(guid_list);
320
321     if (IsEqualGUID(&device_guid, &GUID_NULL)) {
322         av_log(NULL, loglevel, "No decoder device for codec found\n");
323         goto fail;
324     }
325
326     desc.SampleWidth  = s->coded_width;
327     desc.SampleHeight = s->coded_height;
328     desc.Format       = target_format;
329
330     ret = dxva2_get_decoder_configuration(s, &device_guid, &desc, &config);
331     if (ret < 0) {
332         goto fail;
333     }
334
335     /* decoding MPEG-2 requires additional alignment on some Intel GPUs,
336        but it causes issues for H.264 on certain AMD GPUs..... */
337     if (s->codec_id == AV_CODEC_ID_MPEG2VIDEO)
338         surface_alignment = 32;
339     /* the HEVC DXVA2 spec asks for 128 pixel aligned surfaces to ensure
340        all coding features have enough room to work with */
341     else if  (s->codec_id == AV_CODEC_ID_HEVC)
342         surface_alignment = 128;
343     else
344         surface_alignment = 16;
345
346     /* 4 base work surfaces */
347     num_surfaces = 4;
348
349     /* add surfaces based on number of possible refs */
350     if (s->codec_id == AV_CODEC_ID_H264 || s->codec_id == AV_CODEC_ID_HEVC)
351         num_surfaces += 16;
352     else
353         num_surfaces += 2;
354
355     /* add extra surfaces for frame threading */
356     if (s->active_thread_type & FF_THREAD_FRAME)
357         num_surfaces += s->thread_count;
358
359     ctx->hw_frames_ctx = av_hwframe_ctx_alloc(ctx->hw_device_ctx);
360     if (!ctx->hw_frames_ctx)
361         goto fail;
362     frames_ctx   = (AVHWFramesContext*)ctx->hw_frames_ctx->data;
363     frames_hwctx = frames_ctx->hwctx;
364
365     frames_ctx->format            = AV_PIX_FMT_DXVA2_VLD;
366     frames_ctx->sw_format         = s->sw_pix_fmt == AV_PIX_FMT_YUV420P10 ?
367                                     AV_PIX_FMT_P010 : AV_PIX_FMT_NV12;
368     frames_ctx->width             = FFALIGN(s->coded_width, surface_alignment);
369     frames_ctx->height            = FFALIGN(s->coded_height, surface_alignment);
370     frames_ctx->initial_pool_size = num_surfaces;
371
372     frames_hwctx->surface_type = DXVA2_VideoDecoderRenderTarget;
373
374     ret = av_hwframe_ctx_init(ctx->hw_frames_ctx);
375     if (ret < 0) {
376         av_log(NULL, loglevel, "Failed to initialize the HW frames context\n");
377         goto fail;
378     }
379
380     hr = IDirectXVideoDecoderService_CreateVideoDecoder(ctx->decoder_service, &device_guid,
381                                                         &desc, &config, frames_hwctx->surfaces,
382                                                         frames_hwctx->nb_surfaces, &frames_hwctx->decoder_to_release);
383     if (FAILED(hr)) {
384         av_log(NULL, loglevel, "Failed to create DXVA2 video decoder\n");
385         goto fail;
386     }
387
388     ctx->decoder_guid   = device_guid;
389     ctx->decoder_config = config;
390
391     dxva_ctx->cfg           = &ctx->decoder_config;
392     dxva_ctx->decoder       = frames_hwctx->decoder_to_release;
393     dxva_ctx->surface       = frames_hwctx->surfaces;
394     dxva_ctx->surface_count = frames_hwctx->nb_surfaces;
395
396     if (IsEqualGUID(&ctx->decoder_guid, &DXVADDI_Intel_ModeH264_E))
397         dxva_ctx->workaround |= FF_DXVA2_WORKAROUND_INTEL_CLEARVIDEO;
398
399     return 0;
400 fail:
401     av_buffer_unref(&ctx->hw_frames_ctx);
402     return AVERROR(EINVAL);
403 }
404
405 int dxva2_init(AVCodecContext *s)
406 {
407     InputStream *ist = s->opaque;
408     int loglevel = (ist->hwaccel_id == HWACCEL_AUTO) ? AV_LOG_VERBOSE : AV_LOG_ERROR;
409     DXVA2Context *ctx;
410     int ret;
411
412     if (!ist->hwaccel_ctx) {
413         ret = dxva2_alloc(s);
414         if (ret < 0)
415             return ret;
416     }
417     ctx = ist->hwaccel_ctx;
418
419     if (s->codec_id == AV_CODEC_ID_H264 &&
420         (s->profile & ~FF_PROFILE_H264_CONSTRAINED) > FF_PROFILE_H264_HIGH) {
421         av_log(NULL, loglevel, "Unsupported H.264 profile for DXVA2 HWAccel: %d\n", s->profile);
422         return AVERROR(EINVAL);
423     }
424
425     if (s->codec_id == AV_CODEC_ID_HEVC &&
426         s->profile != FF_PROFILE_HEVC_MAIN && s->profile != FF_PROFILE_HEVC_MAIN_10) {
427         av_log(NULL, loglevel, "Unsupported HEVC profile for DXVA2 HWAccel: %d\n", s->profile);
428         return AVERROR(EINVAL);
429     }
430
431     av_buffer_unref(&ctx->hw_frames_ctx);
432
433     ret = dxva2_create_decoder(s);
434     if (ret < 0) {
435         av_log(NULL, loglevel, "Error creating the DXVA2 decoder\n");
436         return ret;
437     }
438
439     return 0;
440 }