From 9850932722eb252fcf685080f14edd8b10c8685e Mon Sep 17 00:00:00 2001 From: wm4 Date: Tue, 17 Jan 2017 08:11:12 +0100 Subject: build: prefix hwaccel decoder wrapper filenames with hw_ Should have done this a long time ago. d3d.c remains as it is, because it's just a bunch of helper functions. --- video/decode/cuda.c | 104 -------- video/decode/d3d11va.c | 584 ----------------------------------------- video/decode/dxva2.c | 542 -------------------------------------- video/decode/hw_cuda.c | 104 ++++++++ video/decode/hw_d3d11va.c | 584 +++++++++++++++++++++++++++++++++++++++++ video/decode/hw_dxva2.c | 542 ++++++++++++++++++++++++++++++++++++++ video/decode/hw_vaapi.c | 226 ++++++++++++++++ video/decode/hw_vaapi_old.c | 443 +++++++++++++++++++++++++++++++ video/decode/hw_vdpau.c | 189 +++++++++++++ video/decode/hw_videotoolbox.c | 228 ++++++++++++++++ video/decode/vaapi.c | 226 ---------------- video/decode/vaapi_old.c | 443 ------------------------------- video/decode/vdpau.c | 189 ------------- video/decode/videotoolbox.c | 228 ---------------- wscript_build.py | 16 +- 15 files changed, 2324 insertions(+), 2324 deletions(-) delete mode 100644 video/decode/cuda.c delete mode 100644 video/decode/d3d11va.c delete mode 100644 video/decode/dxva2.c create mode 100644 video/decode/hw_cuda.c create mode 100644 video/decode/hw_d3d11va.c create mode 100644 video/decode/hw_dxva2.c create mode 100644 video/decode/hw_vaapi.c create mode 100644 video/decode/hw_vaapi_old.c create mode 100644 video/decode/hw_vdpau.c create mode 100644 video/decode/hw_videotoolbox.c delete mode 100644 video/decode/vaapi.c delete mode 100644 video/decode/vaapi_old.c delete mode 100644 video/decode/vdpau.c delete mode 100644 video/decode/videotoolbox.c diff --git a/video/decode/cuda.c b/video/decode/cuda.c deleted file mode 100644 index 92ba0772c4..0000000000 --- a/video/decode/cuda.c +++ /dev/null @@ -1,104 +0,0 @@ -/* - * This file is part of mpv. - * - * Copyright (c) 2016 Philip Langdale - * - * mpv is free software; you can redistribute it and/or - * modify it under the terms of the GNU Lesser General Public - * License as published by the Free Software Foundation; either - * version 2.1 of the License, or (at your option) any later version. - * - * mpv is distributed in the hope that it will be useful, - * but WITHOUT ANY WARRANTY; without even the implied warranty of - * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the - * GNU Lesser General Public License for more details. - * - * You should have received a copy of the GNU Lesser General Public - * License along with mpv. If not, see . - */ - -// This define and typedef prevent hwcontext_cuda.h trying to include cuda.h -#define CUDA_VERSION 7050 -typedef void * CUcontext; - -#include -#include - -#include "common/av_common.h" -#include "video/fmt-conversion.h" -#include "video/decode/lavc.h" - -static int probe(struct lavc_ctx *ctx, struct vd_lavc_hwdec *hwdec, - const char *codec) -{ - if (!hwdec_devices_load(ctx->hwdec_devs, HWDEC_CUDA)) - return HWDEC_ERR_NO_CTX; - return 0; -} - -static int init(struct lavc_ctx *ctx) -{ - ctx->hwdec_priv = hwdec_devices_get(ctx->hwdec_devs, HWDEC_CUDA); - return 0; -} - -static int init_decoder(struct lavc_ctx *ctx, int w, int h) -{ - AVCodecContext *avctx = ctx->avctx; - struct mp_hwdec_ctx *hwctx = ctx->hwdec_priv; - - if (avctx->hw_frames_ctx) { - MP_ERR(ctx, "hw_frames_ctx already initialised!\n"); - return -1; - } - - avctx->hw_frames_ctx = av_hwframe_ctx_alloc(hwctx->av_device_ref); - if (!avctx->hw_frames_ctx) { - MP_ERR(ctx, "av_hwframe_ctx_alloc failed\n"); - goto error; - } - - AVHWFramesContext *hwframe_ctx = (void* )avctx->hw_frames_ctx->data; - hwframe_ctx->format = AV_PIX_FMT_CUDA; - - // This is proper use of the hw_frames_ctx API, but it does not work - // (appaears to work but fails e.g. with 10 bit). The cuvid wrapper - // does non-standard things, and it's a meesy situation. - /* - hwframe_ctx->width = w; - hwframe_ctx->height = h; - hwframe_ctx->sw_format = avctx->sw_pix_fmt; - - if (av_hwframe_ctx_init(avctx->hw_frames_ctx) < 0) - goto error; - */ - - return 0; - - error: - av_buffer_unref(&avctx->hw_frames_ctx); - return -1; -} - -static void uninit(struct lavc_ctx *ctx) -{ - ctx->hwdec_priv = NULL; -} - -static struct mp_image *process_image(struct lavc_ctx *ctx, struct mp_image *img) -{ - if (img->imgfmt == IMGFMT_CUDA) - img->params.hw_subfmt = pixfmt2imgfmt(ctx->avctx->sw_pix_fmt); - return img; -} - -const struct vd_lavc_hwdec mp_vd_lavc_cuda = { - .type = HWDEC_CUDA, - .image_format = IMGFMT_CUDA, - .lavc_suffix = "_cuvid", - .probe = probe, - .init = init, - .uninit = uninit, - .init_decoder = init_decoder, - .process_image = process_image, -}; diff --git a/video/decode/d3d11va.c b/video/decode/d3d11va.c deleted file mode 100644 index a69a3890bd..0000000000 --- a/video/decode/d3d11va.c +++ /dev/null @@ -1,584 +0,0 @@ -/* - * This file is part of mpv. - * - * mpv is free software; you can redistribute it and/or - * modify it under the terms of the GNU Lesser General Public - * License as published by the Free Software Foundation; either - * version 2.1 of the License, or (at your option) any later version. - * - * mpv is distributed in the hope that it will be useful, - * but WITHOUT ANY WARRANTY; without even the implied warranty of - * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the - * GNU Lesser General Public License for more details. - * - * You should have received a copy of the GNU Lesser General Public - * License along with mpv. If not, see . - */ - -#include - -#include "lavc.h" -#include "common/common.h" -#include "common/av_common.h" -#include "osdep/windows_utils.h" -#include "video/fmt-conversion.h" -#include "video/mp_image_pool.h" -#include "video/hwdec.h" - -#include "d3d.h" - -#define ADDITIONAL_SURFACES (HWDEC_EXTRA_SURFACES + HWDEC_DELAY_QUEUE_COUNT) - -struct d3d11va_decoder { - ID3D11VideoDecoder *decoder; - struct mp_image_pool *pool; - ID3D11Texture2D *staging; - int mpfmt_decoded; -}; - -struct priv { - struct mp_log *log; - - ID3D11Device *device; - ID3D11DeviceContext *device_ctx; - ID3D11VideoDevice *video_dev; - ID3D11VideoContext *video_ctx; - - struct d3d11va_decoder *decoder; - struct mp_image_pool *sw_pool; -}; - -struct d3d11va_surface { - ID3D11Texture2D *texture; - ID3D11VideoDecoderOutputView *surface; -}; - -static void d3d11va_release_img(void *arg) -{ - struct d3d11va_surface *surface = arg; - if (surface->surface) - ID3D11VideoDecoderOutputView_Release(surface->surface); - - if (surface->texture) - ID3D11Texture2D_Release(surface->texture); - - talloc_free(surface); -} - -static struct mp_image *d3d11va_new_ref(ID3D11VideoDecoderOutputView *view, - int w, int h) -{ - if (!view) - return NULL; - struct d3d11va_surface *surface = talloc_zero(NULL, struct d3d11va_surface); - - surface->surface = view; - ID3D11VideoDecoderOutputView_AddRef(surface->surface); - ID3D11VideoDecoderOutputView_GetResource( - surface->surface, (ID3D11Resource **)&surface->texture); - - D3D11_VIDEO_DECODER_OUTPUT_VIEW_DESC surface_desc; - ID3D11VideoDecoderOutputView_GetDesc(surface->surface, &surface_desc); - - struct mp_image *mpi = - mp_image_new_custom_ref(NULL, surface, d3d11va_release_img); - if (!mpi) - abort(); - - mp_image_setfmt(mpi, IMGFMT_D3D11VA); - mp_image_set_size(mpi, w, h); - mpi->planes[0] = NULL; - mpi->planes[1] = (void *)surface->texture; - mpi->planes[2] = (void *)(intptr_t)surface_desc.Texture2D.ArraySlice; - mpi->planes[3] = (void *)surface->surface; - - return mpi; -} - -static struct mp_image *d3d11va_allocate_image(struct lavc_ctx *s, int w, int h) -{ - struct priv *p = s->hwdec_priv; - struct mp_image *img = mp_image_pool_get_no_alloc(p->decoder->pool, - IMGFMT_D3D11VA, w, h); - if (!img) - MP_ERR(p, "Failed to get free D3D11VA surface\n"); - return img; -} - -static struct mp_image *d3d11va_retrieve_image(struct lavc_ctx *s, - struct mp_image *img) -{ - HRESULT hr; - struct priv *p = s->hwdec_priv; - ID3D11Texture2D *staging = p->decoder->staging; - - if (img->imgfmt != IMGFMT_D3D11VA) - return img; - - ID3D11Texture2D *texture = (void *)img->planes[1]; - int subindex = (intptr_t)img->planes[2]; - - if (!texture) { - MP_ERR(p, "Failed to get Direct3D texture and surface from mp_image\n"); - return img; - } - - D3D11_TEXTURE2D_DESC texture_desc; - ID3D11Texture2D_GetDesc(texture, &texture_desc); - if (texture_desc.Width < img->w || texture_desc.Height < img->h) { - MP_ERR(p, "Direct3D11 texture smaller than mp_image dimensions\n"); - return img; - } - - // copy to the staging texture - ID3D11DeviceContext_CopySubresourceRegion( - p->device_ctx, - (ID3D11Resource *)staging, 0, 0, 0, 0, - (ID3D11Resource *)texture, subindex, NULL); - - struct mp_image *sw_img = mp_image_pool_get(p->sw_pool, - p->decoder->mpfmt_decoded, - texture_desc.Width, - texture_desc.Height); - if (!sw_img) { - MP_ERR(p, "Failed to get %s surface from CPU pool\n", - mp_imgfmt_to_name(p->decoder->mpfmt_decoded)); - return img; - } - - // copy staging texture to the cpu mp_image - D3D11_MAPPED_SUBRESOURCE lock; - hr = ID3D11DeviceContext_Map(p->device_ctx, (ID3D11Resource *)staging, - 0, D3D11_MAP_READ, 0, &lock); - if (FAILED(hr)) { - MP_ERR(p, "Failed to map D3D11 surface: %s\n", mp_HRESULT_to_str(hr)); - talloc_free(sw_img); - return img; - } - copy_nv12(sw_img, lock.pData, lock.RowPitch, texture_desc.Height); - ID3D11DeviceContext_Unmap(p->device_ctx, (ID3D11Resource *)staging, 0); - - mp_image_set_size(sw_img, img->w, img->h); - mp_image_copy_attributes(sw_img, img); - talloc_free(img); - return sw_img; -} - -#define DFMT(name) MP_CONCAT(DXGI_FORMAT_, name), # name -static const struct d3d_decoded_format d3d11_formats[] = { - {DFMT(NV12), 8, IMGFMT_NV12}, - {DFMT(P010), 10, IMGFMT_P010}, - {DFMT(P016), 16, IMGFMT_P010}, -}; -#undef DFMT - -// Update hw_subfmt to the underlying format. Needed because AVFrame does not -// have such an attribute, so it can't be passed through, and is updated here -// instead. (But in the future, AVHWFramesContext could be used.) -static struct mp_image *d3d11va_update_image_attribs(struct lavc_ctx *s, - struct mp_image *img) -{ - ID3D11Texture2D *texture = (void *)img->planes[1]; - - if (!texture) - return img; - - D3D11_TEXTURE2D_DESC texture_desc; - ID3D11Texture2D_GetDesc(texture, &texture_desc); - for (int n = 0; n < MP_ARRAY_SIZE(d3d11_formats); n++) { - if (d3d11_formats[n].dxfmt == texture_desc.Format) { - img->params.hw_subfmt = d3d11_formats[n].mpfmt; - break; - } - } - - if (img->params.hw_subfmt == IMGFMT_NV12) - mp_image_setfmt(img, IMGFMT_D3D11NV12); - - return img; -} - -static bool d3d11_format_supported(struct lavc_ctx *s, const GUID *guid, - const struct d3d_decoded_format *format) -{ - struct priv *p = s->hwdec_priv; - BOOL is_supported = FALSE; - HRESULT hr = ID3D11VideoDevice_CheckVideoDecoderFormat( - p->video_dev, guid, format->dxfmt, &is_supported); - if (FAILED(hr)) { - MP_ERR(p, "Check decoder output format %s for decoder %s: %s\n", - format->name, d3d_decoder_guid_to_desc(guid), - mp_HRESULT_to_str(hr)); - } - return is_supported; -} - -static void dump_decoder_info(struct lavc_ctx *s, const GUID *guid) -{ - struct priv *p = s->hwdec_priv; - char fmts[256] = {0}; - for (int i = 0; i < MP_ARRAY_SIZE(d3d11_formats); i++) { - const struct d3d_decoded_format *format = &d3d11_formats[i]; - if (d3d11_format_supported(s, guid, format)) - mp_snprintf_cat(fmts, sizeof(fmts), " %s", format->name); - } - MP_VERBOSE(p, "%s %s\n", d3d_decoder_guid_to_desc(guid), fmts); -} - -static void d3d11va_destroy_decoder(void *arg) -{ - struct d3d11va_decoder *decoder = arg; - - if (decoder->decoder) - ID3D11VideoDecoder_Release(decoder->decoder); - - if (decoder->staging) - ID3D11Texture2D_Release(decoder->staging); -} - -static int d3d11va_init_decoder(struct lavc_ctx *s, int w, int h) -{ - HRESULT hr; - int ret = -1; - struct priv *p = s->hwdec_priv; - TA_FREEP(&p->decoder); - - ID3D11Texture2D *texture = NULL; - void *tmp = talloc_new(NULL); - - UINT n_guids = ID3D11VideoDevice_GetVideoDecoderProfileCount(p->video_dev); - GUID *device_guids = talloc_array(tmp, GUID, n_guids); - for (UINT i = 0; i < n_guids; i++) { - GUID *guid = &device_guids[i]; - hr = ID3D11VideoDevice_GetVideoDecoderProfile(p->video_dev, i, guid); - if (FAILED(hr)) { - MP_ERR(p, "Failed to get VideoDecoderProfile %d: %s\n", - i, mp_HRESULT_to_str(hr)); - goto done; - } - dump_decoder_info(s, guid); - } - - struct d3d_decoder_fmt fmt = - d3d_select_decoder_mode(s, device_guids, n_guids, - d3d11_formats, MP_ARRAY_SIZE(d3d11_formats), - d3d11_format_supported); - if (!fmt.format) { - MP_ERR(p, "Failed to find a suitable decoder\n"); - goto done; - } - - struct d3d11va_decoder *decoder = talloc_zero(tmp, struct d3d11va_decoder); - talloc_set_destructor(decoder, d3d11va_destroy_decoder); - decoder->mpfmt_decoded = fmt.format->mpfmt; - - int n_surfaces = hwdec_get_max_refs(s) + ADDITIONAL_SURFACES; - int w_align = w, h_align = h; - d3d_surface_align(s, &w_align, &h_align); - - D3D11_TEXTURE2D_DESC tex_desc = { - .Width = w_align, - .Height = h_align, - .MipLevels = 1, - .Format = fmt.format->dxfmt, - .SampleDesc.Count = 1, - .MiscFlags = 0, - .ArraySize = n_surfaces, - .Usage = D3D11_USAGE_DEFAULT, - .BindFlags = D3D11_BIND_DECODER | D3D11_BIND_SHADER_RESOURCE, - .CPUAccessFlags = 0, - }; - hr = ID3D11Device_CreateTexture2D(p->device, &tex_desc, NULL, &texture); - if (FAILED(hr)) { - MP_ERR(p, "Failed to create Direct3D11 texture with %d surfaces: %s\n", - n_surfaces, mp_HRESULT_to_str(hr)); - goto done; - } - - if (s->hwdec->type == HWDEC_D3D11VA_COPY) { - // create staging texture shared with the CPU with mostly the same - // parameters as the above decoder-bound texture - ID3D11Texture2D_GetDesc(texture, &tex_desc); - tex_desc.MipLevels = 1; - tex_desc.MiscFlags = 0; - tex_desc.ArraySize = 1; - tex_desc.Usage = D3D11_USAGE_STAGING; - tex_desc.CPUAccessFlags = D3D11_CPU_ACCESS_READ; - tex_desc.BindFlags = 0; - hr = ID3D11Device_CreateTexture2D(p->device, &tex_desc, NULL, - &decoder->staging); - if (FAILED(hr)) { - MP_ERR(p, "Failed to create staging texture: %s\n", - mp_HRESULT_to_str(hr)); - goto done; - } - } - - // pool to hold the mp_image wrapped surfaces - decoder->pool = talloc_steal(decoder, mp_image_pool_new(n_surfaces)); - // array of the same surfaces (needed by ffmpeg) - ID3D11VideoDecoderOutputView **surfaces = - talloc_array_ptrtype(decoder->pool, surfaces, n_surfaces); - - D3D11_VIDEO_DECODER_OUTPUT_VIEW_DESC view_desc = { - .DecodeProfile = *fmt.guid, - .ViewDimension = D3D11_VDOV_DIMENSION_TEXTURE2D, - }; - for (int i = 0; i < n_surfaces; i++) { - ID3D11VideoDecoderOutputView **surface = &surfaces[i]; - view_desc.Texture2D.ArraySlice = i; - hr = ID3D11VideoDevice_CreateVideoDecoderOutputView( - p->video_dev, (ID3D11Resource *)texture, &view_desc, surface); - if (FAILED(hr)) { - MP_ERR(p, "Failed getting decoder output view %d: %s\n", - i, mp_HRESULT_to_str(hr)); - goto done; - } - struct mp_image *img = d3d11va_new_ref(*surface, w, h); - ID3D11VideoDecoderOutputView_Release(*surface); // transferred to img - if (!img) { - MP_ERR(p, "Failed to create D3D11VA image %d\n", i); - goto done; - } - mp_image_pool_add(decoder->pool, img); // transferred to pool - } - - D3D11_VIDEO_DECODER_DESC decoder_desc = { - .Guid = *fmt.guid, - .SampleWidth = w, - .SampleHeight = h, - .OutputFormat = fmt.format->dxfmt, - }; - UINT n_cfg; - hr = ID3D11VideoDevice_GetVideoDecoderConfigCount(p->video_dev, - &decoder_desc, &n_cfg); - if (FAILED(hr)) { - MP_ERR(p, "Failed to get number of decoder configurations: %s)", - mp_HRESULT_to_str(hr)); - goto done; - } - - // pick the config with the highest score - D3D11_VIDEO_DECODER_CONFIG *decoder_config = - talloc_zero(decoder, D3D11_VIDEO_DECODER_CONFIG); - unsigned max_score = 0; - for (UINT i = 0; i < n_cfg; i++) { - D3D11_VIDEO_DECODER_CONFIG cfg; - hr = ID3D11VideoDevice_GetVideoDecoderConfig(p->video_dev, - &decoder_desc, - i, &cfg); - if (FAILED(hr)) { - MP_ERR(p, "Failed to get decoder config %d: %s\n", - i, mp_HRESULT_to_str(hr)); - goto done; - } - unsigned score = d3d_decoder_config_score( - s, &cfg.guidConfigBitstreamEncryption, cfg.ConfigBitstreamRaw); - if (score > max_score) { - max_score = score; - *decoder_config = cfg; - } - } - if (!max_score) { - MP_ERR(p, "Failed to find a suitable decoder configuration\n"); - goto done; - } - - hr = ID3D11VideoDevice_CreateVideoDecoder(p->video_dev, &decoder_desc, - decoder_config, - &decoder->decoder); - if (FAILED(hr)) { - MP_ERR(p, "Failed to create video decoder: %s\n", - mp_HRESULT_to_str(hr)); - goto done; - } - - struct AVD3D11VAContext *avd3d11va_ctx = s->avctx->hwaccel_context; - avd3d11va_ctx->decoder = decoder->decoder; - avd3d11va_ctx->video_context = p->video_ctx; - avd3d11va_ctx->cfg = decoder_config; - avd3d11va_ctx->surface_count = n_surfaces; - avd3d11va_ctx->surface = surfaces; - avd3d11va_ctx->workaround = is_clearvideo(fmt.guid) ? - FF_DXVA2_WORKAROUND_INTEL_CLEARVIDEO : 0; - - p->decoder = talloc_steal(NULL, decoder); - ret = 0; -done: - // still referenced by pool images / surfaces - if (texture) - ID3D11Texture2D_Release(texture); - - talloc_free(tmp); - return ret; -} - -static void destroy_device(struct lavc_ctx *s) -{ - struct priv *p = s->hwdec_priv; - - if (p->device) - ID3D11Device_Release(p->device); - - if (p->device_ctx) - ID3D11DeviceContext_Release(p->device_ctx); -} - -static bool create_device(struct lavc_ctx *s, BOOL thread_safe) -{ - HRESULT hr; - struct priv *p = s->hwdec_priv; - - if (!d3d11_dll) { - MP_ERR(p, "Failed to load D3D11 library\n"); - return false; - } - - PFN_D3D11_CREATE_DEVICE CreateDevice = - (void *)GetProcAddress(d3d11_dll, "D3D11CreateDevice"); - if (!CreateDevice) { - MP_ERR(p, "Failed to get D3D11CreateDevice symbol from DLL: %s\n", - mp_LastError_to_str()); - return false; - } - - hr = CreateDevice(NULL, D3D_DRIVER_TYPE_HARDWARE, NULL, - D3D11_CREATE_DEVICE_VIDEO_SUPPORT, NULL, 0, - D3D11_SDK_VERSION, &p->device, NULL, &p->device_ctx); - if (FAILED(hr)) { - MP_ERR(p, "Failed to create D3D11 Device: %s\n", - mp_HRESULT_to_str(hr)); - return false; - } - - ID3D10Multithread *multithread; - hr = ID3D11Device_QueryInterface(p->device, &IID_ID3D10Multithread, - (void **)&multithread); - if (FAILED(hr)) { - MP_ERR(p, "Failed to get Multithread interface: %s\n", - mp_HRESULT_to_str(hr)); - return false; - } - ID3D10Multithread_SetMultithreadProtected(multithread, thread_safe); - ID3D10Multithread_Release(multithread); - return true; -} - -static void d3d11va_uninit(struct lavc_ctx *s) -{ - struct priv *p = s->hwdec_priv; - if (!p) - return; - - talloc_free(p->decoder); - av_freep(&s->avctx->hwaccel_context); - - if (p->video_dev) - ID3D11VideoDevice_Release(p->video_dev); - - if (p->video_ctx) - ID3D11VideoContext_Release(p->video_ctx); - - destroy_device(s); - - TA_FREEP(&s->hwdec_priv); -} - -static int d3d11va_init(struct lavc_ctx *s) -{ - HRESULT hr; - struct priv *p = talloc_zero(NULL, struct priv); - if (!p) - return -1; - - // Unconditionally load Direct3D DLLs, even when using a VO-supplied D3D11 - // device. This prevents a crash that occurs at least with NVIDIA drivers, - // where D3D objects are accessed after ANGLE unloads d3d11.dll. - d3d_load_dlls(); - - s->hwdec_priv = p; - p->log = mp_log_new(s, s->log, "d3d11va"); - if (s->hwdec->type == HWDEC_D3D11VA_COPY) { - mp_check_gpu_memcpy(p->log, NULL); - p->sw_pool = talloc_steal(p, mp_image_pool_new(17)); - } - - p->device = hwdec_devices_load(s->hwdec_devs, s->hwdec->type); - if (p->device) { - ID3D11Device_AddRef(p->device); - ID3D11Device_GetImmediateContext(p->device, &p->device_ctx); - if (!p->device_ctx) - goto fail; - MP_VERBOSE(p, "Using VO-supplied device %p.\n", p->device); - } else if (s->hwdec->type == HWDEC_D3D11VA) { - MP_ERR(p, "No Direct3D device provided for native d3d11 decoding\n"); - goto fail; - } else { - if (!create_device(s, FALSE)) - goto fail; - } - - hr = ID3D11DeviceContext_QueryInterface(p->device_ctx, - &IID_ID3D11VideoContext, - (void **)&p->video_ctx); - if (FAILED(hr)) { - MP_ERR(p, "Failed to get VideoContext interface: %s\n", - mp_HRESULT_to_str(hr)); - goto fail; - } - - hr = ID3D11Device_QueryInterface(p->device, - &IID_ID3D11VideoDevice, - (void **)&p->video_dev); - if (FAILED(hr)) { - MP_ERR(p, "Failed to get VideoDevice interface. %s\n", - mp_HRESULT_to_str(hr)); - goto fail; - } - - s->avctx->hwaccel_context = av_d3d11va_alloc_context(); - if (!s->avctx->hwaccel_context) { - MP_ERR(p, "Failed to allocate hwaccel_context\n"); - goto fail; - } - - return 0; -fail: - d3d11va_uninit(s); - return -1; -} - -static int d3d11va_probe(struct lavc_ctx *ctx, struct vd_lavc_hwdec *hwdec, - const char *codec) -{ - // d3d11va-copy can do without external context; dxva2 requires it. - if (hwdec->type != HWDEC_D3D11VA_COPY) { - if (!hwdec_devices_load(ctx->hwdec_devs, HWDEC_D3D11VA)) - return HWDEC_ERR_NO_CTX; - } - return d3d_probe_codec(codec); -} - -const struct vd_lavc_hwdec mp_vd_lavc_d3d11va = { - .type = HWDEC_D3D11VA, - .image_format = IMGFMT_D3D11VA, - .probe = d3d11va_probe, - .init = d3d11va_init, - .uninit = d3d11va_uninit, - .init_decoder = d3d11va_init_decoder, - .allocate_image = d3d11va_allocate_image, - .process_image = d3d11va_update_image_attribs, -}; - -const struct vd_lavc_hwdec mp_vd_lavc_d3d11va_copy = { - .type = HWDEC_D3D11VA_COPY, - .copying = true, - .image_format = IMGFMT_D3D11VA, - .probe = d3d11va_probe, - .init = d3d11va_init, - .uninit = d3d11va_uninit, - .init_decoder = d3d11va_init_decoder, - .allocate_image = d3d11va_allocate_image, - .process_image = d3d11va_retrieve_image, - .delay_queue = HWDEC_DELAY_QUEUE_COUNT, -}; diff --git a/video/decode/dxva2.c b/video/decode/dxva2.c deleted file mode 100644 index c6a34a2e70..0000000000 --- a/video/decode/dxva2.c +++ /dev/null @@ -1,542 +0,0 @@ -/* - * Ported from FFmpeg ffmpeg_dxva2.c (2dbee1a3935a91842c22eb65fd13f77e8d590e07). - * Original copyright header follows: - * - * This file is part of FFmpeg. - * - * FFmpeg is free software; you can redistribute it and/or - * modify it under the terms of the GNU Lesser General Public - * License as published by the Free Software Foundation; either - * version 2.1 of the License, or (at your option) any later version. - * - * FFmpeg is distributed in the hope that it will be useful, - * but WITHOUT ANY WARRANTY; without even the implied warranty of - * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU - * Lesser General Public License for more details. - * - * You should have received a copy of the GNU Lesser General Public - * License along with FFmpeg; if not, write to the Free Software - * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA - */ - -#define DXVA2API_USE_BITFIELDS -#include - -#include "lavc.h" -#include "common/common.h" -#include "common/av_common.h" -#include "osdep/windows_utils.h" -#include "video/fmt-conversion.h" -#include "video/mp_image_pool.h" -#include "video/hwdec.h" - -#include "d3d.h" - -#define ADDITIONAL_SURFACES (HWDEC_EXTRA_SURFACES + HWDEC_DELAY_QUEUE_COUNT) - -struct priv { - struct mp_log *log; - - IDirect3D9 *d3d9; - IDirect3DDevice9 *device; - HANDLE device_handle; - IDirect3DDeviceManager9 *device_manager; - IDirectXVideoDecoderService *decoder_service; - - struct mp_image_pool *decoder_pool; - struct mp_image_pool *sw_pool; - int mpfmt_decoded; -}; - -struct dxva2_surface { - IDirectXVideoDecoder *decoder; - IDirect3DSurface9 *surface; -}; - -static void dxva2_release_img(void *arg) -{ - struct dxva2_surface *surface = arg; - if (surface->surface) - IDirect3DSurface9_Release(surface->surface); - - if (surface->decoder) - IDirectXVideoDecoder_Release(surface->decoder); - - talloc_free(surface); -} - -static struct mp_image *dxva2_new_ref(IDirectXVideoDecoder *decoder, - IDirect3DSurface9 *d3d9_surface, - int w, int h) -{ - if (!decoder || !d3d9_surface) - return NULL; - struct dxva2_surface *surface = talloc_zero(NULL, struct dxva2_surface); - - surface->surface = d3d9_surface; - IDirect3DSurface9_AddRef(surface->surface); - surface->decoder = decoder; - IDirectXVideoDecoder_AddRef(surface->decoder); - - struct mp_image *mpi = - mp_image_new_custom_ref(NULL, surface, dxva2_release_img); - if (!mpi) - abort(); - - mp_image_setfmt(mpi, IMGFMT_DXVA2); - mp_image_set_size(mpi, w, h); - mpi->planes[3] = (void *)surface->surface; - return mpi; -} - -static struct mp_image *dxva2_allocate_image(struct lavc_ctx *s, int w, int h) -{ - struct priv *p = s->hwdec_priv; - struct mp_image *img = mp_image_pool_get_no_alloc(p->decoder_pool, - IMGFMT_DXVA2, w, h); - if (!img) - MP_ERR(p, "Failed to allocate additional DXVA2 surface.\n"); - return img; -} - -static struct mp_image *dxva2_retrieve_image(struct lavc_ctx *s, - struct mp_image *img) -{ - HRESULT hr; - struct priv *p = s->hwdec_priv; - IDirect3DSurface9 *surface = img->imgfmt == IMGFMT_DXVA2 ? - (IDirect3DSurface9 *)img->planes[3] : NULL; - - if (!surface) { - MP_ERR(p, "Failed to get Direct3D surface from mp_image\n"); - return img; - } - - D3DSURFACE_DESC surface_desc; - IDirect3DSurface9_GetDesc(surface, &surface_desc); - if (surface_desc.Width < img->w || surface_desc.Height < img->h) { - MP_ERR(p, "Direct3D11 texture smaller than mp_image dimensions\n"); - return img; - } - - struct mp_image *sw_img = mp_image_pool_get(p->sw_pool, - p->mpfmt_decoded, - surface_desc.Width, - surface_desc.Height); - if (!sw_img) { - MP_ERR(p, "Failed to get %s surface from CPU pool\n", - mp_imgfmt_to_name(p->mpfmt_decoded)); - return img; - } - - D3DLOCKED_RECT lock; - hr = IDirect3DSurface9_LockRect(surface, &lock, NULL, D3DLOCK_READONLY); - if (FAILED(hr)) { - MP_ERR(p, "Unable to lock DXVA2 surface: %s\n", - mp_HRESULT_to_str(hr)); - talloc_free(sw_img); - return img; - } - copy_nv12(sw_img, lock.pBits, lock.Pitch, surface_desc.Height); - IDirect3DSurface9_UnlockRect(surface); - - mp_image_set_size(sw_img, img->w, img->h); - mp_image_copy_attributes(sw_img, img); - talloc_free(img); - return sw_img; -} - -static const struct d3d_decoded_format d3d9_formats[] = { - {MKTAG('N','V','1','2'), "NV12", 8, IMGFMT_NV12}, - {MKTAG('P','0','1','0'), "P010", 10, IMGFMT_P010}, - {MKTAG('P','0','1','6'), "P016", 16, IMGFMT_P010}, -}; - -static void dump_decoder_info(struct lavc_ctx *s, - GUID *device_guids, UINT n_guids) -{ - struct priv *p = s->hwdec_priv; - MP_VERBOSE(p, "%u decoder devices:\n", (unsigned)n_guids); - for (UINT i = 0; i < n_guids; i++) { - GUID *guid = &device_guids[i]; - char *description = d3d_decoder_guid_to_desc(guid); - - D3DFORMAT *formats = NULL; - UINT n_formats = 0; - HRESULT hr = IDirectXVideoDecoderService_GetDecoderRenderTargets( - p->decoder_service, guid, &n_formats, &formats); - if (FAILED(hr)) { - MP_ERR(p, "Failed to get render targets for decoder %s:%s\n", - description, mp_HRESULT_to_str(hr)); - } - - char fmts[256] = {0}; - for (UINT j = 0; j < n_formats; j++) { - mp_snprintf_cat(fmts, sizeof(fmts), - " %s", mp_tag_str(formats[j])); - } - CoTaskMemFree(formats); - - MP_VERBOSE(p, "%s %s\n", description, fmts); - } -} - -static bool dxva2_format_supported(struct lavc_ctx *s, const GUID *guid, - const struct d3d_decoded_format *format) -{ - bool ret = false; - struct priv *p = s->hwdec_priv; - D3DFORMAT *formats = NULL; - UINT n_formats = 0; - HRESULT hr = IDirectXVideoDecoderService_GetDecoderRenderTargets( - p->decoder_service, guid, &n_formats, &formats); - if (FAILED(hr)) { - MP_ERR(p, "Callback failed to get render targets for decoder %s: %s", - d3d_decoder_guid_to_desc(guid), mp_HRESULT_to_str(hr)); - return 0; - } - - for (int i = 0; i < n_formats; i++) { - ret = formats[i] == format->dxfmt; - if (ret) - break; - } - - CoTaskMemFree(formats); - return ret; -} - -static int dxva2_init_decoder(struct lavc_ctx *s, int w, int h) -{ - HRESULT hr; - int ret = -1; - struct priv *p = s->hwdec_priv; - TA_FREEP(&p->decoder_pool); - - int n_surfaces = hwdec_get_max_refs(s) + ADDITIONAL_SURFACES; - IDirect3DSurface9 **surfaces = NULL; - IDirectXVideoDecoder *decoder = NULL; - void *tmp = talloc_new(NULL); - - UINT n_guids; - GUID *device_guids; - hr = IDirectXVideoDecoderService_GetDecoderDeviceGuids( - p->decoder_service, &n_guids, &device_guids); - if (FAILED(hr)) { - MP_ERR(p, "Failed to retrieve decoder device GUIDs: %s\n", - mp_HRESULT_to_str(hr)); - goto done; - } - - dump_decoder_info(s, device_guids, n_guids); - - struct d3d_decoder_fmt fmt = - d3d_select_decoder_mode(s, device_guids, n_guids, - d3d9_formats, MP_ARRAY_SIZE(d3d9_formats), - dxva2_format_supported); - CoTaskMemFree(device_guids); - if (!fmt.format) { - MP_ERR(p, "Failed to find a suitable decoder\n"); - goto done; - } - - p->mpfmt_decoded = fmt.format->mpfmt; - struct mp_image_pool *decoder_pool = - talloc_steal(tmp, mp_image_pool_new(n_surfaces)); - DXVA2_ConfigPictureDecode *decoder_config = - talloc_zero(decoder_pool, DXVA2_ConfigPictureDecode); - - int w_align = w, h_align = h; - d3d_surface_align(s, &w_align, &h_align); - DXVA2_VideoDesc video_desc ={ - .SampleWidth = w, - .SampleHeight = h, - .Format = fmt.format->dxfmt, - }; - UINT n_configs = 0; - DXVA2_ConfigPictureDecode *configs = NULL; - hr = IDirectXVideoDecoderService_GetDecoderConfigurations( - p->decoder_service, fmt.guid, &video_desc, NULL, - &n_configs, &configs); - if (FAILED(hr)) { - MP_ERR(p, "Unable to retrieve decoder configurations: %s\n", - mp_HRESULT_to_str(hr)); - goto done; - } - - unsigned max_score = 0; - for (UINT i = 0; i < n_configs; i++) { - unsigned score = d3d_decoder_config_score( - s, &configs[i].guidConfigBitstreamEncryption, - configs[i].ConfigBitstreamRaw); - if (score > max_score) { - max_score = score; - *decoder_config = configs[i]; - } - } - CoTaskMemFree(configs); - if (!max_score) { - MP_ERR(p, "Failed to find a suitable decoder configuration\n"); - goto done; - } - - surfaces = talloc_zero_array(decoder_pool, IDirect3DSurface9*, n_surfaces); - hr = IDirectXVideoDecoderService_CreateSurface( - p->decoder_service, - w_align, h_align, - n_surfaces - 1, fmt.format->dxfmt, D3DPOOL_DEFAULT, 0, - DXVA2_VideoDecoderRenderTarget, surfaces, NULL); - if (FAILED(hr)) { - MP_ERR(p, "Failed to create %d video surfaces: %s\n", - n_surfaces, mp_HRESULT_to_str(hr)); - goto done; - } - - hr = IDirectXVideoDecoderService_CreateVideoDecoder( - p->decoder_service, fmt.guid, &video_desc, decoder_config, - surfaces, n_surfaces, &decoder); - if (FAILED(hr)) { - MP_ERR(p, "Failed to create DXVA2 video decoder: %s\n", - mp_HRESULT_to_str(hr)); - goto done; - } - - for (int i = 0; i < n_surfaces; i++) { - struct mp_image *img = dxva2_new_ref(decoder, surfaces[i], w, h); - if (!img) { - MP_ERR(p, "Failed to create DXVA2 image\n"); - goto done; - } - mp_image_pool_add(decoder_pool, img); // transferred to pool - } - - // Pass required information on to ffmpeg. - struct dxva_context *dxva_ctx = s->avctx->hwaccel_context; - dxva_ctx->cfg = decoder_config; - dxva_ctx->decoder = decoder; - dxva_ctx->surface_count = n_surfaces; - dxva_ctx->surface = surfaces; - dxva_ctx->workaround = is_clearvideo(fmt.guid) ? - FF_DXVA2_WORKAROUND_INTEL_CLEARVIDEO : 0; - - p->decoder_pool = talloc_steal(NULL, decoder_pool); - ret = 0; -done: - // On success, `p->decoder_pool` mp_images still hold refs to `surfaces` and - // `decoder`, so the pointers in the ffmpeg `dxva_context` strcture remain - // valid for the lifetime of the pool. - if (surfaces) { - for (int i = 0; i < n_surfaces; i++) - IDirect3DSurface9_Release(surfaces[i]); - } - if (decoder) - IDirectXVideoDecoder_Release(decoder); - - talloc_free(tmp); - return ret; -} - -static void destroy_device(struct lavc_ctx *s) -{ - struct priv *p = s->hwdec_priv; - - if (p->device) - IDirect3DDevice9_Release(p->device); - - if (p->d3d9) - IDirect3D9_Release(p->d3d9); -} - -static bool create_device(struct lavc_ctx *s) -{ - struct priv *p = s->hwdec_priv; - - d3d_load_dlls(); - if (!d3d9_dll) { - MP_ERR(p, "Failed to load D3D9 library\n"); - return false; - } - - IDirect3D9* (WINAPI *Direct3DCreate9)(UINT) = - (void *)GetProcAddress(d3d9_dll, "Direct3DCreate9"); - if (!Direct3DCreate9) { - MP_ERR(p, "Failed to locate Direct3DCreate9\n"); - return false; - } - - p->d3d9 = Direct3DCreate9(D3D_SDK_VERSION); - if (!p->d3d9) { - MP_ERR(p, "Failed to create IDirect3D object\n"); - return false; - } - - UINT adapter = D3DADAPTER_DEFAULT; - D3DDISPLAYMODE display_mode; - IDirect3D9_GetAdapterDisplayMode(p->d3d9, adapter, &display_mode); - D3DPRESENT_PARAMETERS present_params = { - .Windowed = TRUE, - .BackBufferWidth = 640, - .BackBufferHeight = 480, - .BackBufferCount = 0, - .BackBufferFormat = display_mode.Format, - .SwapEffect = D3DSWAPEFFECT_DISCARD, - .Flags = D3DPRESENTFLAG_VIDEO, - }; - HRESULT hr = IDirect3D9_CreateDevice(p->d3d9, adapter, - D3DDEVTYPE_HAL, - GetShellWindow(), - D3DCREATE_SOFTWARE_VERTEXPROCESSING | - D3DCREATE_MULTITHREADED | - D3DCREATE_FPU_PRESERVE, - &present_params, - &p->device); - if (FAILED(hr)) { - MP_ERR(p, "Failed to create Direct3D device: %s\n", - mp_HRESULT_to_str(hr)); - return false; - } - return true; -} - -static void dxva2_uninit(struct lavc_ctx *s) -{ - struct priv *p = s->hwdec_priv; - if (!p) - return; - - av_freep(&s->avctx->hwaccel_context); - talloc_free(p->decoder_pool); - - if (p->decoder_service) - IDirectXVideoDecoderService_Release(p->decoder_service); - - if (p->device_manager && p->device_handle != INVALID_HANDLE_VALUE) - IDirect3DDeviceManager9_CloseDeviceHandle(p->device_manager, p->device_handle); - - if (p->device_manager) - IDirect3DDeviceManager9_Release(p->device_manager); - - destroy_device(s); - - TA_FREEP(&s->hwdec_priv); -} - -static int dxva2_init(struct lavc_ctx *s) -{ - HRESULT hr; - struct priv *p = talloc_zero(NULL, struct priv); - if (!p) - return -1; - - s->hwdec_priv = p; - p->device_handle = INVALID_HANDLE_VALUE; - p->log = mp_log_new(s, s->log, "dxva2"); - - if (s->hwdec->type == HWDEC_DXVA2_COPY) { - mp_check_gpu_memcpy(p->log, NULL); - p->sw_pool = talloc_steal(p, mp_image_pool_new(17)); - } - - p->device = hwdec_devices_load(s->hwdec_devs, s->hwdec->type); - if (p->device) { - IDirect3D9_AddRef(p->device); - MP_VERBOSE(p, "Using VO-supplied device %p.\n", p->device); - } else if (s->hwdec->type == HWDEC_DXVA2) { - MP_ERR(p, "No Direct3D device provided for native dxva2 decoding\n"); - goto fail; - } else { - if (!create_device(s)) - goto fail; - } - - d3d_load_dlls(); - if (!dxva2_dll) { - MP_ERR(p, "Failed to load DXVA2 library\n"); - goto fail; - } - - HRESULT (WINAPI *CreateDeviceManager9)(UINT *, IDirect3DDeviceManager9 **) = - (void *)GetProcAddress(dxva2_dll, "DXVA2CreateDirect3DDeviceManager9"); - if (!CreateDeviceManager9) { - MP_ERR(p, "Failed to locate DXVA2CreateDirect3DDeviceManager9\n"); - goto fail; - } - - unsigned reset_token = 0; - hr = CreateDeviceManager9(&reset_token, &p->device_manager); - if (FAILED(hr)) { - MP_ERR(p, "Failed to create Direct3D device manager: %s\n", - mp_HRESULT_to_str(hr)); - goto fail; - } - - hr = IDirect3DDeviceManager9_ResetDevice(p->device_manager, - p->device, reset_token); - if (FAILED(hr)) { - MP_ERR(p, "Failed to bind Direct3D device to device manager: %s\n", - mp_HRESULT_to_str(hr)); - goto fail; - } - - hr = IDirect3DDeviceManager9_OpenDeviceHandle(p->device_manager, - &p->device_handle); - if (FAILED(hr)) { - MP_ERR(p, "Failed to open device handle: %s\n", - mp_HRESULT_to_str(hr)); - goto fail; - } - - hr = IDirect3DDeviceManager9_GetVideoService( - p->device_manager, p->device_handle, &IID_IDirectXVideoDecoderService, - (void **)&p->decoder_service); - if (FAILED(hr)) { - MP_ERR(p, "Failed to create IDirectXVideoDecoderService: %s\n", - mp_HRESULT_to_str(hr)); - goto fail; - } - - s->avctx->hwaccel_context = av_mallocz(sizeof(struct dxva_context)); - if (!s->avctx->hwaccel_context) - goto fail; - - return 0; -fail: - dxva2_uninit(s); - return -1; -} - -static int dxva2_probe(struct lavc_ctx *ctx, struct vd_lavc_hwdec *hwdec, - const char *codec) -{ - // dxva2-copy can do without external context; dxva2 requires it. - if (hwdec->type == HWDEC_DXVA2) { - if (!hwdec_devices_load(ctx->hwdec_devs, HWDEC_DXVA2)) - return HWDEC_ERR_NO_CTX; - } else { - hwdec_devices_load(ctx->hwdec_devs, HWDEC_DXVA2_COPY); - } - return d3d_probe_codec(codec); -} - -const struct vd_lavc_hwdec mp_vd_lavc_dxva2 = { - .type = HWDEC_DXVA2, - .image_format = IMGFMT_DXVA2, - .probe = dxva2_probe, - .init = dxva2_init, - .uninit = dxva2_uninit, - .init_decoder = dxva2_init_decoder, - .allocate_image = dxva2_allocate_image, -}; - -const struct vd_lavc_hwdec mp_vd_lavc_dxva2_copy = { - .type = HWDEC_DXVA2_COPY, - .copying = true, - .image_format = IMGFMT_DXVA2, - .probe = dxva2_probe, - .init = dxva2_init, - .uninit = dxva2_uninit, - .init_decoder = dxva2_init_decoder, - .allocate_image = dxva2_allocate_image, - .process_image = dxva2_retrieve_image, - .delay_queue = HWDEC_DELAY_QUEUE_COUNT, -}; diff --git a/video/decode/hw_cuda.c b/video/decode/hw_cuda.c new file mode 100644 index 0000000000..92ba0772c4 --- /dev/null +++ b/video/decode/hw_cuda.c @@ -0,0 +1,104 @@ +/* + * This file is part of mpv. + * + * Copyright (c) 2016 Philip Langdale + * + * mpv is free software; you can redistribute it and/or + * modify it under the terms of the GNU Lesser General Public + * License as published by the Free Software Foundation; either + * version 2.1 of the License, or (at your option) any later version. + * + * mpv is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + * GNU Lesser General Public License for more details. + * + * You should have received a copy of the GNU Lesser General Public + * License along with mpv. If not, see . + */ + +// This define and typedef prevent hwcontext_cuda.h trying to include cuda.h +#define CUDA_VERSION 7050 +typedef void * CUcontext; + +#include +#include + +#include "common/av_common.h" +#include "video/fmt-conversion.h" +#include "video/decode/lavc.h" + +static int probe(struct lavc_ctx *ctx, struct vd_lavc_hwdec *hwdec, + const char *codec) +{ + if (!hwdec_devices_load(ctx->hwdec_devs, HWDEC_CUDA)) + return HWDEC_ERR_NO_CTX; + return 0; +} + +static int init(struct lavc_ctx *ctx) +{ + ctx->hwdec_priv = hwdec_devices_get(ctx->hwdec_devs, HWDEC_CUDA); + return 0; +} + +static int init_decoder(struct lavc_ctx *ctx, int w, int h) +{ + AVCodecContext *avctx = ctx->avctx; + struct mp_hwdec_ctx *hwctx = ctx->hwdec_priv; + + if (avctx->hw_frames_ctx) { + MP_ERR(ctx, "hw_frames_ctx already initialised!\n"); + return -1; + } + + avctx->hw_frames_ctx = av_hwframe_ctx_alloc(hwctx->av_device_ref); + if (!avctx->hw_frames_ctx) { + MP_ERR(ctx, "av_hwframe_ctx_alloc failed\n"); + goto error; + } + + AVHWFramesContext *hwframe_ctx = (void* )avctx->hw_frames_ctx->data; + hwframe_ctx->format = AV_PIX_FMT_CUDA; + + // This is proper use of the hw_frames_ctx API, but it does not work + // (appaears to work but fails e.g. with 10 bit). The cuvid wrapper + // does non-standard things, and it's a meesy situation. + /* + hwframe_ctx->width = w; + hwframe_ctx->height = h; + hwframe_ctx->sw_format = avctx->sw_pix_fmt; + + if (av_hwframe_ctx_init(avctx->hw_frames_ctx) < 0) + goto error; + */ + + return 0; + + error: + av_buffer_unref(&avctx->hw_frames_ctx); + return -1; +} + +static void uninit(struct lavc_ctx *ctx) +{ + ctx->hwdec_priv = NULL; +} + +static struct mp_image *process_image(struct lavc_ctx *ctx, struct mp_image *img) +{ + if (img->imgfmt == IMGFMT_CUDA) + img->params.hw_subfmt = pixfmt2imgfmt(ctx->avctx->sw_pix_fmt); + return img; +} + +const struct vd_lavc_hwdec mp_vd_lavc_cuda = { + .type = HWDEC_CUDA, + .image_format = IMGFMT_CUDA, + .lavc_suffix = "_cuvid", + .probe = probe, + .init = init, + .uninit = uninit, + .init_decoder = init_decoder, + .process_image = process_image, +}; diff --git a/video/decode/hw_d3d11va.c b/video/decode/hw_d3d11va.c new file mode 100644 index 0000000000..a69a3890bd --- /dev/null +++ b/video/decode/hw_d3d11va.c @@ -0,0 +1,584 @@ +/* + * This file is part of mpv. + * + * mpv is free software; you can redistribute it and/or + * modify it under the terms of the GNU Lesser General Public + * License as published by the Free Software Foundation; either + * version 2.1 of the License, or (at your option) any later version. + * + * mpv is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + * GNU Lesser General Public License for more details. + * + * You should have received a copy of the GNU Lesser General Public + * License along with mpv. If not, see . + */ + +#include + +#include "lavc.h" +#include "common/common.h" +#include "common/av_common.h" +#include "osdep/windows_utils.h" +#include "video/fmt-conversion.h" +#include "video/mp_image_pool.h" +#include "video/hwdec.h" + +#include "d3d.h" + +#define ADDITIONAL_SURFACES (HWDEC_EXTRA_SURFACES + HWDEC_DELAY_QUEUE_COUNT) + +struct d3d11va_decoder { + ID3D11VideoDecoder *decoder; + struct mp_image_pool *pool; + ID3D11Texture2D *staging; + int mpfmt_decoded; +}; + +struct priv { + struct mp_log *log; + + ID3D11Device *device; + ID3D11DeviceContext *device_ctx; + ID3D11VideoDevice *video_dev; + ID3D11VideoContext *video_ctx; + + struct d3d11va_decoder *decoder; + struct mp_image_pool *sw_pool; +}; + +struct d3d11va_surface { + ID3D11Texture2D *texture; + ID3D11VideoDecoderOutputView *surface; +}; + +static void d3d11va_release_img(void *arg) +{ + struct d3d11va_surface *surface = arg; + if (surface->surface) + ID3D11VideoDecoderOutputView_Release(surface->surface); + + if (surface->texture) + ID3D11Texture2D_Release(surface->texture); + + talloc_free(surface); +} + +static struct mp_image *d3d11va_new_ref(ID3D11VideoDecoderOutputView *view, + int w, int h) +{ + if (!view) + return NULL; + struct d3d11va_surface *surface = talloc_zero(NULL, struct d3d11va_surface); + + surface->surface = view; + ID3D11VideoDecoderOutputView_AddRef(surface->surface); + ID3D11VideoDecoderOutputView_GetResource( + surface->surface, (ID3D11Resource **)&surface->texture); + + D3D11_VIDEO_DECODER_OUTPUT_VIEW_DESC surface_desc; + ID3D11VideoDecoderOutputView_GetDesc(surface->surface, &surface_desc); + + struct mp_image *mpi = + mp_image_new_custom_ref(NULL, surface, d3d11va_release_img); + if (!mpi) + abort(); + + mp_image_setfmt(mpi, IMGFMT_D3D11VA); + mp_image_set_size(mpi, w, h); + mpi->planes[0] = NULL; + mpi->planes[1] = (void *)surface->texture; + mpi->planes[2] = (void *)(intptr_t)surface_desc.Texture2D.ArraySlice; + mpi->planes[3] = (void *)surface->surface; + + return mpi; +} + +static struct mp_image *d3d11va_allocate_image(struct lavc_ctx *s, int w, int h) +{ + struct priv *p = s->hwdec_priv; + struct mp_image *img = mp_image_pool_get_no_alloc(p->decoder->pool, + IMGFMT_D3D11VA, w, h); + if (!img) + MP_ERR(p, "Failed to get free D3D11VA surface\n"); + return img; +} + +static struct mp_image *d3d11va_retrieve_image(struct lavc_ctx *s, + struct mp_image *img) +{ + HRESULT hr; + struct priv *p = s->hwdec_priv; + ID3D11Texture2D *staging = p->decoder->staging; + + if (img->imgfmt != IMGFMT_D3D11VA) + return img; + + ID3D11Texture2D *texture = (void *)img->planes[1]; + int subindex = (intptr_t)img->planes[2]; + + if (!texture) { + MP_ERR(p, "Failed to get Direct3D texture and surface from mp_image\n"); + return img; + } + + D3D11_TEXTURE2D_DESC texture_desc; + ID3D11Texture2D_GetDesc(texture, &texture_desc); + if (texture_desc.Width < img->w || texture_desc.Height < img->h) { + MP_ERR(p, "Direct3D11 texture smaller than mp_image dimensions\n"); + return img; + } + + // copy to the staging texture + ID3D11DeviceContext_CopySubresourceRegion( + p->device_ctx, + (ID3D11Resource *)staging, 0, 0, 0, 0, + (ID3D11Resource *)texture, subindex, NULL); + + struct mp_image *sw_img = mp_image_pool_get(p->sw_pool, + p->decoder->mpfmt_decoded, + texture_desc.Width, + texture_desc.Height); + if (!sw_img) { + MP_ERR(p, "Failed to get %s surface from CPU pool\n", + mp_imgfmt_to_name(p->decoder->mpfmt_decoded)); + return img; + } + + // copy staging texture to the cpu mp_image + D3D11_MAPPED_SUBRESOURCE lock; + hr = ID3D11DeviceContext_Map(p->device_ctx, (ID3D11Resource *)staging, + 0, D3D11_MAP_READ, 0, &lock); + if (FAILED(hr)) { + MP_ERR(p, "Failed to map D3D11 surface: %s\n", mp_HRESULT_to_str(hr)); + talloc_free(sw_img); + return img; + } + copy_nv12(sw_img, lock.pData, lock.RowPitch, texture_desc.Height); + ID3D11DeviceContext_Unmap(p->device_ctx, (ID3D11Resource *)staging, 0); + + mp_image_set_size(sw_img, img->w, img->h); + mp_image_copy_attributes(sw_img, img); + talloc_free(img); + return sw_img; +} + +#define DFMT(name) MP_CONCAT(DXGI_FORMAT_, name), # name +static const struct d3d_decoded_format d3d11_formats[] = { + {DFMT(NV12), 8, IMGFMT_NV12}, + {DFMT(P010), 10, IMGFMT_P010}, + {DFMT(P016), 16, IMGFMT_P010}, +}; +#undef DFMT + +// Update hw_subfmt to the underlying format. Needed because AVFrame does not +// have such an attribute, so it can't be passed through, and is updated here +// instead. (But in the future, AVHWFramesContext could be used.) +static struct mp_image *d3d11va_update_image_attribs(struct lavc_ctx *s, + struct mp_image *img) +{ + ID3D11Texture2D *texture = (void *)img->planes[1]; + + if (!texture) + return img; + + D3D11_TEXTURE2D_DESC texture_desc; + ID3D11Texture2D_GetDesc(texture, &texture_desc); + for (int n = 0; n < MP_ARRAY_SIZE(d3d11_formats); n++) { + if (d3d11_formats[n].dxfmt == texture_desc.Format) { + img->params.hw_subfmt = d3d11_formats[n].mpfmt; + break; + } + } + + if (img->params.hw_subfmt == IMGFMT_NV12) + mp_image_setfmt(img, IMGFMT_D3D11NV12); + + return img; +} + +static bool d3d11_format_supported(struct lavc_ctx *s, const GUID *guid, + const struct d3d_decoded_format *format) +{ + struct priv *p = s->hwdec_priv; + BOOL is_supported = FALSE; + HRESULT hr = ID3D11VideoDevice_CheckVideoDecoderFormat( + p->video_dev, guid, format->dxfmt, &is_supported); + if (FAILED(hr)) { + MP_ERR(p, "Check decoder output format %s for decoder %s: %s\n", + format->name, d3d_decoder_guid_to_desc(guid), + mp_HRESULT_to_str(hr)); + } + return is_supported; +} + +static void dump_decoder_info(struct lavc_ctx *s, const GUID *guid) +{ + struct priv *p = s->hwdec_priv; + char fmts[256] = {0}; + for (int i = 0; i < MP_ARRAY_SIZE(d3d11_formats); i++) { + const struct d3d_decoded_format *format = &d3d11_formats[i]; + if (d3d11_format_supported(s, guid, format)) + mp_snprintf_cat(fmts, sizeof(fmts), " %s", format->name); + } + MP_VERBOSE(p, "%s %s\n", d3d_decoder_guid_to_desc(guid), fmts); +} + +static void d3d11va_destroy_decoder(void *arg) +{ + struct d3d11va_decoder *decoder = arg; + + if (decoder->decoder) + ID3D11VideoDecoder_Release(decoder->decoder); + + if (decoder->staging) + ID3D11Texture2D_Release(decoder->staging); +} + +static int d3d11va_init_decoder(struct lavc_ctx *s, int w, int h) +{ + HRESULT hr; + int ret = -1; + struct priv *p = s->hwdec_priv; + TA_FREEP(&p->decoder); + + ID3D11Texture2D *texture = NULL; + void *tmp = talloc_new(NULL); + + UINT n_guids = ID3D11VideoDevice_GetVideoDecoderProfileCount(p->video_dev); + GUID *device_guids = talloc_array(tmp, GUID, n_guids); + for (UINT i = 0; i < n_guids; i++) { + GUID *guid = &device_guids[i]; + hr = ID3D11VideoDevice_GetVideoDecoderProfile(p->video_dev, i, guid); + if (FAILED(hr)) { + MP_ERR(p, "Failed to get VideoDecoderProfile %d: %s\n", + i, mp_HRESULT_to_str(hr)); + goto done; + } + dump_decoder_info(s, guid); + } + + struct d3d_decoder_fmt fmt = + d3d_select_decoder_mode(s, device_guids, n_guids, + d3d11_formats, MP_ARRAY_SIZE(d3d11_formats), + d3d11_format_supported); + if (!fmt.format) { + MP_ERR(p, "Failed to find a suitable decoder\n"); + goto done; + } + + struct d3d11va_decoder *decoder = talloc_zero(tmp, struct d3d11va_decoder); + talloc_set_destructor(decoder, d3d11va_destroy_decoder); + decoder->mpfmt_decoded = fmt.format->mpfmt; + + int n_surfaces = hwdec_get_max_refs(s) + ADDITIONAL_SURFACES; + int w_align = w, h_align = h; + d3d_surface_align(s, &w_align, &h_align); + + D3D11_TEXTURE2D_DESC tex_desc = { + .Width = w_align, + .Height = h_align, + .MipLevels = 1, + .Format = fmt.format->dxfmt, + .SampleDesc.Count = 1, + .MiscFlags = 0, + .ArraySize = n_surfaces, + .Usage = D3D11_USAGE_DEFAULT, + .BindFlags = D3D11_BIND_DECODER | D3D11_BIND_SHADER_RESOURCE, + .CPUAccessFlags = 0, + }; + hr = ID3D11Device_CreateTexture2D(p->device, &tex_desc, NULL, &texture); + if (FAILED(hr)) { + MP_ERR(p, "Failed to create Direct3D11 texture with %d surfaces: %s\n", + n_surfaces, mp_HRESULT_to_str(hr)); + goto done; + } + + if (s->hwdec->type == HWDEC_D3D11VA_COPY) { + // create staging texture shared with the CPU with mostly the same + // parameters as the above decoder-bound texture + ID3D11Texture2D_GetDesc(texture, &tex_desc); + tex_desc.MipLevels = 1; + tex_desc.MiscFlags = 0; + tex_desc.ArraySize = 1; + tex_desc.Usage = D3D11_USAGE_STAGING; + tex_desc.CPUAccessFlags = D3D11_CPU_ACCESS_READ; + tex_desc.BindFlags = 0; + hr = ID3D11Device_CreateTexture2D(p->device, &tex_desc, NULL, + &decoder->staging); + if (FAILED(hr)) { + MP_ERR(p, "Failed to create staging texture: %s\n", + mp_HRESULT_to_str(hr)); + goto done; + } + } + + // pool to hold the mp_image wrapped surfaces + decoder->pool = talloc_steal(decoder, mp_image_pool_new(n_surfaces)); + // array of the same surfaces (needed by ffmpeg) + ID3D11VideoDecoderOutputView **surfaces = + talloc_array_ptrtype(decoder->pool, surfaces, n_surfaces); + + D3D11_VIDEO_DECODER_OUTPUT_VIEW_DESC view_desc = { + .DecodeProfile = *fmt.guid, + .ViewDimension = D3D11_VDOV_DIMENSION_TEXTURE2D, + }; + for (int i = 0; i < n_surfaces; i++) { + ID3D11VideoDecoderOutputView **surface = &surfaces[i]; + view_desc.Texture2D.ArraySlice = i; + hr = ID3D11VideoDevice_CreateVideoDecoderOutputView( + p->video_dev, (ID3D11Resource *)texture, &view_desc, surface); + if (FAILED(hr)) { + MP_ERR(p, "Failed getting decoder output view %d: %s\n", + i, mp_HRESULT_to_str(hr)); + goto done; + } + struct mp_image *img = d3d11va_new_ref(*surface, w, h); + ID3D11VideoDecoderOutputView_Release(*surface); // transferred to img + if (!img) { + MP_ERR(p, "Failed to create D3D11VA image %d\n", i); + goto done; + } + mp_image_pool_add(decoder->pool, img); // transferred to pool + } + + D3D11_VIDEO_DECODER_DESC decoder_desc = { + .Guid = *fmt.guid, + .SampleWidth = w, + .SampleHeight = h, + .OutputFormat = fmt.format->dxfmt, + }; + UINT n_cfg; + hr = ID3D11VideoDevice_GetVideoDecoderConfigCount(p->video_dev, + &decoder_desc, &n_cfg); + if (FAILED(hr)) { + MP_ERR(p, "Failed to get number of decoder configurations: %s)", + mp_HRESULT_to_str(hr)); + goto done; + } + + // pick the config with the highest score + D3D11_VIDEO_DECODER_CONFIG *decoder_config = + talloc_zero(decoder, D3D11_VIDEO_DECODER_CONFIG); + unsigned max_score = 0; + for (UINT i = 0; i < n_cfg; i++) { + D3D11_VIDEO_DECODER_CONFIG cfg; + hr = ID3D11VideoDevice_GetVideoDecoderConfig(p->video_dev, + &decoder_desc, + i, &cfg); + if (FAILED(hr)) { + MP_ERR(p, "Failed to get decoder config %d: %s\n", + i, mp_HRESULT_to_str(hr)); + goto done; + } + unsigned score = d3d_decoder_config_score( + s, &cfg.guidConfigBitstreamEncryption, cfg.ConfigBitstreamRaw); + if (score > max_score) { + max_score = score; + *decoder_config = cfg; + } + } + if (!max_score) { + MP_ERR(p, "Failed to find a suitable decoder configuration\n"); + goto done; + } + + hr = ID3D11VideoDevice_CreateVideoDecoder(p->video_dev, &decoder_desc, + decoder_config, + &decoder->decoder); + if (FAILED(hr)) { + MP_ERR(p, "Failed to create video decoder: %s\n", + mp_HRESULT_to_str(hr)); + goto done; + } + + struct AVD3D11VAContext *avd3d11va_ctx = s->avctx->hwaccel_context; + avd3d11va_ctx->decoder = decoder->decoder; + avd3d11va_ctx->video_context = p->video_ctx; + avd3d11va_ctx->cfg = decoder_config; + avd3d11va_ctx->surface_count = n_surfaces; + avd3d11va_ctx->surface = surfaces; + avd3d11va_ctx->workaround = is_clearvideo(fmt.guid) ? + FF_DXVA2_WORKAROUND_INTEL_CLEARVIDEO : 0; + + p->decoder = talloc_steal(NULL, decoder); + ret = 0; +done: + // still referenced by pool images / surfaces + if (texture) + ID3D11Texture2D_Release(texture); + + talloc_free(tmp); + return ret; +} + +static void destroy_device(struct lavc_ctx *s) +{ + struct priv *p = s->hwdec_priv; + + if (p->device) + ID3D11Device_Release(p->device); + + if (p->device_ctx) + ID3D11DeviceContext_Release(p->device_ctx); +} + +static bool create_device(struct lavc_ctx *s, BOOL thread_safe) +{ + HRESULT hr; + struct priv *p = s->hwdec_priv; + + if (!d3d11_dll) { + MP_ERR(p, "Failed to load D3D11 library\n"); + return false; + } + + PFN_D3D11_CREATE_DEVICE CreateDevice = + (void *)GetProcAddress(d3d11_dll, "D3D11CreateDevice"); + if (!CreateDevice) { + MP_ERR(p, "Failed to get D3D11CreateDevice symbol from DLL: %s\n", + mp_LastError_to_str()); + return false; + } + + hr = CreateDevice(NULL, D3D_DRIVER_TYPE_HARDWARE, NULL, + D3D11_CREATE_DEVICE_VIDEO_SUPPORT, NULL, 0, + D3D11_SDK_VERSION, &p->device, NULL, &p->device_ctx); + if (FAILED(hr)) { + MP_ERR(p, "Failed to create D3D11 Device: %s\n", + mp_HRESULT_to_str(hr)); + return false; + } + + ID3D10Multithread *multithread; + hr = ID3D11Device_QueryInterface(p->device, &IID_ID3D10Multithread, + (void **)&multithread); + if (FAILED(hr)) { + MP_ERR(p, "Failed to get Multithread interface: %s\n", + mp_HRESULT_to_str(hr)); + return false; + } + ID3D10Multithread_SetMultithreadProtected(multithread, thread_safe); + ID3D10Multithread_Release(multithread); + return true; +} + +static void d3d11va_uninit(struct lavc_ctx *s) +{ + struct priv *p = s->hwdec_priv; + if (!p) + return; + + talloc_free(p->decoder); + av_freep(&s->avctx->hwaccel_context); + + if (p->video_dev) + ID3D11VideoDevice_Release(p->video_dev); + + if (p->video_ctx) + ID3D11VideoContext_Release(p->video_ctx); + + destroy_device(s); + + TA_FREEP(&s->hwdec_priv); +} + +static int d3d11va_init(struct lavc_ctx *s) +{ + HRESULT hr; + struct priv *p = talloc_zero(NULL, struct priv); + if (!p) + return -1; + + // Unconditionally load Direct3D DLLs, even when using a VO-supplied D3D11 + // device. This prevents a crash that occurs at least with NVIDIA drivers, + // where D3D objects are accessed after ANGLE unloads d3d11.dll. + d3d_load_dlls(); + + s->hwdec_priv = p; + p->log = mp_log_new(s, s->log, "d3d11va"); + if (s->hwdec->type == HWDEC_D3D11VA_COPY) { + mp_check_gpu_memcpy(p->log, NULL); + p->sw_pool = talloc_steal(p, mp_image_pool_new(17)); + } + + p->device = hwdec_devices_load(s->hwdec_devs, s->hwdec->type); + if (p->device) { + ID3D11Device_AddRef(p->device); + ID3D11Device_GetImmediateContext(p->device, &p->device_ctx); + if (!p->device_ctx) + goto fail; + MP_VERBOSE(p, "Using VO-supplied device %p.\n", p->device); + } else if (s->hwdec->type == HWDEC_D3D11VA) { + MP_ERR(p, "