mirror of
https://github.com/mpv-player/mpv
synced 2025-01-09 00:19:32 +00:00
a02d77ba0d
For some reason, the d3d9/dxva2/d3d11 DLLs are still optional. But we don't need to try so hard to keep exact references. In fact, there's no reason to unload them at all. So load them once in a central place. For simplicity, the d3d9/d3d11 backends both load all DLLs. (They will error out only if the required DLLs could not be loaded.) In theory, we could just call LoadLibrary multiple times (without calling FreeLibrary), but I'm slightly worried that this could be detected as a "bug", or that the reference count could even have a low static limit that could be hit soon.
548 lines
17 KiB
C
548 lines
17 KiB
C
/*
|
|
* Ported from FFmpeg ffmpeg_dxva2.c (2dbee1a3935a91842c22eb65fd13f77e8d590e07).
|
|
* Original copyright header follows:
|
|
*
|
|
* This file is part of FFmpeg.
|
|
*
|
|
* FFmpeg is free software; you can redistribute it and/or
|
|
* modify it under the terms of the GNU Lesser General Public
|
|
* License as published by the Free Software Foundation; either
|
|
* version 2.1 of the License, or (at your option) any later version.
|
|
*
|
|
* FFmpeg is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
* Lesser General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU Lesser General Public
|
|
* License along with FFmpeg; if not, write to the Free Software
|
|
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
|
|
*/
|
|
|
|
#include <initguid.h>
|
|
|
|
#define DXVA2API_USE_BITFIELDS
|
|
#include <libavcodec/dxva2.h>
|
|
|
|
#include "lavc.h"
|
|
#include "common/common.h"
|
|
#include "common/av_common.h"
|
|
#include "osdep/windows_utils.h"
|
|
#include "video/fmt-conversion.h"
|
|
#include "video/mp_image_pool.h"
|
|
#include "video/hwdec.h"
|
|
|
|
#include "d3d.h"
|
|
|
|
#define ADDITIONAL_SURFACES (4 + HWDEC_DELAY_QUEUE_COUNT)
|
|
|
|
struct priv {
|
|
struct mp_log *log;
|
|
|
|
IDirect3D9 *d3d9;
|
|
IDirect3DDevice9 *device;
|
|
HANDLE device_handle;
|
|
IDirect3DDeviceManager9 *device_manager;
|
|
IDirectXVideoDecoderService *decoder_service;
|
|
|
|
struct mp_image_pool *decoder_pool;
|
|
struct mp_image_pool *sw_pool;
|
|
int mpfmt_decoded;
|
|
};
|
|
|
|
struct dxva2_surface {
|
|
IDirectXVideoDecoder *decoder;
|
|
IDirect3DSurface9 *surface;
|
|
};
|
|
|
|
static void dxva2_release_img(void *arg)
|
|
{
|
|
struct dxva2_surface *surface = arg;
|
|
if (surface->surface)
|
|
IDirect3DSurface9_Release(surface->surface);
|
|
|
|
if (surface->decoder)
|
|
IDirectXVideoDecoder_Release(surface->decoder);
|
|
|
|
talloc_free(surface);
|
|
}
|
|
|
|
static struct mp_image *dxva2_new_ref(IDirectXVideoDecoder *decoder,
|
|
IDirect3DSurface9 *d3d9_surface,
|
|
int w, int h)
|
|
{
|
|
if (!decoder || !d3d9_surface)
|
|
return NULL;
|
|
struct dxva2_surface *surface = talloc_zero(NULL, struct dxva2_surface);
|
|
|
|
surface->surface = d3d9_surface;
|
|
IDirect3DSurface9_AddRef(surface->surface);
|
|
surface->decoder = decoder;
|
|
IDirectXVideoDecoder_AddRef(surface->decoder);
|
|
|
|
struct mp_image *mpi =
|
|
mp_image_new_custom_ref(NULL, surface, dxva2_release_img);
|
|
if (!mpi)
|
|
abort();
|
|
|
|
mp_image_setfmt(mpi, IMGFMT_DXVA2);
|
|
mp_image_set_size(mpi, w, h);
|
|
mpi->planes[3] = (void *)surface->surface;
|
|
return mpi;
|
|
fail:
|
|
dxva2_release_img(surface);
|
|
return NULL;
|
|
}
|
|
|
|
static struct mp_image *dxva2_allocate_image(struct lavc_ctx *s, int w, int h)
|
|
{
|
|
struct priv *p = s->hwdec_priv;
|
|
struct mp_image *img = mp_image_pool_get_no_alloc(p->decoder_pool,
|
|
IMGFMT_DXVA2, w, h);
|
|
if (!img)
|
|
MP_ERR(p, "Failed to allocate additional DXVA2 surface.\n");
|
|
return img;
|
|
}
|
|
|
|
static struct mp_image *dxva2_retrieve_image(struct lavc_ctx *s,
|
|
struct mp_image *img)
|
|
{
|
|
HRESULT hr;
|
|
struct priv *p = s->hwdec_priv;
|
|
IDirect3DSurface9 *surface = img->imgfmt == IMGFMT_DXVA2 ?
|
|
(IDirect3DSurface9 *)img->planes[3] : NULL;
|
|
|
|
if (!surface) {
|
|
MP_ERR(p, "Failed to get Direct3D surface from mp_image\n");
|
|
return img;
|
|
}
|
|
|
|
D3DSURFACE_DESC surface_desc;
|
|
IDirect3DSurface9_GetDesc(surface, &surface_desc);
|
|
if (surface_desc.Width < img->w || surface_desc.Height < img->h) {
|
|
MP_ERR(p, "Direct3D11 texture smaller than mp_image dimensions\n");
|
|
return img;
|
|
}
|
|
|
|
struct mp_image *sw_img = mp_image_pool_get(p->sw_pool,
|
|
p->mpfmt_decoded,
|
|
surface_desc.Width,
|
|
surface_desc.Height);
|
|
if (!sw_img) {
|
|
MP_ERR(p, "Failed to get %s surface from CPU pool\n",
|
|
mp_imgfmt_to_name(p->mpfmt_decoded));
|
|
return img;
|
|
}
|
|
|
|
D3DLOCKED_RECT lock;
|
|
hr = IDirect3DSurface9_LockRect(surface, &lock, NULL, D3DLOCK_READONLY);
|
|
if (FAILED(hr)) {
|
|
MP_ERR(p, "Unable to lock DXVA2 surface: %s\n",
|
|
mp_HRESULT_to_str(hr));
|
|
talloc_free(sw_img);
|
|
return img;
|
|
}
|
|
copy_nv12(sw_img, lock.pBits, lock.Pitch, surface_desc.Height);
|
|
IDirect3DSurface9_UnlockRect(surface);
|
|
|
|
mp_image_set_size(sw_img, img->w, img->h);
|
|
mp_image_copy_attributes(sw_img, img);
|
|
talloc_free(img);
|
|
return sw_img;
|
|
}
|
|
|
|
static const struct d3d_decoded_format d3d9_formats[] = {
|
|
{MKTAG('N','V','1','2'), "NV12", 8, IMGFMT_NV12},
|
|
{MKTAG('P','0','1','0'), "P010", 10, IMGFMT_P010},
|
|
{MKTAG('P','0','1','6'), "P016", 16, IMGFMT_P010},
|
|
};
|
|
|
|
static void dump_decoder_info(struct lavc_ctx *s,
|
|
GUID *device_guids, UINT n_guids)
|
|
{
|
|
struct priv *p = s->hwdec_priv;
|
|
MP_VERBOSE(p, "%u decoder devices:\n", (unsigned)n_guids);
|
|
for (UINT i = 0; i < n_guids; i++) {
|
|
GUID *guid = &device_guids[i];
|
|
char *description = d3d_decoder_guid_to_desc(guid);
|
|
|
|
D3DFORMAT *formats = NULL;
|
|
UINT n_formats = 0;
|
|
HRESULT hr = IDirectXVideoDecoderService_GetDecoderRenderTargets(
|
|
p->decoder_service, guid, &n_formats, &formats);
|
|
if (FAILED(hr)) {
|
|
MP_ERR(p, "Failed to get render targets for decoder %s:%s\n",
|
|
description, mp_HRESULT_to_str(hr));
|
|
}
|
|
|
|
char fmts[256] = {0};
|
|
for (UINT j = 0; j < n_formats; j++) {
|
|
mp_snprintf_cat(fmts, sizeof(fmts),
|
|
" %s", mp_tag_str(formats[j]));
|
|
}
|
|
CoTaskMemFree(formats);
|
|
|
|
MP_VERBOSE(p, "%s %s\n", description, fmts);
|
|
}
|
|
}
|
|
|
|
static bool dxva2_format_supported(struct lavc_ctx *s, const GUID *guid,
|
|
const struct d3d_decoded_format *format)
|
|
{
|
|
bool ret = false;
|
|
struct priv *p = s->hwdec_priv;
|
|
D3DFORMAT *formats = NULL;
|
|
UINT n_formats = 0;
|
|
HRESULT hr = IDirectXVideoDecoderService_GetDecoderRenderTargets(
|
|
p->decoder_service, guid, &n_formats, &formats);
|
|
if (FAILED(hr)) {
|
|
MP_ERR(p, "Callback failed to get render targets for decoder %s: %s",
|
|
d3d_decoder_guid_to_desc(guid), mp_HRESULT_to_str(hr));
|
|
return 0;
|
|
}
|
|
|
|
for (int i = 0; i < n_formats; i++) {
|
|
ret = formats[i] == format->dxfmt;
|
|
if (ret)
|
|
break;
|
|
}
|
|
|
|
CoTaskMemFree(formats);
|
|
return ret;
|
|
}
|
|
|
|
static int dxva2_init_decoder(struct lavc_ctx *s, int w, int h)
|
|
{
|
|
HRESULT hr;
|
|
int ret = -1;
|
|
struct priv *p = s->hwdec_priv;
|
|
TA_FREEP(&p->decoder_pool);
|
|
|
|
int n_surfaces = hwdec_get_max_refs(s) + ADDITIONAL_SURFACES;
|
|
IDirect3DSurface9 **surfaces = NULL;
|
|
IDirectXVideoDecoder *decoder = NULL;
|
|
void *tmp = talloc_new(NULL);
|
|
|
|
UINT n_guids;
|
|
GUID *device_guids;
|
|
hr = IDirectXVideoDecoderService_GetDecoderDeviceGuids(
|
|
p->decoder_service, &n_guids, &device_guids);
|
|
if (FAILED(hr)) {
|
|
MP_ERR(p, "Failed to retrieve decoder device GUIDs: %s\n",
|
|
mp_HRESULT_to_str(hr));
|
|
goto done;
|
|
}
|
|
|
|
dump_decoder_info(s, device_guids, n_guids);
|
|
|
|
struct d3d_decoder_fmt fmt =
|
|
d3d_select_decoder_mode(s, device_guids, n_guids,
|
|
d3d9_formats, MP_ARRAY_SIZE(d3d9_formats),
|
|
dxva2_format_supported);
|
|
CoTaskMemFree(device_guids);
|
|
if (!fmt.format) {
|
|
MP_ERR(p, "Failed to find a suitable decoder\n");
|
|
goto done;
|
|
}
|
|
|
|
p->mpfmt_decoded = fmt.format->mpfmt;
|
|
struct mp_image_pool *decoder_pool =
|
|
talloc_steal(tmp, mp_image_pool_new(n_surfaces));
|
|
DXVA2_ConfigPictureDecode *decoder_config =
|
|
talloc_zero(decoder_pool, DXVA2_ConfigPictureDecode);
|
|
|
|
int w_align = w, h_align = h;
|
|
d3d_surface_align(s, &w_align, &h_align);
|
|
DXVA2_VideoDesc video_desc ={
|
|
.SampleWidth = w,
|
|
.SampleHeight = h,
|
|
.Format = fmt.format->dxfmt,
|
|
};
|
|
UINT n_configs = 0;
|
|
DXVA2_ConfigPictureDecode *configs = NULL;
|
|
hr = IDirectXVideoDecoderService_GetDecoderConfigurations(
|
|
p->decoder_service, fmt.guid, &video_desc, NULL,
|
|
&n_configs, &configs);
|
|
if (FAILED(hr)) {
|
|
MP_ERR(p, "Unable to retrieve decoder configurations: %s\n",
|
|
mp_HRESULT_to_str(hr));
|
|
goto done;
|
|
}
|
|
|
|
unsigned max_score = 0;
|
|
for (UINT i = 0; i < n_configs; i++) {
|
|
unsigned score = d3d_decoder_config_score(
|
|
s, &configs[i].guidConfigBitstreamEncryption,
|
|
configs[i].ConfigBitstreamRaw);
|
|
if (score > max_score) {
|
|
max_score = score;
|
|
*decoder_config = configs[i];
|
|
}
|
|
}
|
|
CoTaskMemFree(configs);
|
|
if (!max_score) {
|
|
MP_ERR(p, "Failed to find a suitable decoder configuration\n");
|
|
goto done;
|
|
}
|
|
|
|
surfaces = talloc_zero_array(decoder_pool, IDirect3DSurface9*, n_surfaces);
|
|
hr = IDirectXVideoDecoderService_CreateSurface(
|
|
p->decoder_service,
|
|
w_align, h_align,
|
|
n_surfaces - 1, fmt.format->dxfmt, D3DPOOL_DEFAULT, 0,
|
|
DXVA2_VideoDecoderRenderTarget, surfaces, NULL);
|
|
if (FAILED(hr)) {
|
|
MP_ERR(p, "Failed to create %d video surfaces: %s\n",
|
|
n_surfaces, mp_HRESULT_to_str(hr));
|
|
goto done;
|
|
}
|
|
|
|
hr = IDirectXVideoDecoderService_CreateVideoDecoder(
|
|
p->decoder_service, fmt.guid, &video_desc, decoder_config,
|
|
surfaces, n_surfaces, &decoder);
|
|
if (FAILED(hr)) {
|
|
MP_ERR(p, "Failed to create DXVA2 video decoder: %s\n",
|
|
mp_HRESULT_to_str(hr));
|
|
goto done;
|
|
}
|
|
|
|
for (int i = 0; i < n_surfaces; i++) {
|
|
struct mp_image *img = dxva2_new_ref(decoder, surfaces[i], w, h);
|
|
if (!img) {
|
|
MP_ERR(p, "Failed to create DXVA2 image\n");
|
|
goto done;
|
|
}
|
|
mp_image_pool_add(decoder_pool, img); // transferred to pool
|
|
}
|
|
|
|
// Pass required information on to ffmpeg.
|
|
struct dxva_context *dxva_ctx = s->avctx->hwaccel_context;
|
|
dxva_ctx->cfg = decoder_config;
|
|
dxva_ctx->decoder = decoder;
|
|
dxva_ctx->surface_count = n_surfaces;
|
|
dxva_ctx->surface = surfaces;
|
|
dxva_ctx->workaround = is_clearvideo(fmt.guid) ?
|
|
FF_DXVA2_WORKAROUND_INTEL_CLEARVIDEO : 0;
|
|
|
|
p->decoder_pool = talloc_steal(NULL, decoder_pool);
|
|
ret = 0;
|
|
done:
|
|
// On success, `p->decoder_pool` mp_images still hold refs to `surfaces` and
|
|
// `decoder`, so the pointers in the ffmpeg `dxva_context` strcture remain
|
|
// valid for the lifetime of the pool.
|
|
if (surfaces) {
|
|
for (int i = 0; i < n_surfaces; i++)
|
|
IDirect3DSurface9_Release(surfaces[i]);
|
|
}
|
|
if (decoder)
|
|
IDirectXVideoDecoder_Release(decoder);
|
|
|
|
talloc_free(tmp);
|
|
return ret;
|
|
}
|
|
|
|
static void destroy_device(struct lavc_ctx *s)
|
|
{
|
|
struct priv *p = s->hwdec_priv;
|
|
|
|
if (p->device)
|
|
IDirect3DDevice9_Release(p->device);
|
|
|
|
if (p->d3d9)
|
|
IDirect3D9_Release(p->d3d9);
|
|
}
|
|
|
|
static bool create_device(struct lavc_ctx *s)
|
|
{
|
|
struct priv *p = s->hwdec_priv;
|
|
|
|
d3d_load_dlls();
|
|
if (!d3d9_dll) {
|
|
MP_ERR(p, "Failed to load D3D9 library\n");
|
|
return false;
|
|
}
|
|
|
|
IDirect3D9* (WINAPI *Direct3DCreate9)(UINT) =
|
|
(void *)GetProcAddress(d3d9_dll, "Direct3DCreate9");
|
|
if (!Direct3DCreate9) {
|
|
MP_ERR(p, "Failed to locate Direct3DCreate9\n");
|
|
return false;
|
|
}
|
|
|
|
p->d3d9 = Direct3DCreate9(D3D_SDK_VERSION);
|
|
if (!p->d3d9) {
|
|
MP_ERR(p, "Failed to create IDirect3D object\n");
|
|
return false;
|
|
}
|
|
|
|
UINT adapter = D3DADAPTER_DEFAULT;
|
|
D3DDISPLAYMODE display_mode;
|
|
IDirect3D9_GetAdapterDisplayMode(p->d3d9, adapter, &display_mode);
|
|
D3DPRESENT_PARAMETERS present_params = {
|
|
.Windowed = TRUE,
|
|
.BackBufferWidth = 640,
|
|
.BackBufferHeight = 480,
|
|
.BackBufferCount = 0,
|
|
.BackBufferFormat = display_mode.Format,
|
|
.SwapEffect = D3DSWAPEFFECT_DISCARD,
|
|
.Flags = D3DPRESENTFLAG_VIDEO,
|
|
};
|
|
HRESULT hr = IDirect3D9_CreateDevice(p->d3d9, adapter,
|
|
D3DDEVTYPE_HAL,
|
|
GetShellWindow(),
|
|
D3DCREATE_SOFTWARE_VERTEXPROCESSING |
|
|
D3DCREATE_MULTITHREADED |
|
|
D3DCREATE_FPU_PRESERVE,
|
|
&present_params,
|
|
&p->device);
|
|
if (FAILED(hr)) {
|
|
MP_ERR(p, "Failed to create Direct3D device: %s\n",
|
|
mp_HRESULT_to_str(hr));
|
|
return false;
|
|
}
|
|
return true;
|
|
}
|
|
|
|
static void dxva2_uninit(struct lavc_ctx *s)
|
|
{
|
|
struct priv *p = s->hwdec_priv;
|
|
if (!p)
|
|
return;
|
|
|
|
av_freep(&s->avctx->hwaccel_context);
|
|
talloc_free(p->decoder_pool);
|
|
|
|
if (p->decoder_service)
|
|
IDirectXVideoDecoderService_Release(p->decoder_service);
|
|
|
|
if (p->device_manager && p->device_handle != INVALID_HANDLE_VALUE)
|
|
IDirect3DDeviceManager9_CloseDeviceHandle(p->device_manager, p->device_handle);
|
|
|
|
if (p->device_manager)
|
|
IDirect3DDeviceManager9_Release(p->device_manager);
|
|
|
|
destroy_device(s);
|
|
|
|
TA_FREEP(&s->hwdec_priv);
|
|
}
|
|
|
|
static int dxva2_init(struct lavc_ctx *s)
|
|
{
|
|
HRESULT hr;
|
|
struct priv *p = talloc_zero(NULL, struct priv);
|
|
if (!p)
|
|
return -1;
|
|
|
|
s->hwdec_priv = p;
|
|
p->device_handle = INVALID_HANDLE_VALUE;
|
|
p->log = mp_log_new(s, s->log, "dxva2");
|
|
|
|
if (s->hwdec->type == HWDEC_DXVA2_COPY) {
|
|
mp_check_gpu_memcpy(p->log, NULL);
|
|
p->sw_pool = talloc_steal(p, mp_image_pool_new(17));
|
|
}
|
|
|
|
p->device = hwdec_devices_load(s->hwdec_devs, s->hwdec->type);
|
|
if (p->device) {
|
|
IDirect3D9_AddRef(p->device);
|
|
MP_VERBOSE(p, "Using VO-supplied device %p.\n", p->device);
|
|
} else if (s->hwdec->type == HWDEC_DXVA2) {
|
|
MP_ERR(p, "No Direct3D device provided for native dxva2 decoding\n");
|
|
goto fail;
|
|
} else {
|
|
if (!create_device(s))
|
|
goto fail;
|
|
}
|
|
|
|
d3d_load_dlls();
|
|
if (!dxva2_dll) {
|
|
MP_ERR(p, "Failed to load DXVA2 library\n");
|
|
goto fail;
|
|
}
|
|
|
|
HRESULT (WINAPI *CreateDeviceManager9)(UINT *, IDirect3DDeviceManager9 **) =
|
|
(void *)GetProcAddress(dxva2_dll, "DXVA2CreateDirect3DDeviceManager9");
|
|
if (!CreateDeviceManager9) {
|
|
MP_ERR(p, "Failed to locate DXVA2CreateDirect3DDeviceManager9\n");
|
|
goto fail;
|
|
}
|
|
|
|
unsigned reset_token = 0;
|
|
hr = CreateDeviceManager9(&reset_token, &p->device_manager);
|
|
if (FAILED(hr)) {
|
|
MP_ERR(p, "Failed to create Direct3D device manager: %s\n",
|
|
mp_HRESULT_to_str(hr));
|
|
goto fail;
|
|
}
|
|
|
|
hr = IDirect3DDeviceManager9_ResetDevice(p->device_manager,
|
|
p->device, reset_token);
|
|
if (FAILED(hr)) {
|
|
MP_ERR(p, "Failed to bind Direct3D device to device manager: %s\n",
|
|
mp_HRESULT_to_str(hr));
|
|
goto fail;
|
|
}
|
|
|
|
hr = IDirect3DDeviceManager9_OpenDeviceHandle(p->device_manager,
|
|
&p->device_handle);
|
|
if (FAILED(hr)) {
|
|
MP_ERR(p, "Failed to open device handle: %s\n",
|
|
mp_HRESULT_to_str(hr));
|
|
goto fail;
|
|
}
|
|
|
|
hr = IDirect3DDeviceManager9_GetVideoService(
|
|
p->device_manager, p->device_handle, &IID_IDirectXVideoDecoderService,
|
|
(void **)&p->decoder_service);
|
|
if (FAILED(hr)) {
|
|
MP_ERR(p, "Failed to create IDirectXVideoDecoderService: %s\n",
|
|
mp_HRESULT_to_str(hr));
|
|
goto fail;
|
|
}
|
|
|
|
s->avctx->hwaccel_context = av_mallocz(sizeof(struct dxva_context));
|
|
if (!s->avctx->hwaccel_context)
|
|
goto fail;
|
|
|
|
return 0;
|
|
fail:
|
|
dxva2_uninit(s);
|
|
return -1;
|
|
}
|
|
|
|
static int dxva2_probe(struct lavc_ctx *ctx, struct vd_lavc_hwdec *hwdec,
|
|
const char *codec)
|
|
{
|
|
// dxva2-copy can do without external context; dxva2 requires it.
|
|
if (hwdec->type == HWDEC_DXVA2) {
|
|
if (!hwdec_devices_load(ctx->hwdec_devs, HWDEC_DXVA2))
|
|
return HWDEC_ERR_NO_CTX;
|
|
} else {
|
|
hwdec_devices_load(ctx->hwdec_devs, HWDEC_DXVA2_COPY);
|
|
}
|
|
return d3d_probe_codec(codec);
|
|
}
|
|
|
|
const struct vd_lavc_hwdec mp_vd_lavc_dxva2 = {
|
|
.type = HWDEC_DXVA2,
|
|
.image_format = IMGFMT_DXVA2,
|
|
.probe = dxva2_probe,
|
|
.init = dxva2_init,
|
|
.uninit = dxva2_uninit,
|
|
.init_decoder = dxva2_init_decoder,
|
|
.allocate_image = dxva2_allocate_image,
|
|
};
|
|
|
|
const struct vd_lavc_hwdec mp_vd_lavc_dxva2_copy = {
|
|
.type = HWDEC_DXVA2_COPY,
|
|
.copying = true,
|
|
.image_format = IMGFMT_DXVA2,
|
|
.probe = dxva2_probe,
|
|
.init = dxva2_init,
|
|
.uninit = dxva2_uninit,
|
|
.init_decoder = dxva2_init_decoder,
|
|
.allocate_image = dxva2_allocate_image,
|
|
.process_image = dxva2_retrieve_image,
|
|
.delay_queue = HWDEC_DELAY_QUEUE_COUNT,
|
|
};
|