mirror of
https://git.ffmpeg.org/ffmpeg.git
synced 2024-12-22 07:20:45 +00:00
ecee3b07cd
This allows user set hw_device_ctx instead of hw_frames_ctx for QSV decoders, hence we may remove the ad-hoc libmfx setup code from FFmpeg. "-hwaccel_output_format format" is applied to QSV decoders after removing the ad-hoc libmfx code. In order to keep compatibility with old commandlines, the default format is set to AV_PIX_FMT_QSV, but this behavior will be removed in the future. Please set "-hwaccel_output_format qsv" explicitly if AV_PIX_FMT_QSV is expected. The normal device stuff works for QSV decoders now, user may use "-init_hw_device args" to initialise device and "-hwaccel_device devicename" to select a device for QSV decoders. "-qsv_device device" which was added for workarounding device selection in the ad-hoc libmfx code still works For example: $> ffmpeg -init_hw_device qsv=qsv:hw_any,child_device=/dev/dri/card0 -hwaccel qsv -c:v h264_qsv -i input.h264 -f null - /dev/dri/renderD128 is actually open for h264_qsv decoder in the above command without this patch. After applying this patch, /dev/dri/card0 is used. $> ffmpeg -init_hw_device vaapi=va:/dev/dri/card0 -init_hw_device qsv=hw@va -hwaccel_device hw -hwaccel qsv -c:v h264_qsv -i input.h264 -f null - device hw of type qsv is not usable in the above command without this patch. After applying this patch, this command works as expected. Reviewed-by: Soft Works <softworkz@hotmail.com> Signed-off-by: James Almer <jamrial@gmail.com>
973 lines
31 KiB
C
973 lines
31 KiB
C
/*
|
|
* Intel MediaSDK QSV codec-independent code
|
|
*
|
|
* copyright (c) 2013 Luca Barbato
|
|
* copyright (c) 2015 Anton Khirnov <anton@khirnov.net>
|
|
*
|
|
* This file is part of FFmpeg.
|
|
*
|
|
* FFmpeg is free software; you can redistribute it and/or
|
|
* modify it under the terms of the GNU Lesser General Public
|
|
* License as published by the Free Software Foundation; either
|
|
* version 2.1 of the License, or (at your option) any later version.
|
|
*
|
|
* FFmpeg is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
* Lesser General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU Lesser General Public
|
|
* License along with FFmpeg; if not, write to the Free Software
|
|
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
|
|
*/
|
|
|
|
#include <stdint.h>
|
|
#include <string.h>
|
|
#include <sys/types.h>
|
|
|
|
#include <mfx/mfxvideo.h>
|
|
|
|
#include "libavutil/common.h"
|
|
#include "libavutil/fifo.h"
|
|
#include "libavutil/frame.h"
|
|
#include "libavutil/hwcontext.h"
|
|
#include "libavutil/hwcontext_qsv.h"
|
|
#include "libavutil/mem.h"
|
|
#include "libavutil/log.h"
|
|
#include "libavutil/opt.h"
|
|
#include "libavutil/pixfmt.h"
|
|
#include "libavutil/time.h"
|
|
#include "libavutil/imgutils.h"
|
|
|
|
#include "avcodec.h"
|
|
#include "internal.h"
|
|
#include "decode.h"
|
|
#include "hwconfig.h"
|
|
#include "qsv.h"
|
|
#include "qsv_internal.h"
|
|
|
|
static const AVRational mfx_tb = { 1, 90000 };
|
|
|
|
#define PTS_TO_MFX_PTS(pts, pts_tb) ((pts) == AV_NOPTS_VALUE ? \
|
|
MFX_TIMESTAMP_UNKNOWN : pts_tb.num ? \
|
|
av_rescale_q(pts, pts_tb, mfx_tb) : pts)
|
|
|
|
#define MFX_PTS_TO_PTS(mfx_pts, pts_tb) ((mfx_pts) == MFX_TIMESTAMP_UNKNOWN ? \
|
|
AV_NOPTS_VALUE : pts_tb.num ? \
|
|
av_rescale_q(mfx_pts, mfx_tb, pts_tb) : mfx_pts)
|
|
|
|
typedef struct QSVContext {
|
|
// the session used for decoding
|
|
mfxSession session;
|
|
|
|
// the session we allocated internally, in case the caller did not provide
|
|
// one
|
|
QSVSession internal_qs;
|
|
|
|
QSVFramesContext frames_ctx;
|
|
|
|
/**
|
|
* a linked list of frames currently being used by QSV
|
|
*/
|
|
QSVFrame *work_frames;
|
|
|
|
AVFifoBuffer *async_fifo;
|
|
int zero_consume_run;
|
|
int buffered_count;
|
|
int reinit_flag;
|
|
|
|
enum AVPixelFormat orig_pix_fmt;
|
|
uint32_t fourcc;
|
|
mfxFrameInfo frame_info;
|
|
AVBufferPool *pool;
|
|
|
|
int initialized;
|
|
|
|
// options set by the caller
|
|
int async_depth;
|
|
int iopattern;
|
|
int gpu_copy;
|
|
|
|
char *load_plugins;
|
|
|
|
mfxExtBuffer **ext_buffers;
|
|
int nb_ext_buffers;
|
|
} QSVContext;
|
|
|
|
static const AVCodecHWConfigInternal *const qsv_hw_configs[] = {
|
|
&(const AVCodecHWConfigInternal) {
|
|
.public = {
|
|
.pix_fmt = AV_PIX_FMT_QSV,
|
|
.methods = AV_CODEC_HW_CONFIG_METHOD_HW_FRAMES_CTX |
|
|
AV_CODEC_HW_CONFIG_METHOD_HW_DEVICE_CTX,
|
|
.device_type = AV_HWDEVICE_TYPE_QSV,
|
|
},
|
|
.hwaccel = NULL,
|
|
},
|
|
NULL
|
|
};
|
|
|
|
static int qsv_get_continuous_buffer(AVCodecContext *avctx, AVFrame *frame,
|
|
AVBufferPool *pool)
|
|
{
|
|
int ret = 0;
|
|
|
|
ff_decode_frame_props(avctx, frame);
|
|
|
|
frame->width = avctx->width;
|
|
frame->height = avctx->height;
|
|
|
|
switch (avctx->pix_fmt) {
|
|
case AV_PIX_FMT_NV12:
|
|
frame->linesize[0] = FFALIGN(avctx->width, 128);
|
|
break;
|
|
case AV_PIX_FMT_P010:
|
|
frame->linesize[0] = 2 * FFALIGN(avctx->width, 128);
|
|
break;
|
|
default:
|
|
av_log(avctx, AV_LOG_ERROR, "Unsupported pixel format.\n");
|
|
return AVERROR(EINVAL);
|
|
}
|
|
|
|
frame->linesize[1] = frame->linesize[0];
|
|
frame->buf[0] = av_buffer_pool_get(pool);
|
|
if (!frame->buf[0])
|
|
return AVERROR(ENOMEM);
|
|
|
|
frame->data[0] = frame->buf[0]->data;
|
|
frame->data[1] = frame->data[0] +
|
|
frame->linesize[0] * FFALIGN(avctx->height, 64);
|
|
|
|
ret = ff_attach_decode_data(frame);
|
|
if (ret < 0)
|
|
return ret;
|
|
|
|
return 0;
|
|
}
|
|
|
|
static int qsv_init_session(AVCodecContext *avctx, QSVContext *q, mfxSession session,
|
|
AVBufferRef *hw_frames_ref, AVBufferRef *hw_device_ref)
|
|
{
|
|
int ret;
|
|
|
|
if (q->gpu_copy == MFX_GPUCOPY_ON &&
|
|
!(q->iopattern & MFX_IOPATTERN_OUT_SYSTEM_MEMORY)) {
|
|
av_log(avctx, AV_LOG_WARNING, "GPU-accelerated memory copy "
|
|
"only works in system memory mode.\n");
|
|
q->gpu_copy = MFX_GPUCOPY_OFF;
|
|
}
|
|
if (session) {
|
|
q->session = session;
|
|
} else if (hw_frames_ref) {
|
|
if (q->internal_qs.session) {
|
|
MFXClose(q->internal_qs.session);
|
|
q->internal_qs.session = NULL;
|
|
}
|
|
av_buffer_unref(&q->frames_ctx.hw_frames_ctx);
|
|
|
|
q->frames_ctx.hw_frames_ctx = av_buffer_ref(hw_frames_ref);
|
|
if (!q->frames_ctx.hw_frames_ctx)
|
|
return AVERROR(ENOMEM);
|
|
|
|
ret = ff_qsv_init_session_frames(avctx, &q->internal_qs.session,
|
|
&q->frames_ctx, q->load_plugins,
|
|
q->iopattern == MFX_IOPATTERN_OUT_OPAQUE_MEMORY,
|
|
q->gpu_copy);
|
|
if (ret < 0) {
|
|
av_buffer_unref(&q->frames_ctx.hw_frames_ctx);
|
|
return ret;
|
|
}
|
|
|
|
q->session = q->internal_qs.session;
|
|
} else if (hw_device_ref) {
|
|
if (q->internal_qs.session) {
|
|
MFXClose(q->internal_qs.session);
|
|
q->internal_qs.session = NULL;
|
|
}
|
|
|
|
ret = ff_qsv_init_session_device(avctx, &q->internal_qs.session,
|
|
hw_device_ref, q->load_plugins, q->gpu_copy);
|
|
if (ret < 0)
|
|
return ret;
|
|
|
|
q->session = q->internal_qs.session;
|
|
} else {
|
|
if (!q->internal_qs.session) {
|
|
ret = ff_qsv_init_internal_session(avctx, &q->internal_qs,
|
|
q->load_plugins, q->gpu_copy);
|
|
if (ret < 0)
|
|
return ret;
|
|
}
|
|
|
|
q->session = q->internal_qs.session;
|
|
}
|
|
|
|
/* make sure the decoder is uninitialized */
|
|
MFXVideoDECODE_Close(q->session);
|
|
|
|
return 0;
|
|
}
|
|
|
|
static inline unsigned int qsv_fifo_item_size(void)
|
|
{
|
|
return sizeof(mfxSyncPoint*) + sizeof(QSVFrame*);
|
|
}
|
|
|
|
static inline unsigned int qsv_fifo_size(const AVFifoBuffer* fifo)
|
|
{
|
|
return av_fifo_size(fifo) / qsv_fifo_item_size();
|
|
}
|
|
|
|
static int qsv_decode_preinit(AVCodecContext *avctx, QSVContext *q, enum AVPixelFormat pix_fmt, mfxVideoParam *param)
|
|
{
|
|
mfxSession session = NULL;
|
|
int iopattern = 0;
|
|
int ret;
|
|
enum AVPixelFormat pix_fmts[3] = {
|
|
AV_PIX_FMT_QSV, /* opaque format in case of video memory output */
|
|
pix_fmt, /* system memory format obtained from bitstream parser */
|
|
AV_PIX_FMT_NONE };
|
|
|
|
ret = ff_get_format(avctx, pix_fmts);
|
|
if (ret < 0) {
|
|
q->orig_pix_fmt = avctx->pix_fmt = AV_PIX_FMT_NONE;
|
|
return ret;
|
|
}
|
|
|
|
if (!q->async_fifo) {
|
|
q->async_fifo = av_fifo_alloc(q->async_depth * qsv_fifo_item_size());
|
|
if (!q->async_fifo)
|
|
return AVERROR(ENOMEM);
|
|
}
|
|
|
|
if (avctx->pix_fmt == AV_PIX_FMT_QSV && avctx->hwaccel_context) {
|
|
AVQSVContext *user_ctx = avctx->hwaccel_context;
|
|
session = user_ctx->session;
|
|
iopattern = user_ctx->iopattern;
|
|
q->ext_buffers = user_ctx->ext_buffers;
|
|
q->nb_ext_buffers = user_ctx->nb_ext_buffers;
|
|
}
|
|
|
|
if (avctx->hw_device_ctx && !avctx->hw_frames_ctx && ret == AV_PIX_FMT_QSV) {
|
|
AVHWFramesContext *hwframes_ctx;
|
|
AVQSVFramesContext *frames_hwctx;
|
|
|
|
avctx->hw_frames_ctx = av_hwframe_ctx_alloc(avctx->hw_device_ctx);
|
|
|
|
if (!avctx->hw_frames_ctx) {
|
|
av_log(avctx, AV_LOG_ERROR, "av_hwframe_ctx_alloc failed\n");
|
|
return AVERROR(ENOMEM);
|
|
}
|
|
|
|
hwframes_ctx = (AVHWFramesContext*)avctx->hw_frames_ctx->data;
|
|
frames_hwctx = hwframes_ctx->hwctx;
|
|
hwframes_ctx->width = FFALIGN(avctx->coded_width, 32);
|
|
hwframes_ctx->height = FFALIGN(avctx->coded_height, 32);
|
|
hwframes_ctx->format = AV_PIX_FMT_QSV;
|
|
hwframes_ctx->sw_format = avctx->sw_pix_fmt;
|
|
hwframes_ctx->initial_pool_size = 64 + avctx->extra_hw_frames;
|
|
frames_hwctx->frame_type = MFX_MEMTYPE_VIDEO_MEMORY_DECODER_TARGET;
|
|
|
|
ret = av_hwframe_ctx_init(avctx->hw_frames_ctx);
|
|
|
|
if (ret < 0) {
|
|
av_log(NULL, AV_LOG_ERROR, "Error initializing a QSV frame pool\n");
|
|
av_buffer_unref(&avctx->hw_frames_ctx);
|
|
return ret;
|
|
}
|
|
}
|
|
|
|
if (avctx->hw_frames_ctx) {
|
|
AVHWFramesContext *frames_ctx = (AVHWFramesContext*)avctx->hw_frames_ctx->data;
|
|
AVQSVFramesContext *frames_hwctx = frames_ctx->hwctx;
|
|
|
|
if (!iopattern) {
|
|
if (frames_hwctx->frame_type & MFX_MEMTYPE_OPAQUE_FRAME)
|
|
iopattern = MFX_IOPATTERN_OUT_OPAQUE_MEMORY;
|
|
else if (frames_hwctx->frame_type & MFX_MEMTYPE_VIDEO_MEMORY_DECODER_TARGET)
|
|
iopattern = MFX_IOPATTERN_OUT_VIDEO_MEMORY;
|
|
}
|
|
}
|
|
|
|
if (!iopattern)
|
|
iopattern = MFX_IOPATTERN_OUT_SYSTEM_MEMORY;
|
|
q->iopattern = iopattern;
|
|
|
|
ff_qsv_print_iopattern(avctx, q->iopattern, "Decoder");
|
|
|
|
ret = qsv_init_session(avctx, q, session, avctx->hw_frames_ctx, avctx->hw_device_ctx);
|
|
if (ret < 0) {
|
|
av_log(avctx, AV_LOG_ERROR, "Error initializing an MFX session\n");
|
|
return ret;
|
|
}
|
|
|
|
param->IOPattern = q->iopattern;
|
|
param->AsyncDepth = q->async_depth;
|
|
param->ExtParam = q->ext_buffers;
|
|
param->NumExtParam = q->nb_ext_buffers;
|
|
|
|
return 0;
|
|
}
|
|
|
|
static int qsv_decode_init_context(AVCodecContext *avctx, QSVContext *q, mfxVideoParam *param)
|
|
{
|
|
int ret;
|
|
|
|
avctx->width = param->mfx.FrameInfo.CropW;
|
|
avctx->height = param->mfx.FrameInfo.CropH;
|
|
avctx->coded_width = param->mfx.FrameInfo.Width;
|
|
avctx->coded_height = param->mfx.FrameInfo.Height;
|
|
avctx->level = param->mfx.CodecLevel;
|
|
avctx->profile = param->mfx.CodecProfile;
|
|
avctx->field_order = ff_qsv_map_picstruct(param->mfx.FrameInfo.PicStruct);
|
|
avctx->pix_fmt = ff_qsv_map_fourcc(param->mfx.FrameInfo.FourCC);
|
|
|
|
ret = MFXVideoDECODE_Init(q->session, param);
|
|
if (ret < 0)
|
|
return ff_qsv_print_error(avctx, ret,
|
|
"Error initializing the MFX video decoder");
|
|
|
|
q->frame_info = param->mfx.FrameInfo;
|
|
|
|
if (!avctx->hw_frames_ctx)
|
|
q->pool = av_buffer_pool_init(av_image_get_buffer_size(avctx->pix_fmt,
|
|
FFALIGN(avctx->width, 128), FFALIGN(avctx->height, 64), 1), av_buffer_allocz);
|
|
return 0;
|
|
}
|
|
|
|
static int qsv_decode_header(AVCodecContext *avctx, QSVContext *q,
|
|
const AVPacket *avpkt, enum AVPixelFormat pix_fmt,
|
|
mfxVideoParam *param)
|
|
{
|
|
int ret;
|
|
mfxExtVideoSignalInfo video_signal_info = { 0 };
|
|
mfxExtBuffer *header_ext_params[1] = { (mfxExtBuffer *)&video_signal_info };
|
|
mfxBitstream bs = { 0 };
|
|
|
|
if (avpkt->size) {
|
|
bs.Data = avpkt->data;
|
|
bs.DataLength = avpkt->size;
|
|
bs.MaxLength = bs.DataLength;
|
|
bs.TimeStamp = PTS_TO_MFX_PTS(avpkt->pts, avctx->pkt_timebase);
|
|
if (avctx->field_order == AV_FIELD_PROGRESSIVE)
|
|
bs.DataFlag |= MFX_BITSTREAM_COMPLETE_FRAME;
|
|
} else
|
|
return AVERROR_INVALIDDATA;
|
|
|
|
|
|
if(!q->session) {
|
|
ret = qsv_decode_preinit(avctx, q, pix_fmt, param);
|
|
if (ret < 0)
|
|
return ret;
|
|
}
|
|
|
|
ret = ff_qsv_codec_id_to_mfx(avctx->codec_id);
|
|
if (ret < 0)
|
|
return ret;
|
|
|
|
param->mfx.CodecId = ret;
|
|
video_signal_info.Header.BufferId = MFX_EXTBUFF_VIDEO_SIGNAL_INFO;
|
|
video_signal_info.Header.BufferSz = sizeof(video_signal_info);
|
|
// The SDK doesn't support other ext buffers when calling MFXVideoDECODE_DecodeHeader,
|
|
// so do not append this buffer to the existent buffer array
|
|
param->ExtParam = header_ext_params;
|
|
param->NumExtParam = 1;
|
|
ret = MFXVideoDECODE_DecodeHeader(q->session, &bs, param);
|
|
if (MFX_ERR_MORE_DATA == ret) {
|
|
return AVERROR(EAGAIN);
|
|
}
|
|
if (ret < 0)
|
|
return ff_qsv_print_error(avctx, ret,
|
|
"Error decoding stream header");
|
|
|
|
avctx->color_range = video_signal_info.VideoFullRange ? AVCOL_RANGE_JPEG : AVCOL_RANGE_MPEG;
|
|
|
|
if (video_signal_info.ColourDescriptionPresent) {
|
|
avctx->color_primaries = video_signal_info.ColourPrimaries;
|
|
avctx->color_trc = video_signal_info.TransferCharacteristics;
|
|
avctx->colorspace = video_signal_info.MatrixCoefficients;
|
|
}
|
|
|
|
param->ExtParam = q->ext_buffers;
|
|
param->NumExtParam = q->nb_ext_buffers;
|
|
|
|
return 0;
|
|
}
|
|
|
|
static int alloc_frame(AVCodecContext *avctx, QSVContext *q, QSVFrame *frame)
|
|
{
|
|
int ret;
|
|
|
|
if (q->pool)
|
|
ret = qsv_get_continuous_buffer(avctx, frame->frame, q->pool);
|
|
else
|
|
ret = ff_get_buffer(avctx, frame->frame, AV_GET_BUFFER_FLAG_REF);
|
|
|
|
if (ret < 0)
|
|
return ret;
|
|
|
|
if (frame->frame->format == AV_PIX_FMT_QSV) {
|
|
frame->surface = *(mfxFrameSurface1*)frame->frame->data[3];
|
|
} else {
|
|
frame->surface.Info = q->frame_info;
|
|
|
|
frame->surface.Data.PitchLow = frame->frame->linesize[0];
|
|
frame->surface.Data.Y = frame->frame->data[0];
|
|
frame->surface.Data.UV = frame->frame->data[1];
|
|
}
|
|
|
|
if (q->frames_ctx.mids) {
|
|
ret = ff_qsv_find_surface_idx(&q->frames_ctx, frame);
|
|
if (ret < 0)
|
|
return ret;
|
|
|
|
frame->surface.Data.MemId = &q->frames_ctx.mids[ret];
|
|
}
|
|
frame->surface.Data.ExtParam = &frame->ext_param;
|
|
frame->surface.Data.NumExtParam = 1;
|
|
frame->ext_param = (mfxExtBuffer*)&frame->dec_info;
|
|
frame->dec_info.Header.BufferId = MFX_EXTBUFF_DECODED_FRAME_INFO;
|
|
frame->dec_info.Header.BufferSz = sizeof(frame->dec_info);
|
|
|
|
frame->used = 1;
|
|
|
|
return 0;
|
|
}
|
|
|
|
static void qsv_clear_unused_frames(QSVContext *q)
|
|
{
|
|
QSVFrame *cur = q->work_frames;
|
|
while (cur) {
|
|
if (cur->used && !cur->surface.Data.Locked && !cur->queued) {
|
|
cur->used = 0;
|
|
av_frame_unref(cur->frame);
|
|
}
|
|
cur = cur->next;
|
|
}
|
|
}
|
|
|
|
static int get_surface(AVCodecContext *avctx, QSVContext *q, mfxFrameSurface1 **surf)
|
|
{
|
|
QSVFrame *frame, **last;
|
|
int ret;
|
|
|
|
qsv_clear_unused_frames(q);
|
|
|
|
frame = q->work_frames;
|
|
last = &q->work_frames;
|
|
while (frame) {
|
|
if (!frame->used) {
|
|
ret = alloc_frame(avctx, q, frame);
|
|
if (ret < 0)
|
|
return ret;
|
|
*surf = &frame->surface;
|
|
return 0;
|
|
}
|
|
|
|
last = &frame->next;
|
|
frame = frame->next;
|
|
}
|
|
|
|
frame = av_mallocz(sizeof(*frame));
|
|
if (!frame)
|
|
return AVERROR(ENOMEM);
|
|
frame->frame = av_frame_alloc();
|
|
if (!frame->frame) {
|
|
av_freep(&frame);
|
|
return AVERROR(ENOMEM);
|
|
}
|
|
*last = frame;
|
|
|
|
ret = alloc_frame(avctx, q, frame);
|
|
if (ret < 0)
|
|
return ret;
|
|
|
|
*surf = &frame->surface;
|
|
|
|
return 0;
|
|
}
|
|
|
|
static QSVFrame *find_frame(QSVContext *q, mfxFrameSurface1 *surf)
|
|
{
|
|
QSVFrame *cur = q->work_frames;
|
|
while (cur) {
|
|
if (surf == &cur->surface)
|
|
return cur;
|
|
cur = cur->next;
|
|
}
|
|
return NULL;
|
|
}
|
|
|
|
static int qsv_decode(AVCodecContext *avctx, QSVContext *q,
|
|
AVFrame *frame, int *got_frame,
|
|
const AVPacket *avpkt)
|
|
{
|
|
QSVFrame *out_frame;
|
|
mfxFrameSurface1 *insurf;
|
|
mfxFrameSurface1 *outsurf;
|
|
mfxSyncPoint *sync;
|
|
mfxBitstream bs = { { { 0 } } };
|
|
int ret;
|
|
|
|
if (avpkt->size) {
|
|
bs.Data = avpkt->data;
|
|
bs.DataLength = avpkt->size;
|
|
bs.MaxLength = bs.DataLength;
|
|
bs.TimeStamp = PTS_TO_MFX_PTS(avpkt->pts, avctx->pkt_timebase);
|
|
if (avctx->field_order == AV_FIELD_PROGRESSIVE)
|
|
bs.DataFlag |= MFX_BITSTREAM_COMPLETE_FRAME;
|
|
}
|
|
|
|
sync = av_mallocz(sizeof(*sync));
|
|
if (!sync) {
|
|
av_freep(&sync);
|
|
return AVERROR(ENOMEM);
|
|
}
|
|
|
|
do {
|
|
ret = get_surface(avctx, q, &insurf);
|
|
if (ret < 0) {
|
|
av_freep(&sync);
|
|
return ret;
|
|
}
|
|
|
|
ret = MFXVideoDECODE_DecodeFrameAsync(q->session, avpkt->size ? &bs : NULL,
|
|
insurf, &outsurf, sync);
|
|
if (ret == MFX_WRN_DEVICE_BUSY)
|
|
av_usleep(500);
|
|
|
|
} while (ret == MFX_WRN_DEVICE_BUSY || ret == MFX_ERR_MORE_SURFACE);
|
|
|
|
if (ret != MFX_ERR_NONE &&
|
|
ret != MFX_ERR_MORE_DATA &&
|
|
ret != MFX_WRN_VIDEO_PARAM_CHANGED &&
|
|
ret != MFX_ERR_MORE_SURFACE) {
|
|
av_freep(&sync);
|
|
return ff_qsv_print_error(avctx, ret,
|
|
"Error during QSV decoding.");
|
|
}
|
|
|
|
/* make sure we do not enter an infinite loop if the SDK
|
|
* did not consume any data and did not return anything */
|
|
if (!*sync && !bs.DataOffset) {
|
|
bs.DataOffset = avpkt->size;
|
|
++q->zero_consume_run;
|
|
if (q->zero_consume_run > 1)
|
|
ff_qsv_print_warning(avctx, ret, "A decode call did not consume any data");
|
|
} else if (!*sync && bs.DataOffset) {
|
|
++q->buffered_count;
|
|
} else {
|
|
q->zero_consume_run = 0;
|
|
}
|
|
|
|
if (*sync) {
|
|
QSVFrame *out_frame = find_frame(q, outsurf);
|
|
|
|
if (!out_frame) {
|
|
av_log(avctx, AV_LOG_ERROR,
|
|
"The returned surface does not correspond to any frame\n");
|
|
av_freep(&sync);
|
|
return AVERROR_BUG;
|
|
}
|
|
|
|
out_frame->queued = 1;
|
|
av_fifo_generic_write(q->async_fifo, &out_frame, sizeof(out_frame), NULL);
|
|
av_fifo_generic_write(q->async_fifo, &sync, sizeof(sync), NULL);
|
|
} else {
|
|
av_freep(&sync);
|
|
}
|
|
|
|
if ((qsv_fifo_size(q->async_fifo) >= q->async_depth) ||
|
|
(!avpkt->size && av_fifo_size(q->async_fifo))) {
|
|
AVFrame *src_frame;
|
|
|
|
av_fifo_generic_read(q->async_fifo, &out_frame, sizeof(out_frame), NULL);
|
|
av_fifo_generic_read(q->async_fifo, &sync, sizeof(sync), NULL);
|
|
out_frame->queued = 0;
|
|
|
|
if (avctx->pix_fmt != AV_PIX_FMT_QSV) {
|
|
do {
|
|
ret = MFXVideoCORE_SyncOperation(q->session, *sync, 1000);
|
|
} while (ret == MFX_WRN_IN_EXECUTION);
|
|
}
|
|
|
|
av_freep(&sync);
|
|
|
|
src_frame = out_frame->frame;
|
|
|
|
ret = av_frame_ref(frame, src_frame);
|
|
if (ret < 0)
|
|
return ret;
|
|
|
|
outsurf = &out_frame->surface;
|
|
|
|
frame->pts = MFX_PTS_TO_PTS(outsurf->Data.TimeStamp, avctx->pkt_timebase);
|
|
|
|
frame->repeat_pict =
|
|
outsurf->Info.PicStruct & MFX_PICSTRUCT_FRAME_TRIPLING ? 4 :
|
|
outsurf->Info.PicStruct & MFX_PICSTRUCT_FRAME_DOUBLING ? 2 :
|
|
outsurf->Info.PicStruct & MFX_PICSTRUCT_FIELD_REPEATED ? 1 : 0;
|
|
frame->top_field_first =
|
|
outsurf->Info.PicStruct & MFX_PICSTRUCT_FIELD_TFF;
|
|
frame->interlaced_frame =
|
|
!(outsurf->Info.PicStruct & MFX_PICSTRUCT_PROGRESSIVE);
|
|
frame->pict_type = ff_qsv_map_pictype(out_frame->dec_info.FrameType);
|
|
//Key frame is IDR frame is only suitable for H264. For HEVC, IRAPs are key frames.
|
|
if (avctx->codec_id == AV_CODEC_ID_H264)
|
|
frame->key_frame = !!(out_frame->dec_info.FrameType & MFX_FRAMETYPE_IDR);
|
|
|
|
/* update the surface properties */
|
|
if (avctx->pix_fmt == AV_PIX_FMT_QSV)
|
|
((mfxFrameSurface1*)frame->data[3])->Info = outsurf->Info;
|
|
|
|
*got_frame = 1;
|
|
}
|
|
|
|
return bs.DataOffset;
|
|
}
|
|
|
|
static void qsv_decode_close_qsvcontext(QSVContext *q)
|
|
{
|
|
QSVFrame *cur = q->work_frames;
|
|
|
|
if (q->session)
|
|
MFXVideoDECODE_Close(q->session);
|
|
|
|
while (q->async_fifo && av_fifo_size(q->async_fifo)) {
|
|
QSVFrame *out_frame;
|
|
mfxSyncPoint *sync;
|
|
|
|
av_fifo_generic_read(q->async_fifo, &out_frame, sizeof(out_frame), NULL);
|
|
av_fifo_generic_read(q->async_fifo, &sync, sizeof(sync), NULL);
|
|
|
|
av_freep(&sync);
|
|
}
|
|
|
|
while (cur) {
|
|
q->work_frames = cur->next;
|
|
av_frame_free(&cur->frame);
|
|
av_freep(&cur);
|
|
cur = q->work_frames;
|
|
}
|
|
|
|
av_fifo_free(q->async_fifo);
|
|
q->async_fifo = NULL;
|
|
|
|
ff_qsv_close_internal_session(&q->internal_qs);
|
|
|
|
av_buffer_unref(&q->frames_ctx.hw_frames_ctx);
|
|
av_buffer_unref(&q->frames_ctx.mids_buf);
|
|
av_buffer_pool_uninit(&q->pool);
|
|
}
|
|
|
|
static int qsv_process_data(AVCodecContext *avctx, QSVContext *q,
|
|
AVFrame *frame, int *got_frame, const AVPacket *pkt)
|
|
{
|
|
int ret;
|
|
mfxVideoParam param = { 0 };
|
|
enum AVPixelFormat pix_fmt = AV_PIX_FMT_NV12;
|
|
|
|
if (!pkt->size)
|
|
return qsv_decode(avctx, q, frame, got_frame, pkt);
|
|
|
|
/* TODO: flush delayed frames on reinit */
|
|
|
|
// sw_pix_fmt, coded_width/height should be set for ff_get_format(),
|
|
// assume sw_pix_fmt is NV12 and coded_width/height to be 1280x720,
|
|
// the assumption may be not corret but will be updated after header decoded if not true.
|
|
if (q->orig_pix_fmt != AV_PIX_FMT_NONE)
|
|
pix_fmt = q->orig_pix_fmt;
|
|
if (!avctx->coded_width)
|
|
avctx->coded_width = 1280;
|
|
if (!avctx->coded_height)
|
|
avctx->coded_height = 720;
|
|
|
|
ret = qsv_decode_header(avctx, q, pkt, pix_fmt, ¶m);
|
|
|
|
if (ret >= 0 && (q->orig_pix_fmt != ff_qsv_map_fourcc(param.mfx.FrameInfo.FourCC) ||
|
|
avctx->coded_width != param.mfx.FrameInfo.Width ||
|
|
avctx->coded_height != param.mfx.FrameInfo.Height)) {
|
|
AVPacket zero_pkt = {0};
|
|
|
|
if (q->buffered_count) {
|
|
q->reinit_flag = 1;
|
|
/* decode zero-size pkt to flush the buffered pkt before reinit */
|
|
q->buffered_count--;
|
|
return qsv_decode(avctx, q, frame, got_frame, &zero_pkt);
|
|
}
|
|
q->reinit_flag = 0;
|
|
|
|
q->orig_pix_fmt = avctx->pix_fmt = pix_fmt = ff_qsv_map_fourcc(param.mfx.FrameInfo.FourCC);
|
|
|
|
avctx->coded_width = param.mfx.FrameInfo.Width;
|
|
avctx->coded_height = param.mfx.FrameInfo.Height;
|
|
|
|
ret = qsv_decode_preinit(avctx, q, pix_fmt, ¶m);
|
|
if (ret < 0)
|
|
goto reinit_fail;
|
|
q->initialized = 0;
|
|
}
|
|
|
|
if (!q->initialized) {
|
|
ret = qsv_decode_init_context(avctx, q, ¶m);
|
|
if (ret < 0)
|
|
goto reinit_fail;
|
|
q->initialized = 1;
|
|
}
|
|
|
|
return qsv_decode(avctx, q, frame, got_frame, pkt);
|
|
|
|
reinit_fail:
|
|
q->orig_pix_fmt = avctx->pix_fmt = AV_PIX_FMT_NONE;
|
|
return ret;
|
|
}
|
|
|
|
enum LoadPlugin {
|
|
LOAD_PLUGIN_NONE,
|
|
LOAD_PLUGIN_HEVC_SW,
|
|
LOAD_PLUGIN_HEVC_HW,
|
|
};
|
|
|
|
typedef struct QSVDecContext {
|
|
AVClass *class;
|
|
QSVContext qsv;
|
|
|
|
int load_plugin;
|
|
|
|
AVFifoBuffer *packet_fifo;
|
|
|
|
AVPacket buffer_pkt;
|
|
} QSVDecContext;
|
|
|
|
static void qsv_clear_buffers(QSVDecContext *s)
|
|
{
|
|
AVPacket pkt;
|
|
while (av_fifo_size(s->packet_fifo) >= sizeof(pkt)) {
|
|
av_fifo_generic_read(s->packet_fifo, &pkt, sizeof(pkt), NULL);
|
|
av_packet_unref(&pkt);
|
|
}
|
|
|
|
av_packet_unref(&s->buffer_pkt);
|
|
}
|
|
|
|
static av_cold int qsv_decode_close(AVCodecContext *avctx)
|
|
{
|
|
QSVDecContext *s = avctx->priv_data;
|
|
|
|
av_freep(&s->qsv.load_plugins);
|
|
|
|
qsv_decode_close_qsvcontext(&s->qsv);
|
|
|
|
qsv_clear_buffers(s);
|
|
|
|
av_fifo_free(s->packet_fifo);
|
|
|
|
return 0;
|
|
}
|
|
|
|
static av_cold int qsv_decode_init(AVCodecContext *avctx)
|
|
{
|
|
QSVDecContext *s = avctx->priv_data;
|
|
int ret;
|
|
const char *uid = NULL;
|
|
|
|
if (avctx->codec_id == AV_CODEC_ID_VP8) {
|
|
uid = "f622394d8d87452f878c51f2fc9b4131";
|
|
} else if (avctx->codec_id == AV_CODEC_ID_VP9) {
|
|
uid = "a922394d8d87452f878c51f2fc9b4131";
|
|
}
|
|
else if (avctx->codec_id == AV_CODEC_ID_HEVC && s->load_plugin != LOAD_PLUGIN_NONE) {
|
|
static const char * const uid_hevcdec_sw = "15dd936825ad475ea34e35f3f54217a6";
|
|
static const char * const uid_hevcdec_hw = "33a61c0b4c27454ca8d85dde757c6f8e";
|
|
|
|
if (s->qsv.load_plugins[0]) {
|
|
av_log(avctx, AV_LOG_WARNING,
|
|
"load_plugins is not empty, but load_plugin is not set to 'none'."
|
|
"The load_plugin value will be ignored.\n");
|
|
} else {
|
|
if (s->load_plugin == LOAD_PLUGIN_HEVC_SW)
|
|
uid = uid_hevcdec_sw;
|
|
else
|
|
uid = uid_hevcdec_hw;
|
|
}
|
|
}
|
|
if (uid) {
|
|
av_freep(&s->qsv.load_plugins);
|
|
s->qsv.load_plugins = av_strdup(uid);
|
|
if (!s->qsv.load_plugins)
|
|
return AVERROR(ENOMEM);
|
|
}
|
|
|
|
s->qsv.orig_pix_fmt = AV_PIX_FMT_NV12;
|
|
s->packet_fifo = av_fifo_alloc(sizeof(AVPacket));
|
|
if (!s->packet_fifo) {
|
|
ret = AVERROR(ENOMEM);
|
|
goto fail;
|
|
}
|
|
|
|
if (!avctx->pkt_timebase.num)
|
|
av_log(avctx, AV_LOG_WARNING, "Invalid pkt_timebase, passing timestamps as-is.\n");
|
|
|
|
return 0;
|
|
fail:
|
|
qsv_decode_close(avctx);
|
|
return ret;
|
|
}
|
|
|
|
static int qsv_decode_frame(AVCodecContext *avctx, void *data,
|
|
int *got_frame, AVPacket *avpkt)
|
|
{
|
|
QSVDecContext *s = avctx->priv_data;
|
|
AVFrame *frame = data;
|
|
int ret;
|
|
|
|
/* buffer the input packet */
|
|
if (avpkt->size) {
|
|
AVPacket input_ref;
|
|
|
|
if (av_fifo_space(s->packet_fifo) < sizeof(input_ref)) {
|
|
ret = av_fifo_realloc2(s->packet_fifo,
|
|
av_fifo_size(s->packet_fifo) + sizeof(input_ref));
|
|
if (ret < 0)
|
|
return ret;
|
|
}
|
|
|
|
ret = av_packet_ref(&input_ref, avpkt);
|
|
if (ret < 0)
|
|
return ret;
|
|
av_fifo_generic_write(s->packet_fifo, &input_ref, sizeof(input_ref), NULL);
|
|
}
|
|
|
|
/* process buffered data */
|
|
while (!*got_frame) {
|
|
/* prepare the input data */
|
|
if (s->buffer_pkt.size <= 0) {
|
|
/* no more data */
|
|
if (av_fifo_size(s->packet_fifo) < sizeof(AVPacket))
|
|
return avpkt->size ? avpkt->size : qsv_process_data(avctx, &s->qsv, frame, got_frame, avpkt);
|
|
/* in progress of reinit, no read from fifo and keep the buffer_pkt */
|
|
if (!s->qsv.reinit_flag) {
|
|
av_packet_unref(&s->buffer_pkt);
|
|
av_fifo_generic_read(s->packet_fifo, &s->buffer_pkt, sizeof(s->buffer_pkt), NULL);
|
|
}
|
|
}
|
|
|
|
ret = qsv_process_data(avctx, &s->qsv, frame, got_frame, &s->buffer_pkt);
|
|
if (ret < 0){
|
|
/* Drop buffer_pkt when failed to decode the packet. Otherwise,
|
|
the decoder will keep decoding the failure packet. */
|
|
av_packet_unref(&s->buffer_pkt);
|
|
return ret;
|
|
}
|
|
if (s->qsv.reinit_flag)
|
|
continue;
|
|
|
|
s->buffer_pkt.size -= ret;
|
|
s->buffer_pkt.data += ret;
|
|
}
|
|
|
|
return avpkt->size;
|
|
}
|
|
|
|
static void qsv_decode_flush(AVCodecContext *avctx)
|
|
{
|
|
QSVDecContext *s = avctx->priv_data;
|
|
|
|
qsv_clear_buffers(s);
|
|
|
|
s->qsv.orig_pix_fmt = AV_PIX_FMT_NONE;
|
|
s->qsv.initialized = 0;
|
|
}
|
|
|
|
#define OFFSET(x) offsetof(QSVDecContext, x)
|
|
#define VD AV_OPT_FLAG_VIDEO_PARAM | AV_OPT_FLAG_DECODING_PARAM
|
|
|
|
#define DEFINE_QSV_DECODER_WITH_OPTION(x, X, bsf_name, opt) \
|
|
static const AVClass x##_qsv_class = { \
|
|
.class_name = #x "_qsv", \
|
|
.item_name = av_default_item_name, \
|
|
.option = opt, \
|
|
.version = LIBAVUTIL_VERSION_INT, \
|
|
}; \
|
|
const AVCodec ff_##x##_qsv_decoder = { \
|
|
.name = #x "_qsv", \
|
|
.long_name = NULL_IF_CONFIG_SMALL(#X " video (Intel Quick Sync Video acceleration)"), \
|
|
.priv_data_size = sizeof(QSVDecContext), \
|
|
.type = AVMEDIA_TYPE_VIDEO, \
|
|
.id = AV_CODEC_ID_##X, \
|
|
.init = qsv_decode_init, \
|
|
.decode = qsv_decode_frame, \
|
|
.flush = qsv_decode_flush, \
|
|
.close = qsv_decode_close, \
|
|
.bsfs = bsf_name, \
|
|
.capabilities = AV_CODEC_CAP_DELAY | AV_CODEC_CAP_DR1 | AV_CODEC_CAP_AVOID_PROBING | AV_CODEC_CAP_HYBRID, \
|
|
.priv_class = &x##_qsv_class, \
|
|
.pix_fmts = (const enum AVPixelFormat[]){ AV_PIX_FMT_NV12, \
|
|
AV_PIX_FMT_P010, \
|
|
AV_PIX_FMT_QSV, \
|
|
AV_PIX_FMT_NONE }, \
|
|
.hw_configs = qsv_hw_configs, \
|
|
.wrapper_name = "qsv", \
|
|
}; \
|
|
|
|
#define DEFINE_QSV_DECODER(x, X, bsf_name) DEFINE_QSV_DECODER_WITH_OPTION(x, X, bsf_name, options)
|
|
|
|
#if CONFIG_HEVC_QSV_DECODER
|
|
static const AVOption hevc_options[] = {
|
|
{ "async_depth", "Internal parallelization depth, the higher the value the higher the latency.", OFFSET(qsv.async_depth), AV_OPT_TYPE_INT, { .i64 = ASYNC_DEPTH_DEFAULT }, 1, INT_MAX, VD },
|
|
|
|
{ "load_plugin", "A user plugin to load in an internal session", OFFSET(load_plugin), AV_OPT_TYPE_INT, { .i64 = LOAD_PLUGIN_HEVC_HW }, LOAD_PLUGIN_NONE, LOAD_PLUGIN_HEVC_HW, VD, "load_plugin" },
|
|
{ "none", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = LOAD_PLUGIN_NONE }, 0, 0, VD, "load_plugin" },
|
|
{ "hevc_sw", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = LOAD_PLUGIN_HEVC_SW }, 0, 0, VD, "load_plugin" },
|
|
{ "hevc_hw", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = LOAD_PLUGIN_HEVC_HW }, 0, 0, VD, "load_plugin" },
|
|
|
|
{ "load_plugins", "A :-separate list of hexadecimal plugin UIDs to load in an internal session",
|
|
OFFSET(qsv.load_plugins), AV_OPT_TYPE_STRING, { .str = "" }, 0, 0, VD },
|
|
|
|
{ "gpu_copy", "A GPU-accelerated copy between video and system memory", OFFSET(qsv.gpu_copy), AV_OPT_TYPE_INT, { .i64 = MFX_GPUCOPY_DEFAULT }, MFX_GPUCOPY_DEFAULT, MFX_GPUCOPY_OFF, VD, "gpu_copy"},
|
|
{ "default", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_GPUCOPY_DEFAULT }, 0, 0, VD, "gpu_copy"},
|
|
{ "on", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_GPUCOPY_ON }, 0, 0, VD, "gpu_copy"},
|
|
{ "off", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_GPUCOPY_OFF }, 0, 0, VD, "gpu_copy"},
|
|
{ NULL },
|
|
};
|
|
DEFINE_QSV_DECODER_WITH_OPTION(hevc, HEVC, "hevc_mp4toannexb", hevc_options)
|
|
#endif
|
|
|
|
static const AVOption options[] = {
|
|
{ "async_depth", "Internal parallelization depth, the higher the value the higher the latency.", OFFSET(qsv.async_depth), AV_OPT_TYPE_INT, { .i64 = ASYNC_DEPTH_DEFAULT }, 1, INT_MAX, VD },
|
|
|
|
{ "gpu_copy", "A GPU-accelerated copy between video and system memory", OFFSET(qsv.gpu_copy), AV_OPT_TYPE_INT, { .i64 = MFX_GPUCOPY_DEFAULT }, MFX_GPUCOPY_DEFAULT, MFX_GPUCOPY_OFF, VD, "gpu_copy"},
|
|
{ "default", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_GPUCOPY_DEFAULT }, 0, 0, VD, "gpu_copy"},
|
|
{ "on", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_GPUCOPY_ON }, 0, 0, VD, "gpu_copy"},
|
|
{ "off", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_GPUCOPY_OFF }, 0, 0, VD, "gpu_copy"},
|
|
{ NULL },
|
|
};
|
|
|
|
#if CONFIG_H264_QSV_DECODER
|
|
DEFINE_QSV_DECODER(h264, H264, "h264_mp4toannexb")
|
|
#endif
|
|
|
|
#if CONFIG_MPEG2_QSV_DECODER
|
|
DEFINE_QSV_DECODER(mpeg2, MPEG2VIDEO, NULL)
|
|
#endif
|
|
|
|
#if CONFIG_VC1_QSV_DECODER
|
|
DEFINE_QSV_DECODER(vc1, VC1, NULL)
|
|
#endif
|
|
|
|
#if CONFIG_MJPEG_QSV_DECODER
|
|
DEFINE_QSV_DECODER(mjpeg, MJPEG, NULL)
|
|
#endif
|
|
|
|
#if CONFIG_VP8_QSV_DECODER
|
|
DEFINE_QSV_DECODER(vp8, VP8, NULL)
|
|
#endif
|
|
|
|
#if CONFIG_VP9_QSV_DECODER
|
|
DEFINE_QSV_DECODER(vp9, VP9, NULL)
|
|
#endif
|
|
|
|
#if CONFIG_AV1_QSV_DECODER
|
|
DEFINE_QSV_DECODER(av1, AV1, NULL)
|
|
#endif
|