/* * libkvazaar encoder * * Copyright (c) 2015 Tampere University of Technology * * This file is part of FFmpeg. * * FFmpeg is free software; you can redistribute it and/or * modify it under the terms of the GNU Lesser General Public * License as published by the Free Software Foundation; either * version 2.1 of the License, or (at your option) any later version. * * FFmpeg is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU * Lesser General Public License for more details. * * You should have received a copy of the GNU Lesser General Public * License along with FFmpeg; if not, write to the Free Software * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA */ #include #include #include "libavutil/avassert.h" #include "libavutil/imgutils.h" #include "libavutil/dict.h" #include "libavutil/opt.h" #include "libavutil/pixdesc.h" #include "avcodec.h" #include "internal.h" typedef struct LibkvazaarContext { const AVClass *class; const kvz_api *api; kvz_encoder *encoder; kvz_config *config; char *kvz_params; } LibkvazaarContext; static av_cold int libkvazaar_init(AVCodecContext *avctx) { int retval = 0; kvz_config *cfg = NULL; kvz_encoder *enc = NULL; const kvz_api *const api = kvz_api_get(8); LibkvazaarContext *const ctx = avctx->priv_data; // Kvazaar requires width and height to be multiples of eight. if (avctx->width % 8 || avctx->height % 8) { av_log(avctx, AV_LOG_ERROR, "Video dimensions are not a multiple of 8.\n"); retval = AVERROR_INVALIDDATA; goto done; } cfg = api->config_alloc(); if (!cfg) { av_log(avctx, AV_LOG_ERROR, "Could not allocate kvazaar config structure.\n"); retval = AVERROR(ENOMEM); goto done; } if (!api->config_init(cfg)) { av_log(avctx, AV_LOG_ERROR, "Could not initialize kvazaar config structure.\n"); retval = AVERROR_EXTERNAL; goto done; } cfg->width = avctx->width; cfg->height = avctx->height; cfg->framerate = (double)(avctx->time_base.num * avctx->ticks_per_frame) / avctx->time_base.den; cfg->threads = avctx->thread_count; cfg->target_bitrate = avctx->bit_rate; cfg->vui.sar_width = avctx->sample_aspect_ratio.num; cfg->vui.sar_height = avctx->sample_aspect_ratio.den; if (ctx->kvz_params) { AVDictionary *dict = NULL; if (!av_dict_parse_string(&dict, ctx->kvz_params, "=", ",", 0)) { AVDictionaryEntry *entry = NULL; while ((entry = av_dict_get(dict, "", entry, AV_DICT_IGNORE_SUFFIX))) { if (!api->config_parse(cfg, entry->key, entry->value)) { av_log(avctx, AV_LOG_WARNING, "Invalid option: %s=%s.\n", entry->key, entry->value); } } av_dict_free(&dict); } } enc = api->encoder_open(cfg); if (!enc) { av_log(avctx, AV_LOG_ERROR, "Could not open kvazaar encoder.\n"); retval = AVERROR_EXTERNAL; goto done; } ctx->api = api; ctx->encoder = enc; ctx->config = cfg; enc = NULL; cfg = NULL; done: api->config_destroy(cfg); api->encoder_close(enc); return retval; } static av_cold int libkvazaar_close(AVCodecContext *avctx) { LibkvazaarContext *ctx = avctx->priv_data; if (!ctx->api) return 0; if (ctx->encoder) { ctx->api->encoder_close(ctx->encoder); ctx->encoder = NULL; } if (ctx->config) { ctx->api->config_destroy(ctx->config); ctx->config = NULL; } return 0; } static int libkvazaar_encode(AVCodecContext *avctx, AVPacket *avpkt, const AVFrame *frame, int *got_packet_ptr) { int retval = 0; kvz_picture *img_in = NULL; kvz_data_chunk *data_out = NULL; uint32_t len_out = 0; kvz_picture *recon_pic = NULL; kvz_frame_info frame_info; LibkvazaarContext *ctx = avctx->priv_data; *got_packet_ptr = 0; if (frame) { if (frame->width != ctx->config->width || frame->height != ctx->config->height) { av_log(avctx, AV_LOG_ERROR, "Changing video dimensions during encoding is not supported. " "(changed from %dx%d to %dx%d)\n", ctx->config->width, ctx->config->height, frame->width, frame->height); retval = AVERROR_INVALIDDATA; goto done; } if (frame->format != avctx->pix_fmt) { av_log(avctx, AV_LOG_ERROR, "Changing pixel format during encoding is not supported. " "(changed from %s to %s)\n", av_get_pix_fmt_name(avctx->pix_fmt), av_get_pix_fmt_name(frame->format)); retval = AVERROR_INVALIDDATA; goto done; } // Allocate input picture for kvazaar. img_in = ctx->api->picture_alloc(frame->width, frame->height); if (!img_in) { av_log(avctx, AV_LOG_ERROR, "Failed to allocate picture.\n"); retval = AVERROR(ENOMEM); goto done; } // Copy pixels from frame to img_in. { int dst_linesizes[4] = { frame->width, frame->width / 2, frame->width / 2, 0 }; av_image_copy(img_in->data, dst_linesizes, frame->data, frame->linesize, frame->format, frame->width, frame->height); } img_in->pts = frame->pts; } if (!ctx->api->encoder_encode(ctx->encoder, img_in, &data_out, &len_out, &recon_pic, NULL, &frame_info)) { av_log(avctx, AV_LOG_ERROR, "Failed to encode frame.\n"); retval = AVERROR_EXTERNAL; goto done; } if (data_out) { kvz_data_chunk *chunk = NULL; uint64_t written = 0; retval = ff_alloc_packet(avpkt, len_out); if (retval < 0) { av_log(avctx, AV_LOG_ERROR, "Failed to allocate output packet.\n"); goto done; } for (chunk = data_out; chunk != NULL; chunk = chunk->next) { av_assert0(written + chunk->len <= len_out); memcpy(avpkt->data + written, chunk->data, chunk->len); written += chunk->len; } *got_packet_ptr = 1; ctx->api->chunk_free(data_out); data_out = NULL; avpkt->pts = recon_pic->pts; avpkt->dts = recon_pic->dts; avpkt->flags = 0; // IRAP VCL NAL unit types span the range // [BLA_W_LP (16), RSV_IRAP_VCL23 (23)]. if (frame_info.nal_unit_type >= KVZ_NAL_BLA_W_LP && frame_info.nal_unit_type <= KVZ_NAL_RSV_IRAP_VCL23) { avpkt->flags |= AV_PKT_FLAG_KEY; } } done: ctx->api->picture_free(img_in); ctx->api->picture_free(recon_pic); ctx->api->chunk_free(data_out); return retval; } static const enum AVPixelFormat pix_fmts[] = { AV_PIX_FMT_YUV420P, AV_PIX_FMT_NONE }; static const AVOption options[] = { { "kvazaar-params", "Set kvazaar parameters as a comma-separated list of name=value pairs.", offsetof(LibkvazaarContext, kvz_params), AV_OPT_TYPE_STRING, { .str = NULL }, 0, 0, AV_OPT_FLAG_VIDEO_PARAM | AV_OPT_FLAG_ENCODING_PARAM }, { NULL }, }; static const AVClass class = { .class_name = "libkvazaar", .item_name = av_default_item_name, .option = options, .version = LIBAVUTIL_VERSION_INT, }; static const AVCodecDefault defaults[] = { { "b", "0" }, { NULL }, }; AVCodec ff_libkvazaar_encoder = { .name = "libkvazaar", .long_name = NULL_IF_CONFIG_SMALL("libkvazaar H.265 / HEVC"), .type = AVMEDIA_TYPE_VIDEO, .id = AV_CODEC_ID_HEVC, .capabilities = AV_CODEC_CAP_DELAY, .pix_fmts = pix_fmts, .priv_class = &class, .priv_data_size = sizeof(LibkvazaarContext), .defaults = defaults, .init = libkvazaar_init, .encode2 = libkvazaar_encode, .close = libkvazaar_close, };