mirror of https://git.ffmpeg.org/ffmpeg.git
410 lines
14 KiB
C
410 lines
14 KiB
C
/*
|
|
* ARIB STD-B24 caption decoder using the libaribb24 library
|
|
* Copyright (c) 2019 Jan Ekström
|
|
*
|
|
* This file is part of FFmpeg.
|
|
*
|
|
* FFmpeg is free software; you can redistribute it and/or
|
|
* modify it under the terms of the GNU Lesser General Public
|
|
* License as published by the Free Software Foundation; either
|
|
* version 2.1 of the License, or (at your option) any later version.
|
|
*
|
|
* FFmpeg is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
* Lesser General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU Lesser General Public
|
|
* License along with FFmpeg; if not, write to the Free Software
|
|
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
|
|
*/
|
|
|
|
#include "avcodec.h"
|
|
#include "libavcodec/ass.h"
|
|
#include "codec_internal.h"
|
|
#include "libavutil/log.h"
|
|
#include "libavutil/mem.h"
|
|
#include "libavutil/opt.h"
|
|
|
|
#include <aribb24/aribb24.h>
|
|
#include <aribb24/parser.h>
|
|
#include <aribb24/decoder.h>
|
|
|
|
typedef struct Libaribb24Context {
|
|
AVClass *class;
|
|
|
|
arib_instance_t *lib_instance;
|
|
arib_parser_t *parser;
|
|
arib_decoder_t *decoder;
|
|
|
|
int read_order;
|
|
|
|
char *aribb24_base_path;
|
|
unsigned int aribb24_skip_ruby;
|
|
|
|
int default_profile;
|
|
} Libaribb24Context;
|
|
|
|
static unsigned int get_profile_font_size(AVCodecContext *avctx)
|
|
{
|
|
Libaribb24Context *b24 = avctx->priv_data;
|
|
int profile = avctx->profile;
|
|
|
|
if (profile == AV_PROFILE_UNKNOWN)
|
|
profile = b24->default_profile;
|
|
|
|
switch (profile) {
|
|
case AV_PROFILE_ARIB_PROFILE_A:
|
|
return 36;
|
|
case AV_PROFILE_ARIB_PROFILE_C:
|
|
return 18;
|
|
default:
|
|
return 0;
|
|
}
|
|
}
|
|
|
|
static void libaribb24_log(void *p, const char *msg)
|
|
{
|
|
av_log((AVCodecContext *)p, AV_LOG_INFO, "%s\n", msg);
|
|
}
|
|
|
|
static int libaribb24_generate_ass_header(AVCodecContext *avctx)
|
|
{
|
|
Libaribb24Context *b24 = avctx->priv_data;
|
|
unsigned int plane_width = 0;
|
|
unsigned int plane_height = 0;
|
|
unsigned int font_size = 0;
|
|
int profile = avctx->profile;
|
|
|
|
if (profile == AV_PROFILE_UNKNOWN)
|
|
profile = b24->default_profile;
|
|
|
|
switch (profile) {
|
|
case AV_PROFILE_ARIB_PROFILE_A:
|
|
plane_width = 960;
|
|
plane_height = 540;
|
|
break;
|
|
case AV_PROFILE_ARIB_PROFILE_C:
|
|
plane_width = 320;
|
|
plane_height = 180;
|
|
break;
|
|
default:
|
|
av_log(avctx, AV_LOG_ERROR, "Unknown or unsupported profile set!\n");
|
|
return AVERROR(EINVAL);
|
|
}
|
|
|
|
font_size = get_profile_font_size(avctx);
|
|
|
|
avctx->subtitle_header = av_asprintf(
|
|
"[Script Info]\r\n"
|
|
"; Script generated by FFmpeg/Lavc%s\r\n"
|
|
"ScriptType: v4.00+\r\n"
|
|
"PlayResX: %d\r\n"
|
|
"PlayResY: %d\r\n"
|
|
"\r\n"
|
|
"[V4+ Styles]\r\n"
|
|
|
|
/* ASSv4 header */
|
|
"Format: Name, "
|
|
"Fontname, Fontsize, "
|
|
"PrimaryColour, SecondaryColour, OutlineColour, BackColour, "
|
|
"Bold, Italic, Underline, StrikeOut, "
|
|
"ScaleX, ScaleY, "
|
|
"Spacing, Angle, "
|
|
"BorderStyle, Outline, Shadow, "
|
|
"Alignment, MarginL, MarginR, MarginV, "
|
|
"Encoding\r\n"
|
|
|
|
"Style: "
|
|
"Default," /* Name */
|
|
"%s,%d," /* Font{name,size} */
|
|
"&H%x,&H%x,&H%x,&H%x," /* {Primary,Secondary,Outline,Back}Colour */
|
|
"%d,%d,%d,0," /* Bold, Italic, Underline, StrikeOut */
|
|
"100,100," /* Scale{X,Y} */
|
|
"0,0," /* Spacing, Angle */
|
|
"%d,1,0," /* BorderStyle, Outline, Shadow */
|
|
"%d,10,10,10," /* Alignment, Margin[LRV] */
|
|
"0\r\n" /* Encoding */
|
|
|
|
"\r\n"
|
|
"[Events]\r\n"
|
|
"Format: Layer, Start, End, Style, Name, MarginL, MarginR, MarginV, Effect, Text\r\n",
|
|
!(avctx->flags & AV_CODEC_FLAG_BITEXACT) ? AV_STRINGIFY(LIBAVCODEC_VERSION) : "",
|
|
plane_width, plane_height,
|
|
ASS_DEFAULT_FONT, font_size, ASS_DEFAULT_COLOR,
|
|
ASS_DEFAULT_COLOR, ASS_DEFAULT_BACK_COLOR, ASS_DEFAULT_BACK_COLOR,
|
|
-ASS_DEFAULT_BOLD, -ASS_DEFAULT_ITALIC, -ASS_DEFAULT_UNDERLINE,
|
|
ASS_DEFAULT_BORDERSTYLE, ASS_DEFAULT_ALIGNMENT);
|
|
|
|
if (!avctx->subtitle_header)
|
|
return AVERROR(ENOMEM);
|
|
|
|
avctx->subtitle_header_size = strlen(avctx->subtitle_header);
|
|
|
|
return 0;
|
|
}
|
|
|
|
static int libaribb24_init(AVCodecContext *avctx)
|
|
{
|
|
Libaribb24Context *b24 = avctx->priv_data;
|
|
void(* arib_dec_init)(arib_decoder_t* decoder) = NULL;
|
|
int ret;
|
|
int profile = avctx->profile;
|
|
|
|
if (!(b24->lib_instance = arib_instance_new(avctx))) {
|
|
av_log(avctx, AV_LOG_ERROR, "Failed to initialize libaribb24!\n");
|
|
return AVERROR_EXTERNAL;
|
|
}
|
|
|
|
if (b24->aribb24_base_path) {
|
|
av_log(avctx, AV_LOG_INFO, "Setting the libaribb24 base path to '%s'\n",
|
|
b24->aribb24_base_path);
|
|
arib_set_base_path(b24->lib_instance, b24->aribb24_base_path);
|
|
}
|
|
|
|
arib_register_messages_callback(b24->lib_instance, libaribb24_log);
|
|
|
|
if (!(b24->parser = arib_get_parser(b24->lib_instance))) {
|
|
av_log(avctx, AV_LOG_ERROR, "Failed to initialize libaribb24 PES parser!\n");
|
|
return AVERROR_EXTERNAL;
|
|
}
|
|
if (!(b24->decoder = arib_get_decoder(b24->lib_instance))) {
|
|
av_log(avctx, AV_LOG_ERROR, "Failed to initialize libaribb24 decoder!\n");
|
|
return AVERROR_EXTERNAL;
|
|
}
|
|
|
|
if (profile == AV_PROFILE_UNKNOWN)
|
|
profile = b24->default_profile;
|
|
|
|
switch (profile) {
|
|
case AV_PROFILE_ARIB_PROFILE_A:
|
|
arib_dec_init = arib_initialize_decoder_a_profile;
|
|
break;
|
|
case AV_PROFILE_ARIB_PROFILE_C:
|
|
arib_dec_init = arib_initialize_decoder_c_profile;
|
|
break;
|
|
default:
|
|
av_log(avctx, AV_LOG_ERROR, "Unknown or unsupported profile set!\n");
|
|
return AVERROR(EINVAL);
|
|
}
|
|
|
|
arib_dec_init(b24->decoder);
|
|
|
|
ret = libaribb24_generate_ass_header(avctx);
|
|
if (ret < 0)
|
|
return ret;
|
|
|
|
return 0;
|
|
}
|
|
|
|
static int libaribb24_close(AVCodecContext *avctx)
|
|
{
|
|
Libaribb24Context *b24 = avctx->priv_data;
|
|
|
|
if (b24->decoder)
|
|
arib_finalize_decoder(b24->decoder);
|
|
|
|
if (b24->lib_instance)
|
|
arib_instance_destroy(b24->lib_instance);
|
|
|
|
return 0;
|
|
}
|
|
|
|
#define RGB_TO_BGR(c) (((c) & 0xff) << 16 | ((c) & 0xff00) | (((c) >> 16) & 0xff))
|
|
|
|
static int libaribb24_handle_regions(AVCodecContext *avctx, AVSubtitle *sub)
|
|
{
|
|
Libaribb24Context *b24 = avctx->priv_data;
|
|
const arib_buf_region_t *region = arib_decoder_get_regions(b24->decoder);
|
|
unsigned int profile_font_size = get_profile_font_size(avctx);
|
|
AVBPrint buf;
|
|
int ret = 0;
|
|
|
|
av_bprint_init(&buf, 0, AV_BPRINT_SIZE_UNLIMITED);
|
|
|
|
while (region) {
|
|
ptrdiff_t region_length = region->p_end - region->p_start;
|
|
unsigned int ruby_region =
|
|
region->i_fontheight == (profile_font_size / 2);
|
|
|
|
// ASS requires us to make the colors BGR, so we convert here
|
|
int foreground_bgr_color = RGB_TO_BGR(region->i_foreground_color);
|
|
int background_bgr_color = RGB_TO_BGR(region->i_background_color);
|
|
|
|
if (region_length < 0) {
|
|
av_log(avctx, AV_LOG_ERROR, "Invalid negative region length!\n");
|
|
ret = AVERROR_INVALIDDATA;
|
|
break;
|
|
}
|
|
|
|
if (region_length == 0 || (ruby_region && b24->aribb24_skip_ruby)) {
|
|
goto next_region;
|
|
}
|
|
|
|
// color and alpha
|
|
if (foreground_bgr_color != ASS_DEFAULT_COLOR)
|
|
av_bprintf(&buf, "{\\1c&H%06x&}", foreground_bgr_color);
|
|
|
|
if (region->i_foreground_alpha != 0)
|
|
av_bprintf(&buf, "{\\1a&H%02x&}", region->i_foreground_alpha);
|
|
|
|
if (background_bgr_color != ASS_DEFAULT_BACK_COLOR)
|
|
av_bprintf(&buf, "{\\3c&H%06x&}", background_bgr_color);
|
|
|
|
if (region->i_background_alpha != 0)
|
|
av_bprintf(&buf, "{\\3a&H%02x&}", region->i_background_alpha);
|
|
|
|
// font size
|
|
if (region->i_fontwidth != profile_font_size ||
|
|
region->i_fontheight != profile_font_size) {
|
|
av_bprintf(&buf, "{\\fscx%"PRId64"\\fscy%"PRId64"}",
|
|
av_rescale(region->i_fontwidth, 100,
|
|
profile_font_size),
|
|
av_rescale(region->i_fontheight, 100,
|
|
profile_font_size));
|
|
}
|
|
|
|
// TODO: positioning
|
|
|
|
av_bprint_append_data(&buf, region->p_start, region_length);
|
|
|
|
av_bprintf(&buf, "{\\r}");
|
|
|
|
next_region:
|
|
region = region->p_next;
|
|
}
|
|
|
|
if (!av_bprint_is_complete(&buf))
|
|
ret = AVERROR(ENOMEM);
|
|
|
|
if (ret == 0) {
|
|
av_log(avctx, AV_LOG_DEBUG, "Styled ASS line: %s\n",
|
|
buf.str);
|
|
|
|
sub->format = 1; /* text */
|
|
ret = ff_ass_add_rect(sub, buf.str, b24->read_order++,
|
|
0, NULL, NULL);
|
|
}
|
|
|
|
av_bprint_finalize(&buf, NULL);
|
|
|
|
return ret;
|
|
}
|
|
|
|
static int libaribb24_decode(AVCodecContext *avctx, AVSubtitle *sub,
|
|
int *got_sub_ptr, const AVPacket *pkt)
|
|
{
|
|
Libaribb24Context *b24 = avctx->priv_data;
|
|
size_t parsed_data_size = 0;
|
|
size_t decoded_subtitle_size = 0;
|
|
const unsigned char *parsed_data = NULL;
|
|
char *decoded_subtitle = NULL;
|
|
time_t subtitle_duration = 0;
|
|
int ret = 0;
|
|
|
|
if (pkt->size <= 0)
|
|
return pkt->size;
|
|
|
|
arib_parse_pes(b24->parser, pkt->data, pkt->size);
|
|
|
|
parsed_data = arib_parser_get_data(b24->parser,
|
|
&parsed_data_size);
|
|
if (!parsed_data || !parsed_data_size) {
|
|
av_log(avctx, AV_LOG_DEBUG, "No decode'able data was received from "
|
|
"packet (dts: %"PRId64", pts: %"PRId64").\n",
|
|
pkt->dts, pkt->pts);
|
|
return pkt->size;
|
|
}
|
|
|
|
decoded_subtitle_size = parsed_data_size * 4;
|
|
if (!(decoded_subtitle = av_mallocz(decoded_subtitle_size + 1))) {
|
|
av_log(avctx, AV_LOG_ERROR,
|
|
"Failed to allocate buffer for decoded subtitle!\n");
|
|
return AVERROR(ENOMEM);
|
|
}
|
|
|
|
decoded_subtitle_size = arib_decode_buffer(b24->decoder,
|
|
parsed_data,
|
|
parsed_data_size,
|
|
decoded_subtitle,
|
|
decoded_subtitle_size);
|
|
|
|
subtitle_duration = arib_decoder_get_time(b24->decoder);
|
|
|
|
if (avctx->pkt_timebase.num && pkt->pts != AV_NOPTS_VALUE)
|
|
sub->pts = av_rescale_q(pkt->pts,
|
|
avctx->pkt_timebase, AV_TIME_BASE_Q);
|
|
|
|
sub->end_display_time = subtitle_duration ?
|
|
av_rescale_q(subtitle_duration,
|
|
AV_TIME_BASE_Q,
|
|
(AVRational){1, 1000}) :
|
|
UINT32_MAX;
|
|
|
|
av_log(avctx, AV_LOG_DEBUG,
|
|
"Result: '%s' (size: %zu, pkt_pts: %"PRId64", sub_pts: %"PRId64" "
|
|
"duration: %"PRIu32", pkt_timebase: %d/%d, time_base: %d/%d')\n",
|
|
decoded_subtitle ? decoded_subtitle : "<no subtitle>",
|
|
decoded_subtitle_size,
|
|
pkt->pts, sub->pts,
|
|
sub->end_display_time,
|
|
avctx->pkt_timebase.num, avctx->pkt_timebase.den,
|
|
avctx->time_base.num, avctx->time_base.den);
|
|
|
|
if (decoded_subtitle)
|
|
ret = libaribb24_handle_regions(avctx, sub);
|
|
|
|
*got_sub_ptr = sub->num_rects > 0;
|
|
|
|
av_free(decoded_subtitle);
|
|
|
|
// flush the region buffers, otherwise the linked list keeps getting
|
|
// longer and longer...
|
|
arib_finalize_decoder(b24->decoder);
|
|
|
|
return ret < 0 ? ret : pkt->size;
|
|
}
|
|
|
|
static void libaribb24_flush(AVCodecContext *avctx)
|
|
{
|
|
Libaribb24Context *b24 = avctx->priv_data;
|
|
if (!(avctx->flags2 & AV_CODEC_FLAG2_RO_FLUSH_NOOP))
|
|
b24->read_order = 0;
|
|
}
|
|
|
|
#define OFFSET(x) offsetof(Libaribb24Context, x)
|
|
#define SD AV_OPT_FLAG_SUBTITLE_PARAM | AV_OPT_FLAG_DECODING_PARAM
|
|
static const AVOption options[] = {
|
|
{ "aribb24-base-path", "set the base path for the libaribb24 library",
|
|
OFFSET(aribb24_base_path), AV_OPT_TYPE_STRING, { .str = NULL }, 0, 0, SD },
|
|
{ "aribb24-skip-ruby-text", "skip ruby text blocks during decoding",
|
|
OFFSET(aribb24_skip_ruby), AV_OPT_TYPE_BOOL, { .i64 = 1 }, 0, 1, SD },
|
|
{ "default_profile", "default profile to use if not specified in the stream parameters",
|
|
OFFSET(default_profile), AV_OPT_TYPE_INT, { .i64 = AV_PROFILE_UNKNOWN }, AV_PROFILE_UNKNOWN, AV_PROFILE_ARIB_PROFILE_C, SD, .unit = "profile" },
|
|
{"a", "Profile A", 0, AV_OPT_TYPE_CONST, {.i64 = AV_PROFILE_ARIB_PROFILE_A}, INT_MIN, INT_MAX, SD, .unit = "profile"},
|
|
{"c", "Profile C", 0, AV_OPT_TYPE_CONST, {.i64 = AV_PROFILE_ARIB_PROFILE_C}, INT_MIN, INT_MAX, SD, .unit = "profile"},
|
|
{ NULL }
|
|
};
|
|
|
|
static const AVClass aribb24_class = {
|
|
.class_name = "libaribb24 decoder",
|
|
.item_name = av_default_item_name,
|
|
.option = options,
|
|
.version = LIBAVUTIL_VERSION_INT,
|
|
};
|
|
|
|
const FFCodec ff_libaribb24_decoder = {
|
|
.p.name = "libaribb24",
|
|
CODEC_LONG_NAME("libaribb24 ARIB STD-B24 caption decoder"),
|
|
.p.type = AVMEDIA_TYPE_SUBTITLE,
|
|
.p.id = AV_CODEC_ID_ARIB_CAPTION,
|
|
.p.priv_class = &aribb24_class,
|
|
.p.wrapper_name = "libaribb24",
|
|
.caps_internal = FF_CODEC_CAP_INIT_CLEANUP | FF_CODEC_CAP_NOT_INIT_THREADSAFE,
|
|
.priv_data_size = sizeof(Libaribb24Context),
|
|
.init = libaribb24_init,
|
|
.close = libaribb24_close,
|
|
FF_CODEC_DECODE_SUB_CB(libaribb24_decode),
|
|
.flush = libaribb24_flush,
|
|
};
|