ffmpeg/libavcodec/cbs_av1.c

1309 lines
39 KiB
C

/*
* This file is part of FFmpeg.
*
* FFmpeg is free software; you can redistribute it and/or
* modify it under the terms of the GNU Lesser General Public
* License as published by the Free Software Foundation; either
* version 2.1 of the License, or (at your option) any later version.
*
* FFmpeg is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
* Lesser General Public License for more details.
*
* You should have received a copy of the GNU Lesser General Public
* License along with FFmpeg; if not, write to the Free Software
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
*/
#include "libavutil/avassert.h"
#include "libavutil/opt.h"
#include "libavutil/pixfmt.h"
#include "cbs.h"
#include "cbs_internal.h"
#include "cbs_av1.h"
#include "defs.h"
#include "refstruct.h"
static int cbs_av1_read_uvlc(CodedBitstreamContext *ctx, GetBitContext *gbc,
const char *name, uint32_t *write_to,
uint32_t range_min, uint32_t range_max)
{
uint32_t zeroes, bits_value, value;
CBS_TRACE_READ_START();
zeroes = 0;
while (zeroes < 32) {
if (get_bits_left(gbc) < 1) {
av_log(ctx->log_ctx, AV_LOG_ERROR, "Invalid uvlc code at "
"%s: bitstream ended.\n", name);
return AVERROR_INVALIDDATA;
}
if (get_bits1(gbc))
break;
++zeroes;
}
if (zeroes >= 32) {
// The spec allows at least thirty-two zero bits followed by a
// one to mean 2^32-1, with no constraint on the number of
// zeroes. The libaom reference decoder does not match this,
// instead reading thirty-two zeroes but not the following one
// to mean 2^32-1. These two interpretations are incompatible
// and other implementations may follow one or the other.
// Therefore we reject thirty-two zeroes because the intended
// behaviour is not clear.
av_log(ctx->log_ctx, AV_LOG_ERROR, "Thirty-two zero bits in "
"%s uvlc code: considered invalid due to conflicting "
"standard and reference decoder behaviour.\n", name);
return AVERROR_INVALIDDATA;
} else {
if (get_bits_left(gbc) < zeroes) {
av_log(ctx->log_ctx, AV_LOG_ERROR, "Invalid uvlc code at "
"%s: bitstream ended.\n", name);
return AVERROR_INVALIDDATA;
}
bits_value = get_bits_long(gbc, zeroes);
value = bits_value + (UINT32_C(1) << zeroes) - 1;
}
CBS_TRACE_READ_END_NO_SUBSCRIPTS();
if (value < range_min || value > range_max) {
av_log(ctx->log_ctx, AV_LOG_ERROR, "%s out of range: "
"%"PRIu32", but must be in [%"PRIu32",%"PRIu32"].\n",
name, value, range_min, range_max);
return AVERROR_INVALIDDATA;
}
*write_to = value;
return 0;
}
static int cbs_av1_write_uvlc(CodedBitstreamContext *ctx, PutBitContext *pbc,
const char *name, uint32_t value,
uint32_t range_min, uint32_t range_max)
{
uint32_t v;
int zeroes;
CBS_TRACE_WRITE_START();
if (value < range_min || value > range_max) {
av_log(ctx->log_ctx, AV_LOG_ERROR, "%s out of range: "
"%"PRIu32", but must be in [%"PRIu32",%"PRIu32"].\n",
name, value, range_min, range_max);
return AVERROR_INVALIDDATA;
}
zeroes = av_log2(value + 1);
v = value - (1U << zeroes) + 1;
if (put_bits_left(pbc) < 2 * zeroes + 1)
return AVERROR(ENOSPC);
put_bits(pbc, zeroes, 0);
put_bits(pbc, 1, 1);
put_bits(pbc, zeroes, v);
CBS_TRACE_WRITE_END_NO_SUBSCRIPTS();
return 0;
}
static int cbs_av1_read_leb128(CodedBitstreamContext *ctx, GetBitContext *gbc,
const char *name, uint64_t *write_to)
{
uint64_t value;
uint32_t byte;
int i;
CBS_TRACE_READ_START();
value = 0;
for (i = 0; i < 8; i++) {
if (get_bits_left(gbc) < 8) {
av_log(ctx->log_ctx, AV_LOG_ERROR, "Invalid leb128 at "
"%s: bitstream ended.\n", name);
return AVERROR_INVALIDDATA;
}
byte = get_bits(gbc, 8);
value |= (uint64_t)(byte & 0x7f) << (i * 7);
if (!(byte & 0x80))
break;
}
if (value > UINT32_MAX)
return AVERROR_INVALIDDATA;
CBS_TRACE_READ_END_NO_SUBSCRIPTS();
*write_to = value;
return 0;
}
static int cbs_av1_write_leb128(CodedBitstreamContext *ctx, PutBitContext *pbc,
const char *name, uint64_t value, int fixed_length)
{
int len, i;
uint8_t byte;
CBS_TRACE_WRITE_START();
len = (av_log2(value) + 7) / 7;
if (fixed_length) {
if (fixed_length < len) {
av_log(ctx->log_ctx, AV_LOG_ERROR, "OBU is too large for "
"fixed length size field (%d > %d).\n",
len, fixed_length);
return AVERROR(EINVAL);
}
len = fixed_length;
}
for (i = 0; i < len; i++) {
if (put_bits_left(pbc) < 8)
return AVERROR(ENOSPC);
byte = value >> (7 * i) & 0x7f;
if (i < len - 1)
byte |= 0x80;
put_bits(pbc, 8, byte);
}
CBS_TRACE_WRITE_END_NO_SUBSCRIPTS();
return 0;
}
static int cbs_av1_read_ns(CodedBitstreamContext *ctx, GetBitContext *gbc,
uint32_t n, const char *name,
const int *subscripts, uint32_t *write_to)
{
uint32_t m, v, extra_bit, value;
int w;
CBS_TRACE_READ_START();
av_assert0(n > 0);
w = av_log2(n) + 1;
m = (1 << w) - n;
if (get_bits_left(gbc) < w) {
av_log(ctx->log_ctx, AV_LOG_ERROR, "Invalid non-symmetric value at "
"%s: bitstream ended.\n", name);
return AVERROR_INVALIDDATA;
}
if (w - 1 > 0)
v = get_bits(gbc, w - 1);
else
v = 0;
if (v < m) {
value = v;
} else {
extra_bit = get_bits1(gbc);
value = (v << 1) - m + extra_bit;
}
CBS_TRACE_READ_END();
*write_to = value;
return 0;
}
static int cbs_av1_write_ns(CodedBitstreamContext *ctx, PutBitContext *pbc,
uint32_t n, const char *name,
const int *subscripts, uint32_t value)
{
uint32_t w, m, v, extra_bit;
CBS_TRACE_WRITE_START();
if (value > n) {
av_log(ctx->log_ctx, AV_LOG_ERROR, "%s out of range: "
"%"PRIu32", but must be in [0,%"PRIu32"].\n",
name, value, n);
return AVERROR_INVALIDDATA;
}
w = av_log2(n) + 1;
m = (1 << w) - n;
if (put_bits_left(pbc) < w)
return AVERROR(ENOSPC);
if (value < m) {
v = value;
put_bits(pbc, w - 1, v);
} else {
v = m + ((value - m) >> 1);
extra_bit = (value - m) & 1;
put_bits(pbc, w - 1, v);
put_bits(pbc, 1, extra_bit);
}
CBS_TRACE_WRITE_END();
return 0;
}
static int cbs_av1_read_increment(CodedBitstreamContext *ctx, GetBitContext *gbc,
uint32_t range_min, uint32_t range_max,
const char *name, uint32_t *write_to)
{
uint32_t value;
CBS_TRACE_READ_START();
av_assert0(range_min <= range_max && range_max - range_min < 32);
for (value = range_min; value < range_max;) {
if (get_bits_left(gbc) < 1) {
av_log(ctx->log_ctx, AV_LOG_ERROR, "Invalid increment value at "
"%s: bitstream ended.\n", name);
return AVERROR_INVALIDDATA;
}
if (get_bits1(gbc))
++value;
else
break;
}
CBS_TRACE_READ_END_NO_SUBSCRIPTS();
*write_to = value;
return 0;
}
static int cbs_av1_write_increment(CodedBitstreamContext *ctx, PutBitContext *pbc,
uint32_t range_min, uint32_t range_max,
const char *name, uint32_t value)
{
int len;
CBS_TRACE_WRITE_START();
av_assert0(range_min <= range_max && range_max - range_min < 32);
if (value < range_min || value > range_max) {
av_log(ctx->log_ctx, AV_LOG_ERROR, "%s out of range: "
"%"PRIu32", but must be in [%"PRIu32",%"PRIu32"].\n",
name, value, range_min, range_max);
return AVERROR_INVALIDDATA;
}
if (value == range_max)
len = range_max - range_min;
else
len = value - range_min + 1;
if (put_bits_left(pbc) < len)
return AVERROR(ENOSPC);
if (len > 0)
put_bits(pbc, len, (1U << len) - 1 - (value != range_max));
CBS_TRACE_WRITE_END_NO_SUBSCRIPTS();
return 0;
}
static int cbs_av1_read_subexp(CodedBitstreamContext *ctx, GetBitContext *gbc,
uint32_t range_max, const char *name,
const int *subscripts, uint32_t *write_to)
{
uint32_t value, max_len, len, range_offset, range_bits;
int err;
CBS_TRACE_READ_START();
av_assert0(range_max > 0);
max_len = av_log2(range_max - 1) - 3;
err = cbs_av1_read_increment(ctx, gbc, 0, max_len,
"subexp_more_bits", &len);
if (err < 0)
return err;
if (len) {
range_bits = 2 + len;
range_offset = 1 << range_bits;
} else {
range_bits = 3;
range_offset = 0;
}
if (len < max_len) {
err = ff_cbs_read_simple_unsigned(ctx, gbc, range_bits,
"subexp_bits", &value);
if (err < 0)
return err;
} else {
err = cbs_av1_read_ns(ctx, gbc, range_max - range_offset,
"subexp_final_bits", NULL, &value);
if (err < 0)
return err;
}
value += range_offset;
CBS_TRACE_READ_END_VALUE_ONLY();
*write_to = value;
return err;
}
static int cbs_av1_write_subexp(CodedBitstreamContext *ctx, PutBitContext *pbc,
uint32_t range_max, const char *name,
const int *subscripts, uint32_t value)
{
int err;
uint32_t max_len, len, range_offset, range_bits;
CBS_TRACE_WRITE_START();
if (value > range_max) {
av_log(ctx->log_ctx, AV_LOG_ERROR, "%s out of range: "
"%"PRIu32", but must be in [0,%"PRIu32"].\n",
name, value, range_max);
return AVERROR_INVALIDDATA;
}
av_assert0(range_max > 0);
max_len = av_log2(range_max - 1) - 3;
if (value < 8) {
range_bits = 3;
range_offset = 0;
len = 0;
} else {
range_bits = av_log2(value);
len = range_bits - 2;
if (len > max_len) {
// The top bin is combined with the one below it.
av_assert0(len == max_len + 1);
--range_bits;
len = max_len;
}
range_offset = 1 << range_bits;
}
err = cbs_av1_write_increment(ctx, pbc, 0, max_len,
"subexp_more_bits", len);
if (err < 0)
return err;
if (len < max_len) {
err = ff_cbs_write_simple_unsigned(ctx, pbc, range_bits,
"subexp_bits",
value - range_offset);
if (err < 0)
return err;
} else {
err = cbs_av1_write_ns(ctx, pbc, range_max - range_offset,
"subexp_final_bits", NULL,
value - range_offset);
if (err < 0)
return err;
}
CBS_TRACE_WRITE_END_VALUE_ONLY();
return err;
}
static int cbs_av1_tile_log2(int blksize, int target)
{
int k;
for (k = 0; (blksize << k) < target; k++);
return k;
}
static int cbs_av1_get_relative_dist(const AV1RawSequenceHeader *seq,
unsigned int a, unsigned int b)
{
unsigned int diff, m;
if (!seq->enable_order_hint)
return 0;
diff = a - b;
m = 1 << seq->order_hint_bits_minus_1;
diff = (diff & (m - 1)) - (diff & m);
return diff;
}
static size_t cbs_av1_get_payload_bytes_left(GetBitContext *gbc)
{
GetBitContext tmp = *gbc;
size_t size = 0;
for (int i = 0; get_bits_left(&tmp) >= 8; i++) {
if (get_bits(&tmp, 8))
size = i;
}
return size;
}
#define HEADER(name) do { \
ff_cbs_trace_header(ctx, name); \
} while (0)
#define CHECK(call) do { \
err = (call); \
if (err < 0) \
return err; \
} while (0)
#define FUNC_NAME(rw, codec, name) cbs_ ## codec ## _ ## rw ## _ ## name
#define FUNC_AV1(rw, name) FUNC_NAME(rw, av1, name)
#define FUNC(name) FUNC_AV1(READWRITE, name)
#define SUBSCRIPTS(subs, ...) (subs > 0 ? ((int[subs + 1]){ subs, __VA_ARGS__ }) : NULL)
#define fc(width, name, range_min, range_max) \
xf(width, name, current->name, range_min, range_max, 0, )
#define flag(name) fb(1, name)
#define su(width, name) \
xsu(width, name, current->name, 0, )
#define fbs(width, name, subs, ...) \
xf(width, name, current->name, 0, MAX_UINT_BITS(width), subs, __VA_ARGS__)
#define fcs(width, name, range_min, range_max, subs, ...) \
xf(width, name, current->name, range_min, range_max, subs, __VA_ARGS__)
#define flags(name, subs, ...) \
xf(1, name, current->name, 0, 1, subs, __VA_ARGS__)
#define sus(width, name, subs, ...) \
xsu(width, name, current->name, subs, __VA_ARGS__)
#define fixed(width, name, value) do { \
av_unused uint32_t fixed_value = value; \
xf(width, name, fixed_value, value, value, 0, ); \
} while (0)
#define READ
#define READWRITE read
#define RWContext GetBitContext
#define fb(width, name) do { \
uint32_t value; \
CHECK(ff_cbs_read_simple_unsigned(ctx, rw, width, \
#name, &value)); \
current->name = value; \
} while (0)
#define xf(width, name, var, range_min, range_max, subs, ...) do { \
uint32_t value; \
CHECK(ff_cbs_read_unsigned(ctx, rw, width, #name, \
SUBSCRIPTS(subs, __VA_ARGS__), \
&value, range_min, range_max)); \
var = value; \
} while (0)
#define xsu(width, name, var, subs, ...) do { \
int32_t value; \
CHECK(ff_cbs_read_signed(ctx, rw, width, #name, \
SUBSCRIPTS(subs, __VA_ARGS__), &value, \
MIN_INT_BITS(width), \
MAX_INT_BITS(width))); \
var = value; \
} while (0)
#define uvlc(name, range_min, range_max) do { \
uint32_t value; \
CHECK(cbs_av1_read_uvlc(ctx, rw, #name, \
&value, range_min, range_max)); \
current->name = value; \
} while (0)
#define ns(max_value, name, subs, ...) do { \
uint32_t value; \
CHECK(cbs_av1_read_ns(ctx, rw, max_value, #name, \
SUBSCRIPTS(subs, __VA_ARGS__), &value)); \
current->name = value; \
} while (0)
#define increment(name, min, max) do { \
uint32_t value; \
CHECK(cbs_av1_read_increment(ctx, rw, min, max, #name, &value)); \
current->name = value; \
} while (0)
#define subexp(name, max, subs, ...) do { \
uint32_t value; \
CHECK(cbs_av1_read_subexp(ctx, rw, max, #name, \
SUBSCRIPTS(subs, __VA_ARGS__), &value)); \
current->name = value; \
} while (0)
#define delta_q(name) do { \
uint8_t delta_coded; \
int8_t delta_q; \
xf(1, name.delta_coded, delta_coded, 0, 1, 0, ); \
if (delta_coded) \
xsu(1 + 6, name.delta_q, delta_q, 0, ); \
else \
delta_q = 0; \
current->name = delta_q; \
} while (0)
#define leb128(name) do { \
uint64_t value; \
CHECK(cbs_av1_read_leb128(ctx, rw, #name, &value)); \
current->name = value; \
} while (0)
#define infer(name, value) do { \
current->name = value; \
} while (0)
#define byte_alignment(rw) (get_bits_count(rw) % 8)
#include "cbs_av1_syntax_template.c"
#undef READ
#undef READWRITE
#undef RWContext
#undef fb
#undef xf
#undef xsu
#undef uvlc
#undef ns
#undef increment
#undef subexp
#undef delta_q
#undef leb128
#undef infer
#undef byte_alignment
#define WRITE
#define READWRITE write
#define RWContext PutBitContext
#define fb(width, name) do { \
CHECK(ff_cbs_write_simple_unsigned(ctx, rw, width, #name, \
current->name)); \
} while (0)
#define xf(width, name, var, range_min, range_max, subs, ...) do { \
CHECK(ff_cbs_write_unsigned(ctx, rw, width, #name, \
SUBSCRIPTS(subs, __VA_ARGS__), \
var, range_min, range_max)); \
} while (0)
#define xsu(width, name, var, subs, ...) do { \
CHECK(ff_cbs_write_signed(ctx, rw, width, #name, \
SUBSCRIPTS(subs, __VA_ARGS__), var, \
MIN_INT_BITS(width), \
MAX_INT_BITS(width))); \
} while (0)
#define uvlc(name, range_min, range_max) do { \
CHECK(cbs_av1_write_uvlc(ctx, rw, #name, current->name, \
range_min, range_max)); \
} while (0)
#define ns(max_value, name, subs, ...) do { \
CHECK(cbs_av1_write_ns(ctx, rw, max_value, #name, \
SUBSCRIPTS(subs, __VA_ARGS__), \
current->name)); \
} while (0)
#define increment(name, min, max) do { \
CHECK(cbs_av1_write_increment(ctx, rw, min, max, #name, \
current->name)); \
} while (0)
#define subexp(name, max, subs, ...) do { \
CHECK(cbs_av1_write_subexp(ctx, rw, max, #name, \
SUBSCRIPTS(subs, __VA_ARGS__), \
current->name)); \
} while (0)
#define delta_q(name) do { \
xf(1, name.delta_coded, current->name != 0, 0, 1, 0, ); \
if (current->name) \
xsu(1 + 6, name.delta_q, current->name, 0, ); \
} while (0)
#define leb128(name) do { \
CHECK(cbs_av1_write_leb128(ctx, rw, #name, current->name, 0)); \
} while (0)
#define infer(name, value) do { \
if (current->name != (value)) { \
av_log(ctx->log_ctx, AV_LOG_ERROR, \
"%s does not match inferred value: " \
"%"PRId64", but should be %"PRId64".\n", \
#name, (int64_t)current->name, (int64_t)(value)); \
return AVERROR_INVALIDDATA; \
} \
} while (0)
#define byte_alignment(rw) (put_bits_count(rw) % 8)
#include "cbs_av1_syntax_template.c"
#undef WRITE
#undef READWRITE
#undef RWContext
#undef fb
#undef xf
#undef xsu
#undef uvlc
#undef ns
#undef increment
#undef subexp
#undef delta_q
#undef leb128
#undef infer
#undef byte_alignment
static int cbs_av1_split_fragment(CodedBitstreamContext *ctx,
CodedBitstreamFragment *frag,
int header)
{
GetBitContext gbc;
uint8_t *data;
size_t size;
uint64_t obu_length;
int pos, err, trace;
// Don't include this parsing in trace output.
trace = ctx->trace_enable;
ctx->trace_enable = 0;
data = frag->data;
size = frag->data_size;
if (INT_MAX / 8 < size) {
av_log(ctx->log_ctx, AV_LOG_ERROR, "Invalid fragment: "
"too large (%"SIZE_SPECIFIER" bytes).\n", size);
err = AVERROR_INVALIDDATA;
goto fail;
}
if (header && size && data[0] & 0x80) {
// first bit is nonzero, the extradata does not consist purely of
// OBUs. Expect MP4/Matroska AV1CodecConfigurationRecord
int config_record_version = data[0] & 0x7f;
if (config_record_version != 1) {
av_log(ctx->log_ctx, AV_LOG_ERROR,
"Unknown version %d of AV1CodecConfigurationRecord "
"found!\n",
config_record_version);
err = AVERROR_INVALIDDATA;
goto fail;
}
if (size <= 4) {
if (size < 4) {
av_log(ctx->log_ctx, AV_LOG_WARNING,
"Undersized AV1CodecConfigurationRecord v%d found!\n",
config_record_version);
err = AVERROR_INVALIDDATA;
goto fail;
}
goto success;
}
// In AV1CodecConfigurationRecord v1, actual OBUs start after
// four bytes. Thus set the offset as required for properly
// parsing them.
data += 4;
size -= 4;
}
while (size > 0) {
AV1RawOBUHeader header;
uint64_t obu_size;
init_get_bits(&gbc, data, 8 * size);
err = cbs_av1_read_obu_header(ctx, &gbc, &header);
if (err < 0)
goto fail;
if (header.obu_has_size_field) {
if (get_bits_left(&gbc) < 8) {
av_log(ctx->log_ctx, AV_LOG_ERROR, "Invalid OBU: fragment "
"too short (%"SIZE_SPECIFIER" bytes).\n", size);
err = AVERROR_INVALIDDATA;
goto fail;
}
err = cbs_av1_read_leb128(ctx, &gbc, "obu_size", &obu_size);
if (err < 0)
goto fail;
} else
obu_size = size - 1 - header.obu_extension_flag;
pos = get_bits_count(&gbc);
av_assert0(pos % 8 == 0 && pos / 8 <= size);
obu_length = pos / 8 + obu_size;
if (size < obu_length) {
av_log(ctx->log_ctx, AV_LOG_ERROR, "Invalid OBU length: "
"%"PRIu64", but only %"SIZE_SPECIFIER" bytes remaining in fragment.\n",
obu_length, size);
err = AVERROR_INVALIDDATA;
goto fail;
}
err = ff_cbs_append_unit_data(frag, header.obu_type,
data, obu_length, frag->data_ref);
if (err < 0)
goto fail;
data += obu_length;
size -= obu_length;
}
success:
err = 0;
fail:
ctx->trace_enable = trace;
return err;
}
static int cbs_av1_ref_tile_data(CodedBitstreamContext *ctx,
CodedBitstreamUnit *unit,
GetBitContext *gbc,
AV1RawTileData *td)
{
int pos;
pos = get_bits_count(gbc);
if (pos >= 8 * unit->data_size) {
av_log(ctx->log_ctx, AV_LOG_ERROR, "Bitstream ended before "
"any data in tile group (%d bits read).\n", pos);
return AVERROR_INVALIDDATA;
}
// Must be byte-aligned at this point.
av_assert0(pos % 8 == 0);
td->data_ref = av_buffer_ref(unit->data_ref);
if (!td->data_ref)
return AVERROR(ENOMEM);
td->data = unit->data + pos / 8;
td->data_size = unit->data_size - pos / 8;
return 0;
}
static int cbs_av1_read_unit(CodedBitstreamContext *ctx,
CodedBitstreamUnit *unit)
{
CodedBitstreamAV1Context *priv = ctx->priv_data;
AV1RawOBU *obu;
GetBitContext gbc;
int err, start_pos, end_pos;
err = ff_cbs_alloc_unit_content(ctx, unit);
if (err < 0)
return err;
obu = unit->content;
err = init_get_bits(&gbc, unit->data, 8 * unit->data_size);
if (err < 0)
return err;
err = cbs_av1_read_obu_header(ctx, &gbc, &obu->header);
if (err < 0)
return err;
av_assert0(obu->header.obu_type == unit->type);
if (obu->header.obu_has_size_field) {
uint64_t obu_size;
err = cbs_av1_read_leb128(ctx, &gbc, "obu_size", &obu_size);
if (err < 0)
return err;
obu->obu_size = obu_size;
} else {
if (unit->data_size < 1 + obu->header.obu_extension_flag) {
av_log(ctx->log_ctx, AV_LOG_ERROR, "Invalid OBU length: "
"unit too short (%"SIZE_SPECIFIER").\n", unit->data_size);
return AVERROR_INVALIDDATA;
}
obu->obu_size = unit->data_size - 1 - obu->header.obu_extension_flag;
}
start_pos = get_bits_count(&gbc);
if (obu->header.obu_extension_flag) {
if (obu->header.obu_type != AV1_OBU_SEQUENCE_HEADER &&
obu->header.obu_type != AV1_OBU_TEMPORAL_DELIMITER &&
priv->operating_point_idc) {
int in_temporal_layer =
(priv->operating_point_idc >> priv->temporal_id ) & 1;
int in_spatial_layer =
(priv->operating_point_idc >> (priv->spatial_id + 8)) & 1;
if (!in_temporal_layer || !in_spatial_layer) {
return AVERROR(EAGAIN); // drop_obu()
}
}
}
switch (obu->header.obu_type) {
case AV1_OBU_SEQUENCE_HEADER:
{
err = cbs_av1_read_sequence_header_obu(ctx, &gbc,
&obu->obu.sequence_header);
if (err < 0)
return err;
if (priv->operating_point >= 0) {
AV1RawSequenceHeader *sequence_header = &obu->obu.sequence_header;
if (priv->operating_point > sequence_header->operating_points_cnt_minus_1) {
av_log(ctx->log_ctx, AV_LOG_ERROR, "Invalid Operating Point %d requested. "
"Must not be higher than %u.\n",
priv->operating_point, sequence_header->operating_points_cnt_minus_1);
return AVERROR(EINVAL);
}
priv->operating_point_idc = sequence_header->operating_point_idc[priv->operating_point];
}
ff_refstruct_replace(&priv->sequence_header_ref, unit->content_ref);
priv->sequence_header = &obu->obu.sequence_header;
}
break;
case AV1_OBU_TEMPORAL_DELIMITER:
{
err = cbs_av1_read_temporal_delimiter_obu(ctx, &gbc);
if (err < 0)
return err;
}
break;
case AV1_OBU_FRAME_HEADER:
case AV1_OBU_REDUNDANT_FRAME_HEADER:
{
err = cbs_av1_read_frame_header_obu(ctx, &gbc,
&obu->obu.frame_header,
obu->header.obu_type ==
AV1_OBU_REDUNDANT_FRAME_HEADER,
unit->data_ref);
if (err < 0)
return err;
}
break;
case AV1_OBU_TILE_GROUP:
{
err = cbs_av1_read_tile_group_obu(ctx, &gbc,
&obu->obu.tile_group);
if (err < 0)
return err;
err = cbs_av1_ref_tile_data(ctx, unit, &gbc,
&obu->obu.tile_group.tile_data);
if (err < 0)
return err;
}
break;
case AV1_OBU_FRAME:
{
err = cbs_av1_read_frame_obu(ctx, &gbc, &obu->obu.frame,
unit->data_ref);
if (err < 0)
return err;
err = cbs_av1_ref_tile_data(ctx, unit, &gbc,
&obu->obu.frame.tile_group.tile_data);
if (err < 0)
return err;
}
break;
case AV1_OBU_TILE_LIST:
{
err = cbs_av1_read_tile_list_obu(ctx, &gbc,
&obu->obu.tile_list);
if (err < 0)
return err;
err = cbs_av1_ref_tile_data(ctx, unit, &gbc,
&obu->obu.tile_list.tile_data);
if (err < 0)
return err;
}
break;
case AV1_OBU_METADATA:
{
err = cbs_av1_read_metadata_obu(ctx, &gbc, &obu->obu.metadata);
if (err < 0)
return err;
}
break;
case AV1_OBU_PADDING:
{
err = cbs_av1_read_padding_obu(ctx, &gbc, &obu->obu.padding);
if (err < 0)
return err;
}
break;
default:
return AVERROR(ENOSYS);
}
end_pos = get_bits_count(&gbc);
av_assert0(end_pos <= unit->data_size * 8);
if (obu->obu_size > 0 &&
obu->header.obu_type != AV1_OBU_TILE_GROUP &&
obu->header.obu_type != AV1_OBU_TILE_LIST &&
obu->header.obu_type != AV1_OBU_FRAME) {
int nb_bits = obu->obu_size * 8 + start_pos - end_pos;
if (nb_bits <= 0)
return AVERROR_INVALIDDATA;
err = cbs_av1_read_trailing_bits(ctx, &gbc, nb_bits);
if (err < 0)
return err;
}
return 0;
}
static int cbs_av1_write_obu(CodedBitstreamContext *ctx,
CodedBitstreamUnit *unit,
PutBitContext *pbc)
{
CodedBitstreamAV1Context *priv = ctx->priv_data;
AV1RawOBU *obu = unit->content;
PutBitContext pbc_tmp;
AV1RawTileData *td;
size_t header_size;
int err, start_pos, end_pos, data_pos;
CodedBitstreamAV1Context av1ctx;
// OBUs in the normal bitstream format must contain a size field
// in every OBU (in annex B it is optional, but we don't support
// writing that).
obu->header.obu_has_size_field = 1;
av1ctx = *priv;
if (priv->sequence_header_ref) {
av1ctx.sequence_header_ref = ff_refstruct_ref(priv->sequence_header_ref);
}
if (priv->frame_header_ref) {
av1ctx.frame_header_ref = av_buffer_ref(priv->frame_header_ref);
if (!av1ctx.frame_header_ref) {
err = AVERROR(ENOMEM);
goto error;
}
}
err = cbs_av1_write_obu_header(ctx, pbc, &obu->header);
if (err < 0)
goto error;
if (obu->header.obu_has_size_field) {
pbc_tmp = *pbc;
if (priv->fixed_obu_size_length) {
for (int i = 0; i < priv->fixed_obu_size_length; i++)
put_bits(pbc, 8, 0);
} else {
// Add space for the size field to fill later.
put_bits32(pbc, 0);
put_bits32(pbc, 0);
}
}
td = NULL;
start_pos = put_bits_count(pbc);
switch (obu->header.obu_type) {
case AV1_OBU_SEQUENCE_HEADER:
{
err = cbs_av1_write_sequence_header_obu(ctx, pbc,
&obu->obu.sequence_header);
if (err < 0)
goto error;
ff_refstruct_unref(&priv->sequence_header_ref);
priv->sequence_header = NULL;
err = ff_cbs_make_unit_refcounted(ctx, unit);
if (err < 0)
goto error;
priv->sequence_header_ref = ff_refstruct_ref(unit->content_ref);
priv->sequence_header = &obu->obu.sequence_header;
}
break;
case AV1_OBU_TEMPORAL_DELIMITER:
{
err = cbs_av1_write_temporal_delimiter_obu(ctx, pbc);
if (err < 0)
goto error;
}
break;
case AV1_OBU_FRAME_HEADER:
case AV1_OBU_REDUNDANT_FRAME_HEADER:
{
err = cbs_av1_write_frame_header_obu(ctx, pbc,
&obu->obu.frame_header,
obu->header.obu_type ==
AV1_OBU_REDUNDANT_FRAME_HEADER,
NULL);
if (err < 0)
goto error;
}
break;
case AV1_OBU_TILE_GROUP:
{
err = cbs_av1_write_tile_group_obu(ctx, pbc,
&obu->obu.tile_group);
if (err < 0)
goto error;
td = &obu->obu.tile_group.tile_data;
}
break;
case AV1_OBU_FRAME:
{
err = cbs_av1_write_frame_obu(ctx, pbc, &obu->obu.frame, NULL);
if (err < 0)
goto error;
td = &obu->obu.frame.tile_group.tile_data;
}
break;
case AV1_OBU_TILE_LIST:
{
err = cbs_av1_write_tile_list_obu(ctx, pbc, &obu->obu.tile_list);
if (err < 0)
goto error;
td = &obu->obu.tile_list.tile_data;
}
break;
case AV1_OBU_METADATA:
{
err = cbs_av1_write_metadata_obu(ctx, pbc, &obu->obu.metadata);
if (err < 0)
goto error;
}
break;
case AV1_OBU_PADDING:
{
err = cbs_av1_write_padding_obu(ctx, pbc, &obu->obu.padding);
if (err < 0)
goto error;
}
break;
default:
err = AVERROR(ENOSYS);
goto error;
}
end_pos = put_bits_count(pbc);
header_size = (end_pos - start_pos + 7) / 8;
if (td) {
obu->obu_size = header_size + td->data_size;
} else if (header_size > 0) {
// Add trailing bits and recalculate.
err = cbs_av1_write_trailing_bits(ctx, pbc, 8 - end_pos % 8);
if (err < 0)
goto error;
end_pos = put_bits_count(pbc);
obu->obu_size = header_size = (end_pos - start_pos + 7) / 8;
} else {
// Empty OBU.
obu->obu_size = 0;
}
end_pos = put_bits_count(pbc);
// Must now be byte-aligned.
av_assert0(end_pos % 8 == 0);
flush_put_bits(pbc);
start_pos /= 8;
end_pos /= 8;
*pbc = pbc_tmp;
err = cbs_av1_write_leb128(ctx, pbc, "obu_size", obu->obu_size,
priv->fixed_obu_size_length);
if (err < 0)
goto error;
data_pos = put_bits_count(pbc) / 8;
flush_put_bits(pbc);
av_assert0(data_pos <= start_pos);
if (8 * obu->obu_size > put_bits_left(pbc)) {
ff_refstruct_unref(&priv->sequence_header_ref);
av_buffer_unref(&priv->frame_header_ref);
*priv = av1ctx;
return AVERROR(ENOSPC);
}
if (obu->obu_size > 0) {
if (!priv->fixed_obu_size_length) {
memmove(pbc->buf + data_pos,
pbc->buf + start_pos, header_size);
} else {
// The size was fixed so the following data was
// already written in the correct place.
}
skip_put_bytes(pbc, header_size);
if (td) {
memcpy(pbc->buf + data_pos + header_size,
td->data, td->data_size);
skip_put_bytes(pbc, td->data_size);
}
}
// OBU data must be byte-aligned.
av_assert0(put_bits_count(pbc) % 8 == 0);
err = 0;
error:
ff_refstruct_unref(&av1ctx.sequence_header_ref);
av_buffer_unref(&av1ctx.frame_header_ref);
return err;
}
static int cbs_av1_assemble_fragment(CodedBitstreamContext *ctx,
CodedBitstreamFragment *frag)
{
size_t size, pos;
int i;
size = 0;
for (i = 0; i < frag->nb_units; i++)
size += frag->units[i].data_size;
frag->data_ref = av_buffer_alloc(size + AV_INPUT_BUFFER_PADDING_SIZE);
if (!frag->data_ref)
return AVERROR(ENOMEM);
frag->data = frag->data_ref->data;
memset(frag->data + size, 0, AV_INPUT_BUFFER_PADDING_SIZE);
pos = 0;
for (i = 0; i < frag->nb_units; i++) {
memcpy(frag->data + pos, frag->units[i].data,
frag->units[i].data_size);
pos += frag->units[i].data_size;
}
av_assert0(pos == size);
frag->data_size = size;
return 0;
}
static void cbs_av1_flush(CodedBitstreamContext *ctx)
{
CodedBitstreamAV1Context *priv = ctx->priv_data;
av_buffer_unref(&priv->frame_header_ref);
priv->sequence_header = NULL;
priv->frame_header = NULL;
memset(priv->ref, 0, sizeof(priv->ref));
priv->operating_point_idc = 0;
priv->seen_frame_header = 0;
priv->tile_num = 0;
}
static void cbs_av1_close(CodedBitstreamContext *ctx)
{
CodedBitstreamAV1Context *priv = ctx->priv_data;
ff_refstruct_unref(&priv->sequence_header_ref);
av_buffer_unref(&priv->frame_header_ref);
}
static void cbs_av1_free_metadata(FFRefStructOpaque unused, void *content)
{
AV1RawOBU *obu = content;
AV1RawMetadata *md;
av_assert0(obu->header.obu_type == AV1_OBU_METADATA);
md = &obu->obu.metadata;
switch (md->metadata_type) {
case AV1_METADATA_TYPE_HDR_CLL:
case AV1_METADATA_TYPE_HDR_MDCV:
case AV1_METADATA_TYPE_SCALABILITY:
case AV1_METADATA_TYPE_TIMECODE:
break;
case AV1_METADATA_TYPE_ITUT_T35:
av_buffer_unref(&md->metadata.itut_t35.payload_ref);
break;
default:
av_buffer_unref(&md->metadata.unknown.payload_ref);
}
}
static const CodedBitstreamUnitTypeDescriptor cbs_av1_unit_types[] = {
CBS_UNIT_TYPE_POD(AV1_OBU_SEQUENCE_HEADER, AV1RawOBU),
CBS_UNIT_TYPE_POD(AV1_OBU_TEMPORAL_DELIMITER, AV1RawOBU),
CBS_UNIT_TYPE_POD(AV1_OBU_FRAME_HEADER, AV1RawOBU),
CBS_UNIT_TYPE_POD(AV1_OBU_REDUNDANT_FRAME_HEADER, AV1RawOBU),
CBS_UNIT_TYPE_INTERNAL_REF(AV1_OBU_TILE_GROUP, AV1RawOBU,
obu.tile_group.tile_data.data),
CBS_UNIT_TYPE_INTERNAL_REF(AV1_OBU_FRAME, AV1RawOBU,
obu.frame.tile_group.tile_data.data),
CBS_UNIT_TYPE_INTERNAL_REF(AV1_OBU_TILE_LIST, AV1RawOBU,
obu.tile_list.tile_data.data),
CBS_UNIT_TYPE_INTERNAL_REF(AV1_OBU_PADDING, AV1RawOBU,
obu.padding.payload),
CBS_UNIT_TYPE_COMPLEX(AV1_OBU_METADATA, AV1RawOBU,
&cbs_av1_free_metadata),
CBS_UNIT_TYPE_END_OF_LIST
};
#define OFFSET(x) offsetof(CodedBitstreamAV1Context, x)
static const AVOption cbs_av1_options[] = {
{ "operating_point", "Set operating point to select layers to parse from a scalable bitstream",
OFFSET(operating_point), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, AV1_MAX_OPERATING_POINTS - 1, 0 },
{ "fixed_obu_size_length", "Set fixed length of the obu_size field",
OFFSET(fixed_obu_size_length), AV_OPT_TYPE_INT, { .i64 = 0 }, 0, 8, 0 },
{ NULL }
};
static const AVClass cbs_av1_class = {
.class_name = "cbs_av1",
.item_name = av_default_item_name,
.option = cbs_av1_options,
.version = LIBAVUTIL_VERSION_INT,
};
const CodedBitstreamType ff_cbs_type_av1 = {
.codec_id = AV_CODEC_ID_AV1,
.priv_class = &cbs_av1_class,
.priv_data_size = sizeof(CodedBitstreamAV1Context),
.unit_types = cbs_av1_unit_types,
.split_fragment = &cbs_av1_split_fragment,
.read_unit = &cbs_av1_read_unit,
.write_unit = &cbs_av1_write_obu,
.assemble_fragment = &cbs_av1_assemble_fragment,
.flush = &cbs_av1_flush,
.close = &cbs_av1_close,
};