mirror of https://git.ffmpeg.org/ffmpeg.git
492 lines
15 KiB
C
492 lines
15 KiB
C
/*
 * JPEG-LS encoder
 * Copyright (c) 2003 Michael Niedermayer
 * Copyright (c) 2006 Konstantin Shishkov
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */
|
|
|
|
/**
 * @file
 * JPEG-LS encoder.
 */
|
|
|
|
#define UNCHECKED_BITSTREAM_READER 1
|
|
#include "libavutil/opt.h"
|
|
#include "avcodec.h"
|
|
#include "bytestream.h"
|
|
#include "codec_internal.h"
|
|
#include "encode.h"
|
|
#include "get_bits.h"
|
|
#include "put_bits.h"
|
|
#include "put_golomb.h"
|
|
#include "mathops.h"
|
|
#include "mjpeg.h"
|
|
#include "jpegls.h"
|
|
|
|
typedef struct JPEGLSContext {
|
|
AVClass *class;
|
|
|
|
int pred;
|
|
int comps;
|
|
|
|
size_t size;
|
|
uint8_t *buf;
|
|
} JPEGLSContext;
|
|
|
|
/**
 * Write a JPEG marker: a 0xff prefix byte followed by the marker code.
 * Uses the unchecked ("u") bytestream writers.
 */
static inline void put_marker_byteu(PutByteContext *pb, enum JpegMarker code)
{
    const unsigned marker_prefix = 0xff;

    bytestream2_put_byteu(pb, marker_prefix);
    bytestream2_put_byteu(pb, code);
}
|
|
|
|
/**
|
|
* Encode error from regular symbol
|
|
*/
|
|
static inline void ls_encode_regular(JLSState *state, PutBitContext *pb, int Q,
|
|
int err)
|
|
{
|
|
int k;
|
|
int val;
|
|
int map;
|
|
|
|
for (k = 0; (state->N[Q] << k) < state->A[Q]; k++)
|
|
;
|
|
|
|
map = !state->near && !k && (2 * state->B[Q] <= -state->N[Q]);
|
|
|
|
if (err < 0)
|
|
err += state->range;
|
|
if (err >= (state->range + 1 >> 1)) {
|
|
err -= state->range;
|
|
val = 2 * FFABS(err) - 1 - map;
|
|
} else
|
|
val = 2 * err + map;
|
|
|
|
set_ur_golomb_jpegls(pb, val, k, state->limit, state->qbpp);
|
|
|
|
ff_jpegls_update_state_regular(state, Q, err);
|
|
}
|
|
|
|
/**
|
|
* Encode error from run termination
|
|
*/
|
|
static inline void ls_encode_runterm(JLSState *state, PutBitContext *pb,
|
|
int RItype, int err, int limit_add)
|
|
{
|
|
int k;
|
|
int val, map;
|
|
int Q = 365 + RItype;
|
|
int temp;
|
|
|
|
temp = state->A[Q];
|
|
if (RItype)
|
|
temp += state->N[Q] >> 1;
|
|
for (k = 0; (state->N[Q] << k) < temp; k++)
|
|
;
|
|
map = 0;
|
|
if (!k && err && (2 * state->B[Q] < state->N[Q]))
|
|
map = 1;
|
|
|
|
if (err < 0)
|
|
val = -(2 * err) - 1 - RItype + map;
|
|
else
|
|
val = 2 * err - RItype - map;
|
|
set_ur_golomb_jpegls(pb, val, k, state->limit - limit_add - 1, state->qbpp);
|
|
|
|
if (err < 0)
|
|
state->B[Q]++;
|
|
state->A[Q] += (val + 1 - RItype) >> 1;
|
|
|
|
ff_jpegls_downscale_state(state, Q);
|
|
}
|
|
|
|
/**
|
|
* Encode run value as specified by JPEG-LS standard
|
|
*/
|
|
static inline void ls_encode_run(JLSState *state, PutBitContext *pb, int run,
|
|
int comp, int trail)
|
|
{
|
|
while (run >= (1 << ff_log2_run[state->run_index[comp]])) {
|
|
put_bits(pb, 1, 1);
|
|
run -= 1 << ff_log2_run[state->run_index[comp]];
|
|
if (state->run_index[comp] < 31)
|
|
state->run_index[comp]++;
|
|
}
|
|
/* if hit EOL, encode another full run, else encode aborted run */
|
|
if (!trail && run) {
|
|
put_bits(pb, 1, 1);
|
|
} else if (trail) {
|
|
put_bits(pb, 1, 0);
|
|
if (ff_log2_run[state->run_index[comp]])
|
|
put_bits(pb, ff_log2_run[state->run_index[comp]], run);
|
|
}
|
|
}
|
|
|
|
/**
|
|
* Encode one line of image
|
|
*/
|
|
static inline void ls_encode_line(JLSState *state, PutBitContext *pb,
|
|
void *tmp, const void *in, int last2, int w,
|
|
int stride, int comp, int bits)
|
|
{
|
|
int x = 0;
|
|
int Ra = R(tmp, 0), Rb, Rc = last2, Rd;
|
|
int D0, D1, D2;
|
|
|
|
while (x < w) {
|
|
int err, pred, sign;
|
|
|
|
/* compute gradients */
|
|
Rb = R(tmp, x);
|
|
Rd = (x >= w - stride) ? R(tmp, x) : R(tmp, x + stride);
|
|
D0 = Rd - Rb;
|
|
D1 = Rb - Rc;
|
|
D2 = Rc - Ra;
|
|
|
|
/* run mode */
|
|
if ((FFABS(D0) <= state->near) &&
|
|
(FFABS(D1) <= state->near) &&
|
|
(FFABS(D2) <= state->near)) {
|
|
int RUNval, RItype, run;
|
|
|
|
run = 0;
|
|
RUNval = Ra;
|
|
while (x < w && (FFABS(R(in, x) - RUNval) <= state->near)) {
|
|
run++;
|
|
W(tmp, x, Ra);
|
|
x += stride;
|
|
}
|
|
ls_encode_run(state, pb, run, comp, x < w);
|
|
if (x >= w)
|
|
return;
|
|
Rb = R(tmp, x);
|
|
RItype = FFABS(Ra - Rb) <= state->near;
|
|
pred = RItype ? Ra : Rb;
|
|
err = R(in, x) - pred;
|
|
|
|
if (!RItype && Ra > Rb)
|
|
err = -err;
|
|
|
|
if (state->near) {
|
|
if (err > 0)
|
|
err = (state->near + err) / state->twonear;
|
|
else
|
|
err = -(state->near - err) / state->twonear;
|
|
|
|
if (RItype || (Rb >= Ra))
|
|
Ra = av_clip(pred + err * state->twonear, 0, state->maxval);
|
|
else
|
|
Ra = av_clip(pred - err * state->twonear, 0, state->maxval);
|
|
} else
|
|
Ra = R(in, x);
|
|
W(tmp, x, Ra);
|
|
|
|
if (err < 0)
|
|
err += state->range;
|
|
if (err >= state->range + 1 >> 1)
|
|
err -= state->range;
|
|
|
|
ls_encode_runterm(state, pb, RItype, err,
|
|
ff_log2_run[state->run_index[comp]]);
|
|
|
|
if (state->run_index[comp] > 0)
|
|
state->run_index[comp]--;
|
|
} else { /* regular mode */
|
|
int context;
|
|
|
|
context = ff_jpegls_quantize(state, D0) * 81 +
|
|
ff_jpegls_quantize(state, D1) * 9 +
|
|
ff_jpegls_quantize(state, D2);
|
|
pred = mid_pred(Ra, Ra + Rb - Rc, Rb);
|
|
|
|
if (context < 0) {
|
|
context = -context;
|
|
sign = 1;
|
|
pred = av_clip(pred - state->C[context], 0, state->maxval);
|
|
err = pred - R(in, x);
|
|
} else {
|
|
sign = 0;
|
|
pred = av_clip(pred + state->C[context], 0, state->maxval);
|
|
err = R(in, x) - pred;
|
|
}
|
|
|
|
if (state->near) {
|
|
if (err > 0)
|
|
err = (state->near + err) / state->twonear;
|
|
else
|
|
err = -(state->near - err) / state->twonear;
|
|
if (!sign)
|
|
Ra = av_clip(pred + err * state->twonear, 0, state->maxval);
|
|
else
|
|
Ra = av_clip(pred - err * state->twonear, 0, state->maxval);
|
|
} else
|
|
Ra = R(in, x);
|
|
W(tmp, x, Ra);
|
|
|
|
ls_encode_regular(state, pb, context, err);
|
|
}
|
|
Rc = Rb;
|
|
x += stride;
|
|
}
|
|
}
|
|
|
|
/**
 * Write an LSE (type 1) segment carrying maxval, T1, T2, T3 and reset,
 * unless T1/T2/T3/reset all match what
 * ff_jpegls_reset_coding_parameters(..., 1) yields for the same bpp and
 * near values, in which case nothing is written.
 *
 * @param state coder state whose parameters are stored
 * @param pb    byte writer; written with the unchecked ("u") functions
 */
static void ls_store_lse(JLSState *state, PutByteContext *pb)
{
    JLSState defaults = { .bpp = state->bpp, .near = state->near };
    int uses_defaults;

    /* Test if we have default params and don't need to store LSE */
    ff_jpegls_reset_coding_parameters(&defaults, 1);
    uses_defaults = state->T1    == defaults.T1 &&
                    state->T2    == defaults.T2 &&
                    state->T3    == defaults.T3 &&
                    state->reset == defaults.reset;
    if (uses_defaults)
        return;

    /* store LSE type 1 */
    put_marker_byteu(pb, LSE);
    bytestream2_put_be16u(pb, 13);           /* segment length */
    bytestream2_put_byteu(pb, 1);            /* LSE type */
    bytestream2_put_be16u(pb, state->maxval);
    bytestream2_put_be16u(pb, state->T1);
    bytestream2_put_be16u(pb, state->T2);
    bytestream2_put_be16u(pb, state->T3);
    bytestream2_put_be16u(pb, state->reset);
}
|
|
|
|
static int encode_picture_ls(AVCodecContext *avctx, AVPacket *pkt,
|
|
const AVFrame *pict, int *got_packet)
|
|
{
|
|
JPEGLSContext *ctx = avctx->priv_data;
|
|
const AVFrame *const p = pict;
|
|
PutByteContext pb;
|
|
PutBitContext pb2;
|
|
GetBitContext gb;
|
|
const uint8_t *in;
|
|
uint8_t *last = NULL;
|
|
JLSState state = { 0 };
|
|
size_t size;
|
|
int i, ret, size_in_bits;
|
|
int comps;
|
|
|
|
last = av_mallocz(FFABS(p->linesize[0]));
|
|
if (!last)
|
|
return AVERROR(ENOMEM);
|
|
|
|
init_put_bits(&pb2, ctx->buf, ctx->size);
|
|
|
|
comps = ctx->comps;
|
|
/* initialize JPEG-LS state from JPEG parameters */
|
|
state.near = ctx->pred;
|
|
state.bpp = (avctx->pix_fmt == AV_PIX_FMT_GRAY16) ? 16 : 8;
|
|
ff_jpegls_reset_coding_parameters(&state, 0);
|
|
ff_jpegls_init_state(&state);
|
|
|
|
in = p->data[0];
|
|
if (avctx->pix_fmt == AV_PIX_FMT_GRAY8) {
|
|
int t = 0;
|
|
|
|
for (i = 0; i < avctx->height; i++) {
|
|
int last0 = last[0];
|
|
ls_encode_line(&state, &pb2, last, in, t, avctx->width, 1, 0, 8);
|
|
t = last0;
|
|
in += p->linesize[0];
|
|
}
|
|
} else if (avctx->pix_fmt == AV_PIX_FMT_GRAY16) {
|
|
int t = 0;
|
|
|
|
for (i = 0; i < avctx->height; i++) {
|
|
int last0 = *((uint16_t *)last);
|
|
ls_encode_line(&state, &pb2, last, in, t, avctx->width, 1, 0, 16);
|
|
t = last0;
|
|
in += p->linesize[0];
|
|
}
|
|
} else if (avctx->pix_fmt == AV_PIX_FMT_RGB24) {
|
|
int j, width;
|
|
int Rc[3] = { 0, 0, 0 };
|
|
|
|
width = avctx->width * 3;
|
|
for (i = 0; i < avctx->height; i++) {
|
|
for (j = 0; j < 3; j++) {
|
|
int last0 = last[j];
|
|
ls_encode_line(&state, &pb2, last + j, in + j, Rc[j],
|
|
width, 3, j, 8);
|
|
Rc[j] = last0;
|
|
}
|
|
in += p->linesize[0];
|
|
}
|
|
} else if (avctx->pix_fmt == AV_PIX_FMT_BGR24) {
|
|
int j, width;
|
|
int Rc[3] = { 0, 0, 0 };
|
|
|
|
width = avctx->width * 3;
|
|
for (i = 0; i < avctx->height; i++) {
|
|
for (j = 2; j >= 0; j--) {
|
|
int last0 = last[j];
|
|
ls_encode_line(&state, &pb2, last + j, in + j, Rc[j],
|
|
width, 3, j, 8);
|
|
Rc[j] = last0;
|
|
}
|
|
in += p->linesize[0];
|
|
}
|
|
}
|
|
av_free(last);
|
|
/* Now the actual image data has been written, which enables us to estimate
|
|
* the needed packet size: For every 15 input bits, an escape bit might be
|
|
* added below; and if put_bits_count % 15 is >= 8, then another bit might
|
|
* be added.
|
|
* Furthermore the specification says that after doing 0xff escaping unused
|
|
* bits in the last byte must be set to 0, so just append 7 "optional" zero
|
|
* bits to avoid special-casing. This also simplifies the size calculation:
|
|
* Properly rounding up is now automatically baked-in. */
|
|
put_bits(&pb2, 7, 0);
|
|
/* Make sure that the bit count + padding is representable in an int;
|
|
necessary for put_bits_count() as well as for using a GetBitContext. */
|
|
if (put_bytes_count(&pb2, 0) > INT_MAX / 8 - AV_INPUT_BUFFER_PADDING_SIZE)
|
|
return AVERROR(ERANGE);
|
|
size_in_bits = put_bits_count(&pb2);
|
|
flush_put_bits(&pb2);
|
|
size = size_in_bits * 2U / 15;
|
|
size += 2 + 2 + 2 + 1 + 2 + 2 + 1 + comps * (1 + 1 + 1) + 2 + 2 + 1
|
|
+ comps * (1 + 1) + 1 + 1 + 1; /* Header */
|
|
size += 2 + 2 + 1 + 2 + 2 + 2 + 2 + 2; /* LSE */
|
|
size += 2; /* EOI */
|
|
if ((ret = ff_get_encode_buffer(avctx, pkt, size, 0)) < 0)
|
|
return ret;
|
|
|
|
bytestream2_init_writer(&pb, pkt->data, pkt->size);
|
|
|
|
/* write our own JPEG header, can't use mjpeg_picture_header */
|
|
put_marker_byteu(&pb, SOI);
|
|
put_marker_byteu(&pb, SOF48);
|
|
bytestream2_put_be16u(&pb, 8 + comps * 3); // header size depends on components
|
|
bytestream2_put_byteu(&pb, (avctx->pix_fmt == AV_PIX_FMT_GRAY16) ? 16 : 8); // bpp
|
|
bytestream2_put_be16u(&pb, avctx->height);
|
|
bytestream2_put_be16u(&pb, avctx->width);
|
|
bytestream2_put_byteu(&pb, comps); // components
|
|
for (i = 1; i <= comps; i++) {
|
|
bytestream2_put_byteu(&pb, i); // component ID
|
|
bytestream2_put_byteu(&pb, 0x11); // subsampling: none
|
|
bytestream2_put_byteu(&pb, 0); // Tiq, used by JPEG-LS ext
|
|
}
|
|
|
|
put_marker_byteu(&pb, SOS);
|
|
bytestream2_put_be16u(&pb, 6 + comps * 2);
|
|
bytestream2_put_byteu(&pb, comps);
|
|
for (i = 1; i <= comps; i++) {
|
|
bytestream2_put_byteu(&pb, i); // component ID
|
|
bytestream2_put_byteu(&pb, 0); // mapping index: none
|
|
}
|
|
bytestream2_put_byteu(&pb, ctx->pred);
|
|
bytestream2_put_byteu(&pb, (comps > 1) ? 1 : 0); // interleaving: 0 - plane, 1 - line
|
|
bytestream2_put_byteu(&pb, 0); // point transform: none
|
|
|
|
ls_store_lse(&state, &pb);
|
|
|
|
/* do escape coding */
|
|
init_get_bits(&gb, pb2.buf, size_in_bits);
|
|
size_in_bits -= 7;
|
|
while (get_bits_count(&gb) < size_in_bits) {
|
|
int v;
|
|
v = get_bits(&gb, 8);
|
|
bytestream2_put_byteu(&pb, v);
|
|
if (v == 0xFF) {
|
|
v = get_bits(&gb, 7);
|
|
bytestream2_put_byteu(&pb, v);
|
|
}
|
|
}
|
|
|
|
/* End of image */
|
|
put_marker_byteu(&pb, EOI);
|
|
|
|
av_shrink_packet(pkt, bytestream2_tell_p(&pb));
|
|
*got_packet = 1;
|
|
return 0;
|
|
}
|
|
|
|
/**
 * Initialize the encoder: validate the dimensions, derive the component
 * count from the pixel format and allocate the scratch bitstream buffer.
 *
 * @return 0 on success, AVERROR(EINVAL) if a dimension exceeds 65535,
 *         AVERROR(ERANGE) if the scratch buffer size would not fit the
 *         PutBit API, AVERROR(ENOMEM) on allocation failure
 */
static av_cold int encode_jpegls_init(AVCodecContext *avctx)
{
    JPEGLSContext *ctx = avctx->priv_data;
    const int is_gray  = avctx->pix_fmt == AV_PIX_FMT_GRAY8 ||
                         avctx->pix_fmt == AV_PIX_FMT_GRAY16;
    size_t size        = AV_INPUT_BUFFER_MIN_SIZE;

    /* width and height are written as 16-bit fields in the frame header */
    if ((avctx->width | avctx->height) > UINT16_MAX) {
        av_log(avctx, AV_LOG_ERROR, "Dimensions exceeding 65535x65535\n");
        return AVERROR(EINVAL);
    }

    ctx->comps = is_gray ? 1 : 3;

    /* INT_MAX due to PutBit-API. */
    if (avctx->width * (unsigned)avctx->height > (INT_MAX - size) / 4 / ctx->comps)
        return AVERROR(ERANGE);

    /* reserve 4 bytes per sample on top of the minimum buffer size */
    size += 4 * ctx->comps * avctx->width * avctx->height;

    ctx->size = size;
    ctx->buf  = av_malloc(size + AV_INPUT_BUFFER_PADDING_SIZE);
    if (!ctx->buf)
        return AVERROR(ENOMEM);

    return 0;
}
|
|
|
|
/**
 * Release the scratch bitstream buffer allocated by encode_jpegls_init().
 *
 * @return always 0
 */
static av_cold int encode_jpegls_close(AVCodecContext *avctx)
{
    JPEGLSContext *const priv = avctx->priv_data;

    av_freep(&priv->buf);

    return 0;
}
|
|
|
|
#define OFFSET(x) offsetof(JPEGLSContext, x)
|
|
#define VE AV_OPT_FLAG_VIDEO_PARAM | AV_OPT_FLAG_ENCODING_PARAM
|
|
static const AVOption options[] = {
|
|
{ "pred", "Prediction method", OFFSET(pred), AV_OPT_TYPE_INT, { .i64 = 0 }, 0, 2, VE, "pred" },
|
|
{ "left", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = 0 }, INT_MIN, INT_MAX, VE, "pred" },
|
|
{ "plane", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = 1 }, INT_MIN, INT_MAX, VE, "pred" },
|
|
{ "median", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = 2 }, INT_MIN, INT_MAX, VE, "pred" },
|
|
|
|
{ NULL},
|
|
};
|
|
|
|
static const AVClass jpegls_class = {
|
|
.class_name = "jpegls",
|
|
.item_name = av_default_item_name,
|
|
.option = options,
|
|
.version = LIBAVUTIL_VERSION_INT,
|
|
};
|
|
|
|
const FFCodec ff_jpegls_encoder = {
|
|
.p.name = "jpegls",
|
|
CODEC_LONG_NAME("JPEG-LS"),
|
|
.p.type = AVMEDIA_TYPE_VIDEO,
|
|
.p.id = AV_CODEC_ID_JPEGLS,
|
|
.p.capabilities = AV_CODEC_CAP_DR1 | AV_CODEC_CAP_FRAME_THREADS,
|
|
.priv_data_size = sizeof(JPEGLSContext),
|
|
.p.priv_class = &jpegls_class,
|
|
.init = encode_jpegls_init,
|
|
FF_CODEC_ENCODE_CB(encode_picture_ls),
|
|
.close = encode_jpegls_close,
|
|
.p.pix_fmts = (const enum AVPixelFormat[]) {
|
|
AV_PIX_FMT_BGR24, AV_PIX_FMT_RGB24,
|
|
AV_PIX_FMT_GRAY8, AV_PIX_FMT_GRAY16,
|
|
AV_PIX_FMT_NONE
|
|
},
|
|
.caps_internal = FF_CODEC_CAP_INIT_CLEANUP,
|
|
};
|