
[FFmpeg-devel,10/39] lavc/ffv1dec: move the bitreader to stack

Message ID 20240716171155.31838-10-anton@khirnov.net
State New
Series [FFmpeg-devel,01/39] tests/fate/vcodec: add vsynth tests for FFV1 version 2

Checks

Context Check Description
andriy/make_x86 success Make finished
andriy/make_fate_x86 success Make fate finished

Commit Message

Anton Khirnov July 16, 2024, 5:11 p.m. UTC
There is no reason to place it in persistent state.
---
 libavcodec/ffv1.h             |  1 -
 libavcodec/ffv1dec.c          | 28 +++++++++++++++-------------
 libavcodec/ffv1dec_template.c | 23 ++++++++++++-----------
 3 files changed, 27 insertions(+), 25 deletions(-)

Comments

Michael Niedermayer July 17, 2024, 10:42 p.m. UTC | #1
On Tue, Jul 16, 2024 at 07:11:25PM +0200, Anton Khirnov wrote:
> There is no reason to place it in persistent state.
> ---
>  libavcodec/ffv1.h             |  1 -
>  libavcodec/ffv1dec.c          | 28 +++++++++++++++-------------
>  libavcodec/ffv1dec_template.c | 23 ++++++++++++-----------
>  3 files changed, 27 insertions(+), 25 deletions(-)

more complex code, an additional pointer to pass around

all the stuff should be put together close so it's efficiently
using CPU caches

thx

[...]
Anton Khirnov July 18, 2024, 9:08 a.m. UTC | #2
Quoting Michael Niedermayer (2024-07-18 00:42:05)
> all the stuff should be put together close so it's efficiently
> using CPU caches

Which is why it shares its cacheline with PutBitContext, because the
code benefits from having both in the cache, right? And the 4-byte
hole in PutBitContext is there presumably to aerate the cache for
smoother data streaming.

More seriously, this is not how caches work. Being close together
matters mainly so long as your data fits in a cacheline, beyond that
physical proximity matters little. On stack, the bitreader is likely to
share the cacheline with other data that is currently needed, thus
improving cache utilization.

Another factor that matters in efficient cache use is e.g. not having
multiple copies of the same constant data scattered around, which you're
objecting to in my other patches.
Michael Niedermayer July 18, 2024, 2:48 p.m. UTC | #3
On Thu, Jul 18, 2024 at 11:08:59AM +0200, Anton Khirnov wrote:
> Quoting Michael Niedermayer (2024-07-18 00:42:05)
> > all the stuff should be put together close so its efficiently
> > using CPU caches
> 
> Which is why it shares its cacheline with PutBitContext, because the
> code benefits from having both in the cache, right? And the 4-byte
> hole in PutBitContext is there presumably to aerate the cache for
> smoother data streaming.

thanks for spotting these, can you fix these?


> 
> More seriously, this is not how caches work. Being close together
> matters mainly so long as your data fits in a cacheline, beyond that
> physical proximity matters little. On stack, the bitreader is likely to
> share the cacheline with other data that is currently needed, thus
> improving cache utilization.

caches are complex, and being close does matter.
having things in separate allocations risks hitting aliasing cases
(that is, things that cannot be in the cache at the same time)
so when you have the bitstream, the frame buffer and the context already
in 3 independent locations, adding a few more increases the risk of hitting
these.
Also sequential memory access is faster than non-sequential; it makes
more sense to put things together in a few places than to scatter them

It's years since I've done hardcore optimization stuff, but I don't think
the principles have changed so much that random access is now faster than
sequential or that caches work fundamentally differently


> 
> Another factor that matters in efficient cache use is e.g. not having
> multiple copies of the same constant data scattered around, which you're
> objecting to in my other patches.

copying the actually used small data together per slice,
where it's accessed per pixel, should improve the speed per pixel while
making the per-slice code a little slower. now we have maybe 4 slices
and millions of pixels. That's why this can give an overall gain

thx

[...]
Anton Khirnov July 18, 2024, 3:31 p.m. UTC | #4
Quoting Michael Niedermayer (2024-07-18 16:48:06)
> On Thu, Jul 18, 2024 at 11:08:59AM +0200, Anton Khirnov wrote:
> > Quoting Michael Niedermayer (2024-07-18 00:42:05)
> > > all the stuff should be put together close so it's efficiently
> > > using CPU caches
> > 
> > Which is why it shares its cacheline with PutBitContext, because the
> > code benefits from having both in the cache, right? And the 4-byte
> > hole in PutBitContext is there presumably to aerate the cache for
> > smoother data streaming.
> 
> thanks for spotting these, can you fix these?

I have no interest in optimizing the performance of this code. My
primary goal here is to remove FFV1-specific hacks from the frame
threading code for patch 33/39, which is in turn needed for 38/39.

As a public service, I also spent some effort on making the ffv1 code
easier to understand, but if you insist on keeping the code as it is I
can also just drop its non-compliant frame threading implementation.

> > 
> > More seriously, this is not how caches work. Being close together
> > matters mainly so long as your data fits in a cacheline, beyond that
> > physical proximity matters little. On stack, the bitreader is likely to
> > share the cacheline with other data that is currently needed, thus
> > improving cache utilization.
> 
> caches are complex, and being close does matter.
> having things in separate allocations risks hitting aliasing cases
> (that is, things that cannot be in the cache at the same time)
> so when you have the bitstream, the frame buffer and the context already
> in 3 independent locations, adding a few more increases the risk of hitting
> these.
> Also sequential memory access is faster than non-sequential; it makes
> more sense to put things together in a few places than to scatter them
> 
> It's years since I've done hardcore optimization stuff, but I don't think
> the principles have changed so much that random access is now faster than
> sequential or that caches work fundamentally differently

I don't see how any of these arguments are relevant - I am not moving
the bitreader to a new allocation, but to stack, which is already highly
likely to be in cache.

> > 
> > Another factor that matters in efficient cache use is e.g. not having
> > multiple copies of the same constant data scattered around, which you're
> > objecting to in my other patches.
> 
> copying the actually used small data together per slice,
> where it's accessed per pixel, should improve the speed per pixel while
> making the per-slice code a little slower. now we have maybe 4 slices
> and millions of pixels. That's why this can give an overall gain

This all sounds like premature optimization, AKA the root of all evil.
As I said above, I intended to make this code more readable, not faster.
Yet somehow it became faster anyway, which suggests this code is not
very optimized. So then arguing whether this or that specific change
adds or removes a few cycles per frame seems like a waste of time to me.
Paul B Mahol July 18, 2024, 3:35 p.m. UTC | #5
On Thu, Jul 18, 2024 at 5:31 PM Anton Khirnov <anton@khirnov.net> wrote:

> Quoting Michael Niedermayer (2024-07-18 16:48:06)
> > On Thu, Jul 18, 2024 at 11:08:59AM +0200, Anton Khirnov wrote:
> > > Quoting Michael Niedermayer (2024-07-18 00:42:05)
> > > > all the stuff should be put together close so it's efficiently
> > > > using CPU caches
> > >
> > > Which is why it shares its cacheline with PutBitContext, because the
> > > code benefits from having both in the cache, right? And the 4-byte
> > > hole in PutBitContext is there presumably to aerate the cache for
> > > smoother data streaming.
> >
> > thanks for spotting these, can you fix these?
>
> I have no interest in optimizing the performance of this code. My
> primary goal here is to remove FFV1-specific hacks from the frame
> threading code for patch 33/39, which is in turn needed for 38/39.
>
> As a public service, I also spent some effort on making the ffv1 code
> easier to understand, but if you insist on keeping the code as it is I
> can also just drop its non-compliant frame threading implementation.
>
> > >
> > > More seriously, this is not how caches work. Being close together
> > > matters mainly so long as your data fits in a cacheline, beyond that
> > > physical proximity matters little. On stack, the bitreader is likely to
> > > share the cacheline with other data that is currently needed, thus
> > > improving cache utilization.
> >
> > caches are complex, and being close does matter.
> > having things in separate allocations risks hitting aliasing cases
> > (that is, things that cannot be in the cache at the same time)
> > so when you have the bitstream, the frame buffer and the context already
> > in 3 independent locations, adding a few more increases the risk of
> > hitting these.
> > Also sequential memory access is faster than non-sequential; it makes
> > more sense to put things together in a few places than to scatter them
> >
> > It's years since I've done hardcore optimization stuff, but I don't think
> > the principles have changed so much that random access is now faster than
> > sequential or that caches work fundamentally differently
>
> I don't see how any of these arguments are relevant - I am not moving
> the bitreader to a new allocation, but to stack, which is already highly
> likely to be in cache.
>
> > >
> > > Another factor that matters in efficient cache use is e.g. not having
> > > multiple copies of the same constant data scattered around, which
> > > you're objecting to in my other patches.
> >
> > copying the actually used small data together per slice,
> > where it's accessed per pixel, should improve the speed per pixel while
> > making the per-slice code a little slower. now we have maybe 4 slices
> > and millions of pixels. That's why this can give an overall gain
>
> This all sounds like premature optimization, AKA the root of all evil.
> As I said above, I intended to make this code more readable, not faster.
> Yet somehow it became faster anyway, which suggests this code is not
> very optimized. So then arguing whether this or that specific change
> adds or removes a few cycles per frame seems like a waste of time to me.
>


Will merge this into Librempeg if it does not get into FFmpeg.


>
> --
> Anton Khirnov
> _______________________________________________
> ffmpeg-devel mailing list
> ffmpeg-devel@ffmpeg.org
> https://ffmpeg.org/mailman/listinfo/ffmpeg-devel
>
> To unsubscribe, visit link above, or email
> ffmpeg-devel-request@ffmpeg.org with subject "unsubscribe".
>
Michael Niedermayer July 18, 2024, 6:18 p.m. UTC | #6
On Thu, Jul 18, 2024 at 05:31:16PM +0200, Anton Khirnov wrote:
> Quoting Michael Niedermayer (2024-07-18 16:48:06)
> > On Thu, Jul 18, 2024 at 11:08:59AM +0200, Anton Khirnov wrote:
> > > Quoting Michael Niedermayer (2024-07-18 00:42:05)
[...]
> > >
> > > Another factor that matters in efficient cache use is e.g. not having
> > > multiple copies of the same constant data scattered around, which you're
> > > objecting to in my other patches.
> > 
> > copying the actually used small data together per slice,
> > where it's accessed per pixel, should improve the speed per pixel while
> > making the per-slice code a little slower. now we have maybe 4 slices
> > and millions of pixels. That's why this can give an overall gain
> 
> This all sounds like premature optimization, AKA the root of all evil.
> As I said above, I intended to make this code more readable, not faster.
> Yet somehow it became faster anyway, which suggests this code is not
> very optimized. So then arguing whether this or that specific change
> adds or removes a few cycles per frame seems like a waste of time to me.

Making the code faster is welcome
Making the code cleaner is welcome

what's faster is objective (mostly)
what's cleaner is not objective. So we could agree or disagree on that

Things that make the code slower, and don't provide a larger improvement
elsewhere, I do object to

About "premature optimization", I have not seen any optimizations being
removed that made the code hard to maintain or work with, so this is
not a nice statement.
And I am the first to support making the code cleaner and easier to maintain,
as I am the one maintaining it.

Either way, thanks for your efforts in improving the ffv1 code; they
are appreciated. My objections are not meant to hinder improvements,
I just want to make sure each one individually is an improvement

thx

--
Michael     GnuPG fingerprint: 9FF2128B147EF6730BADF133611EC787040B0FAB

Any man who breaks a law that conscience tells him is unjust and willingly 
accepts the penalty by staying in jail in order to arouse the conscience of 
the community on the injustice of the law is at that moment expressing the 
very highest respect for law. - Martin Luther King Jr
Anton Khirnov July 20, 2024, 12:15 p.m. UTC | #7
Quoting Michael Niedermayer (2024-07-18 20:18:15)
> On Thu, Jul 18, 2024 at 05:31:16PM +0200, Anton Khirnov wrote:
> > Quoting Michael Niedermayer (2024-07-18 16:48:06)
> > > On Thu, Jul 18, 2024 at 11:08:59AM +0200, Anton Khirnov wrote:
> > > > Quoting Michael Niedermayer (2024-07-18 00:42:05)
> [...]
> > > >
> > > > Another factor that matters in efficient cache use is e.g. not having
> > > > multiple copies of the same constant data scattered around, which you're
> > > > objecting to in my other patches.
> > > 
> > > copying the actually used small data together per slice,
> > > where it's accessed per pixel, should improve the speed per pixel while
> > > making the per-slice code a little slower. now we have maybe 4 slices
> > > and millions of pixels. That's why this can give an overall gain
> > 
> > This all sounds like premature optimization, AKA the root of all evil.
> > As I said above, I intended to make this code more readable, not faster.
> > Yet somehow it became faster anyway, which suggests this code is not
> > very optimized. So then arguing whether this or that specific change
> > > adds or removes a few cycles per frame seems like a waste of time to me.
> 
> Making the code faster is welcome
> Making the code cleaner is welcome
> 
> what's faster is objective (mostly)
> what's cleaner is not objective. So we could agree or disagree on that
> 
> Things that make the code slower, and don't provide a larger improvement
> elsewhere, I do object to
> 
> About "premature optimization", I have not seen any optimizations being
> removed that made the code hard to maintain or work with, so this is
> not a nice statement.
> And I am the first to support making the code cleaner and easier to maintain,
> as I am the one maintaining it.
> 
> Either way, thanks for your efforts in improving the ffv1 code; they
> are appreciated. My objections are not meant to hinder improvements,
> I just want to make sure each one individually is an improvement

As I said in my other reply, patches 07-25 moving per-slice data to a
new per-slice struct should be considered as one change, as it does not
make sense to apply only some of them and not the others. Some of them,
taken individually, may introduce transient slowdown, because
temporarily there are two per-slice contexts.

Patch

diff --git a/libavcodec/ffv1.h b/libavcodec/ffv1.h
index 68d13a2964..c88aa8c30d 100644
--- a/libavcodec/ffv1.h
+++ b/libavcodec/ffv1.h
@@ -85,7 +85,6 @@  typedef struct FFV1Context {
     AVClass *class;
     AVCodecContext *avctx;
     RangeCoder c;
-    GetBitContext gb;
     PutBitContext pb;
     uint64_t rc_stat[256][2];
     uint64_t (*rc_stat2[MAX_QUANT_TABLES])[32][2];
diff --git a/libavcodec/ffv1dec.c b/libavcodec/ffv1dec.c
index a2971d7eea..a1f7206871 100644
--- a/libavcodec/ffv1dec.c
+++ b/libavcodec/ffv1dec.c
@@ -94,14 +94,14 @@  static inline int get_vlc_symbol(GetBitContext *gb, VlcState *const state,
     return ret;
 }
 
-static int is_input_end(FFV1Context *s)
+static int is_input_end(FFV1Context *s, GetBitContext *gb)
 {
     if (s->ac != AC_GOLOMB_RICE) {
         RangeCoder *const c = &s->c;
         if (c->overread > MAX_OVERREAD)
             return AVERROR_INVALIDDATA;
     } else {
-        if (get_bits_left(&s->gb) < 1)
+        if (get_bits_left(gb) < 1)
             return AVERROR_INVALIDDATA;
     }
     return 0;
@@ -118,6 +118,7 @@  static int is_input_end(FFV1Context *s)
 #include "ffv1dec_template.c"
 
 static int decode_plane(FFV1Context *s, FFV1SliceContext *sc,
+                        GetBitContext *gb,
                         uint8_t *src, int w, int h, int stride, int plane_index,
                          int pixel_stride)
 {
@@ -140,13 +141,13 @@  static int decode_plane(FFV1Context *s, FFV1SliceContext *sc,
         sample[0][w]  = sample[0][w - 1];
 
         if (s->avctx->bits_per_raw_sample <= 8) {
-            int ret = decode_line(s, sc, w, sample, plane_index, 8);
+            int ret = decode_line(s, sc, gb, w, sample, plane_index, 8);
             if (ret < 0)
                 return ret;
             for (x = 0; x < w; x++)
                 src[x*pixel_stride + stride * y] = sample[1][x];
         } else {
-            int ret = decode_line(s, sc, w, sample, plane_index, s->avctx->bits_per_raw_sample);
+            int ret = decode_line(s, sc, gb, w, sample, plane_index, s->avctx->bits_per_raw_sample);
             if (ret < 0)
                 return ret;
             if (s->packed_at_lsb) {
@@ -262,6 +263,7 @@  static int decode_slice(AVCodecContext *c, void *arg)
     AVFrame * const p = f->picture.f;
     const int      si = (FFV1Context**)arg - f->slice_context;
     FFV1SliceContext *sc = &f->slices[si];
+    GetBitContext gb;
 
     if (f->fsrc && !(p->flags & AV_FRAME_FLAG_KEY) && f->last_picture.f)
         ff_progress_frame_await(&f->last_picture, si);
@@ -322,7 +324,7 @@  static int decode_slice(AVCodecContext *c, void *arg)
         if (f->version == 3 && f->micro_version > 1 || f->version > 3)
             get_rac(&fs->c, (uint8_t[]) { 129 });
         fs->ac_byte_count = f->version > 2 || (!x && !y) ? fs->c.bytestream - fs->c.bytestream_start - 1 : 0;
-        init_get_bits(&fs->gb,
+        init_get_bits(&gb,
                       fs->c.bytestream_start + fs->ac_byte_count,
                       (fs->c.bytestream_end - fs->c.bytestream_start - fs->ac_byte_count) * 8);
     }
@@ -333,29 +335,29 @@  static int decode_slice(AVCodecContext *c, void *arg)
         const int chroma_height = AV_CEIL_RSHIFT(height, f->chroma_v_shift);
         const int cx            = x >> f->chroma_h_shift;
         const int cy            = y >> f->chroma_v_shift;
-        decode_plane(fs, sc, p->data[0] + ps*x + y*p->linesize[0], width, height, p->linesize[0], 0, 1);
+        decode_plane(fs, sc, &gb, p->data[0] + ps*x + y*p->linesize[0], width, height, p->linesize[0], 0, 1);
 
         if (f->chroma_planes) {
-            decode_plane(fs, sc, p->data[1] + ps*cx+cy*p->linesize[1], chroma_width, chroma_height, p->linesize[1], 1, 1);
-            decode_plane(fs, sc, p->data[2] + ps*cx+cy*p->linesize[2], chroma_width, chroma_height, p->linesize[2], 1, 1);
+            decode_plane(fs, sc, &gb, p->data[1] + ps*cx+cy*p->linesize[1], chroma_width, chroma_height, p->linesize[1], 1, 1);
+            decode_plane(fs, sc, &gb, p->data[2] + ps*cx+cy*p->linesize[2], chroma_width, chroma_height, p->linesize[2], 1, 1);
         }
         if (fs->transparency)
-            decode_plane(fs, sc, p->data[3] + ps*x + y*p->linesize[3], width, height, p->linesize[3], (f->version >= 4 && !f->chroma_planes) ? 1 : 2, 1);
+            decode_plane(fs, sc, &gb, p->data[3] + ps*x + y*p->linesize[3], width, height, p->linesize[3], (f->version >= 4 && !f->chroma_planes) ? 1 : 2, 1);
     } else if (f->colorspace == 0) {
-         decode_plane(fs, sc, p->data[0] + ps*x + y*p->linesize[0]    , width, height, p->linesize[0], 0, 2);
-         decode_plane(fs, sc, p->data[0] + ps*x + y*p->linesize[0] + 1, width, height, p->linesize[0], 1, 2);
+         decode_plane(fs, sc, &gb, p->data[0] + ps*x + y*p->linesize[0]    , width, height, p->linesize[0], 0, 2);
+         decode_plane(fs, sc, &gb, p->data[0] + ps*x + y*p->linesize[0] + 1, width, height, p->linesize[0], 1, 2);
     } else if (f->use32bit) {
         uint8_t *planes[4] = { p->data[0] + ps * x + y * p->linesize[0],
                                p->data[1] + ps * x + y * p->linesize[1],
                                p->data[2] + ps * x + y * p->linesize[2],
                                p->data[3] + ps * x + y * p->linesize[3] };
-        decode_rgb_frame32(fs, sc, planes, width, height, p->linesize);
+        decode_rgb_frame32(fs, sc, &gb, planes, width, height, p->linesize);
     } else {
         uint8_t *planes[4] = { p->data[0] + ps * x + y * p->linesize[0],
                                p->data[1] + ps * x + y * p->linesize[1],
                                p->data[2] + ps * x + y * p->linesize[2],
                                p->data[3] + ps * x + y * p->linesize[3] };
-        decode_rgb_frame(fs, sc, planes, width, height, p->linesize);
+        decode_rgb_frame(fs, sc, &gb, planes, width, height, p->linesize);
     }
     if (fs->ac != AC_GOLOMB_RICE && f->version > 2) {
         int v;
diff --git a/libavcodec/ffv1dec_template.c b/libavcodec/ffv1dec_template.c
index 8e2e38c0b9..e9d3002be9 100644
--- a/libavcodec/ffv1dec_template.c
+++ b/libavcodec/ffv1dec_template.c
@@ -23,8 +23,8 @@ 
 #include "ffv1_template.c"
 
 static av_always_inline int
-RENAME(decode_line)(FFV1Context *s, FFV1SliceContext *sc, int w,
-                    TYPE *sample[2], int plane_index, int bits)
+RENAME(decode_line)(FFV1Context *s, FFV1SliceContext *sc, GetBitContext *gb,
+                    int w, TYPE *sample[2], int plane_index, int bits)
 {
     PlaneContext *const p = &s->plane[plane_index];
     RangeCoder *const c   = &s->c;
@@ -33,7 +33,7 @@  RENAME(decode_line)(FFV1Context *s, FFV1SliceContext *sc, int w,
     int run_mode  = 0;
     int run_index = sc->run_index;
 
-    if (is_input_end(s))
+    if (is_input_end(s, gb))
         return AVERROR_INVALIDDATA;
 
     if (s->slice_coding_mode == 1) {
@@ -53,7 +53,7 @@  RENAME(decode_line)(FFV1Context *s, FFV1SliceContext *sc, int w,
         int diff, context, sign;
 
         if (!(x & 1023)) {
-            if (is_input_end(s))
+            if (is_input_end(s, gb))
                 return AVERROR_INVALIDDATA;
         }
 
@@ -74,13 +74,13 @@  RENAME(decode_line)(FFV1Context *s, FFV1SliceContext *sc, int w,
 
             if (run_mode) {
                 if (run_count == 0 && run_mode == 1) {
-                    if (get_bits1(&s->gb)) {
+                    if (get_bits1(gb)) {
                         run_count = 1 << ff_log2_run[run_index];
                         if (x + run_count <= w)
                             run_index++;
                     } else {
                         if (ff_log2_run[run_index])
-                            run_count = get_bits(&s->gb, ff_log2_run[run_index]);
+                            run_count = get_bits(gb, ff_log2_run[run_index]);
                         else
                             run_count = 0;
                         if (run_index)
@@ -105,17 +105,17 @@  RENAME(decode_line)(FFV1Context *s, FFV1SliceContext *sc, int w,
                 if (run_count < 0) {
                     run_mode  = 0;
                     run_count = 0;
-                    diff      = get_vlc_symbol(&s->gb, &p->vlc_state[context],
+                    diff      = get_vlc_symbol(gb, &p->vlc_state[context],
                                                bits);
                     if (diff >= 0)
                         diff++;
                 } else
                     diff = 0;
             } else
-                diff = get_vlc_symbol(&s->gb, &p->vlc_state[context], bits);
+                diff = get_vlc_symbol(gb, &p->vlc_state[context], bits);
 
             ff_dlog(s->avctx, "count:%d index:%d, mode:%d, x:%d pos:%d\n",
-                    run_count, run_index, run_mode, x, get_bits_count(&s->gb));
+                    run_count, run_index, run_mode, x, get_bits_count(gb));
         }
 
         if (sign)
@@ -128,6 +128,7 @@  RENAME(decode_line)(FFV1Context *s, FFV1SliceContext *sc, int w,
 }
 
 static int RENAME(decode_rgb_frame)(FFV1Context *s, FFV1SliceContext *sc,
+                                    GetBitContext *gb,
                                     uint8_t *src[4], int w, int h, int stride[4])
 {
     int x, y, p;
@@ -157,9 +158,9 @@  static int RENAME(decode_rgb_frame)(FFV1Context *s, FFV1SliceContext *sc,
             sample[p][1][-1]= sample[p][0][0  ];
             sample[p][0][ w]= sample[p][0][w-1];
             if (lbd && s->slice_coding_mode == 0)
-                ret = RENAME(decode_line)(s, sc, w, sample[p], (p + 1)/2, 9);
+                ret = RENAME(decode_line)(s, sc, gb, w, sample[p], (p + 1)/2, 9);
             else
-                ret = RENAME(decode_line)(s, sc, w, sample[p], (p + 1)/2, bits + (s->slice_coding_mode != 1));
+                ret = RENAME(decode_line)(s, sc, gb, w, sample[p], (p + 1)/2, bits + (s->slice_coding_mode != 1));
             if (ret < 0)
                 return ret;
         }