demux: allow refresh seek for non-video streams

Since d41f0a54b0, enabling a stream will
no longer perform a refresh seek, to fix issues with switching video
tracks. Additionally, 62e9a0c5f6 also
prevents refresh seek on track switching when it happens right after a
seek.

Unfortunately, when external audio files are loaded, preventing refresh
seeks can cause A-V sync issues. Since external tracks have separate demuxer
instances from the internal tracks, the demuxer instances from both
internal and external tracks are explicitly sought to the same pts when
seeking is performed. When enabling an external audio track for the first
time, the existing logic prevents refresh seek because no packets have ever
been read, so the track ends up not being sought. This means that switching
the track in the middle of playback results in a huge A-V desync.

To make it worse, unlike one demuxer instance with multiple tracks,
tracks from multiple demuxer instances are not synced in any meaningful
way beyond the separate explicit seeking. The only thing which keeps these
tracks synced is the generic A-V sync logic, which is unfit for such large
desync above. This means the audio is at the start position after the track
is switched, behind the video, so the audio is not considered ready, and
audio is continuously filtered sequentially until it is synced to the video.
While this is happening, the audio filtering exhausts all CPU resources.

There is also a case with cache enabled: if a seek causes some new data to
be cached, the demuxer is sought to the end of joined cache range.
If track is switched after this, the existing logic prevents a refresh seek,
so the demuxer is at a wrong position after the track is switched.

Fix this by allowing refresh seek for non-video streams, even when no packets
have been read yet or immediately after a seek.
This commit is contained in:
nanahi 2024-06-21 03:43:08 -04:00 committed by Dudemanguy
parent e5d85704a3
commit 940854c86f
1 changed files with 25 additions and 13 deletions

View File

@ -3964,6 +3964,28 @@ static void initiate_refresh_seek(struct demux_internal *in,
in->seek_pts = start_ts; in->seek_pts = start_ts;
} }
// Called locked.
static void refresh_track(struct demuxer *demuxer, struct sh_stream *stream,
double ref_pts)
{
struct demux_internal *in = demuxer->in;
struct demux_stream *ds = stream->ds;
ref_pts = MP_ADD_PTS(ref_pts, -in->ts_offset);
MP_VERBOSE(in, "refresh track %d\n", stream->index);
if (in->back_demuxing)
ds->back_seek_pos = ref_pts;
// Allow refresh seek for non-video streams, even if no packets have
// ever been read yet or after seeking. This is necessary because:
// - A-V sync targets may come from different demuxers, so enabling an external
// audio track for the first time can cause desync since a seek is not performed.
// - If cache is enabled and a seek causes some new data to be cached, the demuxer
// is sought to the end of cache after cache joining. Switching track immediately
// after this also causes the same problem.
if (!in->after_seek || ds->type != STREAM_VIDEO)
initiate_refresh_seek(in, ds, ref_pts);
}
// Set whether the given stream should return packets. // Set whether the given stream should return packets.
// ref_pts is used only if the stream is enabled. Then it serves as approximate // ref_pts is used only if the stream is enabled. Then it serves as approximate
// start pts for this stream (in the worst case it is ignored). // start pts for this stream (in the worst case it is ignored).
@ -3973,19 +3995,14 @@ void demuxer_select_track(struct demuxer *demuxer, struct sh_stream *stream,
struct demux_internal *in = demuxer->in; struct demux_internal *in = demuxer->in;
struct demux_stream *ds = stream->ds; struct demux_stream *ds = stream->ds;
mp_mutex_lock(&in->lock); mp_mutex_lock(&in->lock);
ref_pts = MP_ADD_PTS(ref_pts, -in->ts_offset);
// don't flush buffers if stream is already selected / unselected // don't flush buffers if stream is already selected / unselected
if (ds->selected != selected) { if (ds->selected != selected) {
MP_VERBOSE(in, "%sselect track %d\n", selected ? "" : "de", stream->index); MP_VERBOSE(in, "%sselect track %d\n", selected ? "" : "de", stream->index);
ds->selected = selected; ds->selected = selected;
update_stream_selection_state(in, ds); update_stream_selection_state(in, ds);
in->tracks_switched = true; in->tracks_switched = true;
if (ds->selected) { if (ds->selected)
if (in->back_demuxing) refresh_track(demuxer, stream, ref_pts);
ds->back_seek_pos = ref_pts;
if (!in->after_seek)
initiate_refresh_seek(in, ds, ref_pts);
}
if (in->threading) { if (in->threading) {
mp_cond_signal(&in->wakeup); mp_cond_signal(&in->wakeup);
} else { } else {
@ -4003,14 +4020,9 @@ void demuxer_refresh_track(struct demuxer *demuxer, struct sh_stream *stream,
struct demux_internal *in = demuxer->in; struct demux_internal *in = demuxer->in;
struct demux_stream *ds = stream->ds; struct demux_stream *ds = stream->ds;
mp_mutex_lock(&in->lock); mp_mutex_lock(&in->lock);
ref_pts = MP_ADD_PTS(ref_pts, -in->ts_offset);
if (ds->selected) { if (ds->selected) {
MP_VERBOSE(in, "refresh track %d\n", stream->index);
update_stream_selection_state(in, ds); update_stream_selection_state(in, ds);
if (in->back_demuxing) refresh_track(demuxer, stream, ref_pts);
ds->back_seek_pos = ref_pts;
if (!in->after_seek)
initiate_refresh_seek(in, ds, ref_pts);
} }
mp_mutex_unlock(&in->lock); mp_mutex_unlock(&in->lock);
} }