Git Inbox Mirror of the ffmpeg-devel mailing list - see https://ffmpeg.org/mailman/listinfo/ffmpeg-devel
 help / color / mirror / Atom feed
From: Dimitry Andric <dimitry@unified-streaming.com>
To: FFmpeg development discussions and patches <ffmpeg-devel@ffmpeg.org>
Subject: Re: [FFmpeg-devel] [PATCH] avformat/mov: Fix decoding fragmented MP4 with multiple sample entries and empty stsc
Date: Wed, 2 Jul 2025 14:05:05 +0200
Message-ID: <A10752E2-8E5A-4CF6-A3A4-F8B3B9B8D4F4@unified-streaming.com> (raw)
In-Reply-To: <E4C5AB80-C449-4313-879B-89EF2EDA28E8@unified-streaming.com>

On 31 May 2025, at 20:16, Dimitry Andric <dimitry@unified-streaming.com> wrote:
> 
> On 9 May 2025, at 00:15, James Almer <jamrial@gmail.com> wrote:
>> 
>> On 5/8/2025 7:14 PM, Dimitry Andric wrote:
>>> On 28 Apr 2025, at 13:00, Dimitry Andric <dimitry@unified-streaming.com> wrote:
>>>> 
>>>> On 19 Apr 2025, at 16:27, Dimitry Andric <dimitry@unified-streaming.com> wrote:
>>>>> 
>>>>> On 10 Apr 2025, at 11:03, Dimitry Andric <dimitry@unified-streaming.com> wrote:
>>>>>> 
>>>>>> On 3 Apr 2025, at 22:02, Dimitry Andric <dimitry@unified-streaming.com> wrote:
>>>>>>> 
>>>>>>> When decoding fragmented MP4 files that have an empty stsc box, and
>>>>>>> instead contain sample description indexes in their tfhd boxes, the mov
>>>>>>> demuxer does not notify the decoder whenever the current sample
>>>>>>> description index changes. If the SPS or PPS changed sufficiently, this
>>>>>>> can lead to unexpected decoding errors.
>>>>>>> 
>>>>>>> To fix this, in mov_finalize_packet(), when stsc_data is not available,
>>>>>>> use get_frag_stream_info_from_pkt() to get at the current fragment
>>>>>>> stream info, and retrieve the current sample description index from
>>>>>>> there. Then use that index in a similar manner as the stsc case.
>>>>>>> 
>>>>>>> Signed-off-by: Dimitry Andric <dimitry@unified-streaming.com>
>>>>>>> ---
>>>>>>> libavformat/mov.c | 50 ++++++++++++++++++++++++++++-------------------
>>>>>>> 1 file changed, 30 insertions(+), 20 deletions(-)
>>>>>>> 
>>>>>>> diff --git a/libavformat/mov.c b/libavformat/mov.c
>>>>>>> index 452690090c..ead89192f4 100644
>>>>>>> --- a/libavformat/mov.c
>>>>>>> +++ b/libavformat/mov.c
>>>>>>> @@ -10756,25 +10756,29 @@ static int mov_switch_root(AVFormatContext *s, int64_t target, int index)
>>>>>>> return 1;
>>>>>>> }
>>>>>>> 
>>>>>>> -static int mov_change_extradata(AVStream *st, AVPacket *pkt)
>>>>>>> +static int mov_change_extradata(AVStream *st, AVPacket *pkt, int stsd_id)
>>>>>>> {
>>>>>>> MOVStreamContext *sc = st->priv_data;
>>>>>>> uint8_t *side, *extradata;
>>>>>>> int extradata_size;
>>>>>>> 
>>>>>>> -    /* Save the current index. */
>>>>>>> -    sc->last_stsd_index = sc->stsc_data[sc->stsc_index].id - 1;
>>>>>>> +    if (stsd_id > 0 &&
>>>>>>> +        stsd_id - 1 < sc->stsd_count &&
>>>>>>> +        stsd_id - 1 != sc->last_stsd_index) {
>>>>>>> +        /* Save the current index. */
>>>>>>> +        sc->last_stsd_index = stsd_id - 1;
>>>>>>> 
>>>>>>> -    /* Notify the decoder that extradata changed. */
>>>>>>> -    extradata_size = sc->extradata_size[sc->last_stsd_index];
>>>>>>> -    extradata = sc->extradata[sc->last_stsd_index];
>>>>>>> -    if (st->discard != AVDISCARD_ALL && extradata_size > 0 && extradata) {
>>>>>>> -        side = av_packet_new_side_data(pkt,
>>>>>>> -                                       AV_PKT_DATA_NEW_EXTRADATA,
>>>>>>> -                                       extradata_size);
>>>>>>> -        if (!side)
>>>>>>> -            return AVERROR(ENOMEM);
>>>>>>> -        memcpy(side, extradata, extradata_size);
>>>>>>> +        /* Notify the decoder that extradata changed. */
>>>>>>> +        extradata_size = sc->extradata_size[sc->last_stsd_index];
>>>>>>> +        extradata = sc->extradata[sc->last_stsd_index];
>>>>>>> +        if (st->discard != AVDISCARD_ALL && extradata_size > 0 && extradata) {
>>>>>>> +            side = av_packet_new_side_data(pkt,
>>>>>>> +                                           AV_PKT_DATA_NEW_EXTRADATA,
>>>>>>> +                                           extradata_size);
>>>>>>> +            if (!side)
>>>>>>> +                return AVERROR(ENOMEM);
>>>>>>> +            memcpy(side, extradata, extradata_size);
>>>>>>> +        }
>>>>>>> }
>>>>>>> 
>>>>>>> return 0;
>>>>>>> @@ -10893,13 +10897,10 @@ static int mov_finalize_packet(AVFormatContext *s, AVStream *st, AVIndexEntry *s
>>>>>>> 
>>>>>>> /* Multiple stsd handling. */
>>>>>>> if (sc->stsc_data) {
>>>>>>> -        if (sc->stsc_data[sc->stsc_index].id > 0 &&
>>>>>>> -            sc->stsc_data[sc->stsc_index].id - 1 < sc->stsd_count &&
>>>>>>> -            sc->stsc_data[sc->stsc_index].id - 1 != sc->last_stsd_index) {
>>>>>>> -            int ret = mov_change_extradata(st, pkt);
>>>>>>> -            if (ret < 0)
>>>>>>> -                return ret;
>>>>>>> -        }
>>>>>>> +        int stsd_id = sc->stsc_data[sc->stsc_index].id;
>>>>>>> +        int ret = mov_change_extradata(st, pkt, stsd_id);
>>>>>>> +        if (ret < 0)
>>>>>>> +            return ret;
>>>>>>> 
>>>>>>>     /* Update the stsc index for the next sample */
>>>>>>>     sc->stsc_sample++;
>>>>>>> @@ -10908,6 +10909,15 @@ static int mov_finalize_packet(AVFormatContext *s, AVStream *st, AVIndexEntry *s
>>>>>>>         sc->stsc_index++;
>>>>>>>         sc->stsc_sample = 0;
>>>>>>>     }
>>>>>>> +    } else {
>>>>>>> +        MOVContext *mov = s->priv_data;
>>>>>>> +        MOVFragmentStreamInfo *frag_stream_info = get_frag_stream_info_from_pkt(&mov->frag_index, pkt, sc->id);
>>>>>>> +        if (frag_stream_info) {
>>>>>>> +            int stsd_id = frag_stream_info->stsd_id;
>>>>>>> +            int ret = mov_change_extradata(st, pkt, stsd_id);
>>>>>>> +            if (ret < 0)
>>>>>>> +                return ret;
>>>>>>> +        }
>>>>>>> }
>>>>>>> 
>>>>>>> return 0;
>>>>>>> -- 
>>>>>>> 2.43.0
>>>>>>> 
>>>>>> 
>>>>>> Any comments on this patch?
>>>>> 
>>>>> Ping :)
>>>> 
>>>> Is there any particular group of persons that "own" the mov muxer?
>>> Another ping.
>> 
>> I'll have a look seeing no one else will.
> 
> To provide some backstory here, I will attempt to explain further what
> this patch is supposed to fix. It is specifically about AVC (or possibly
> HEVC) video that has more than one referenced PPS in the elementary
> stream. (One encoder that sometimes produces this kind of video is x264,
> unless you use the --stitchable option).
> 
> In a MP4 file this can be represented by multiple sample description
> entries in the 'stsd' box, and in a progressive file there is a 'stsc'
> box which defines which samples have which sample description indexes.
> FFmpeg handles these just fine.
> 
> However, in a fragmented MP4 file the 'stsc' box is usually empty, and
> the fragments have a 'tfhd' box with a sample description index field
> instead. Such files can sometimes not be decoded properly by FFmpeg,
> since it does not call mov_change_extradata() whenever the sample
> description index changes, somewhere in the middle of the video. In that
> case, it will either complain about a bad PPS ID, or if the ID matches
> but the PPS contents does not, lots of decoding errors will occur.
> 
> This proposed patch makes it so mov_change_extradata() is called even if
> MovStreamContext's sc_data field is empty, but
> get_frag_stream_info_from_pkt() returns a valid stsd_id in its
> MOVFragmentStreamInfo. For fragmented files, mov_read_tfhd() already
> takes care of reading the stsd_id from the tfhd boxes.

Another ping.

-Dimitry

_______________________________________________
ffmpeg-devel mailing list
ffmpeg-devel@ffmpeg.org
https://ffmpeg.org/mailman/listinfo/ffmpeg-devel

To unsubscribe, visit link above, or email
ffmpeg-devel-request@ffmpeg.org with subject "unsubscribe".

      reply	other threads:[~2025-07-02 12:05 UTC|newest]

Thread overview: 8+ messages / expand[flat|nested]  mbox.gz  Atom feed  top
2025-04-03 20:02 Dimitry Andric
2025-04-10  9:03 ` Dimitry Andric
2025-04-19 14:27   ` Dimitry Andric
2025-04-28 11:00     ` Dimitry Andric
2025-05-08 22:14       ` Dimitry Andric
2025-05-08 22:15         ` James Almer
2025-05-31 18:16           ` Dimitry Andric
2025-07-02 12:05             ` Dimitry Andric [this message]

Reply instructions:

You may reply publicly to this message via plain-text email
using any one of the following methods:

* Save the following mbox file, import it into your mail client,
  and reply-to-all from there: mbox

  Avoid top-posting and favor interleaved quoting:
  https://en.wikipedia.org/wiki/Posting_style#Interleaved_style

* Reply using the --to, --cc, and --in-reply-to
  switches of git-send-email(1):

  git send-email \
    --in-reply-to=A10752E2-8E5A-4CF6-A3A4-F8B3B9B8D4F4@unified-streaming.com \
    --to=dimitry@unified-streaming.com \
    --cc=ffmpeg-devel@ffmpeg.org \
    /path/to/YOUR_REPLY

  https://kernel.org/pub/software/scm/git/docs/git-send-email.html

* If your mail client supports setting the In-Reply-To header
  via mailto: links, try the mailto: link

Git Inbox Mirror of the ffmpeg-devel mailing list - see https://ffmpeg.org/mailman/listinfo/ffmpeg-devel

This inbox may be cloned and mirrored by anyone:

	git clone --mirror https://master.gitmailbox.com/ffmpegdev/0 ffmpegdev/git/0.git

	# If you have public-inbox 1.1+ installed, you may
	# initialize and index your mirror using the following commands:
	public-inbox-init -V2 ffmpegdev ffmpegdev/ https://master.gitmailbox.com/ffmpegdev \
		ffmpegdev@gitmailbox.com
	public-inbox-index ffmpegdev

Example config snippet for mirrors.


AGPL code for this site: git clone https://public-inbox.org/public-inbox.git