From: Andreas Rheinhardt <andreas.rheinhardt@outlook.com>
To: ffmpeg-devel@ffmpeg.org
Subject: Re: [FFmpeg-devel] [PATCH 2/2] libfdk-aacdec: Flush delayed samples at the end
Date: Fri, 21 Jan 2022 15:42:36 +0100
Message-ID: <AM7PR03MB666089896D949B4855DDAB428F5B9@AM7PR03MB6660.eurprd03.prod.outlook.com> (raw)
In-Reply-To: <4cf21020-5cdf-6532-f6fb-3995ba1f3d78@martin.st>
Martin Storsjö:
> On Fri, 21 Jan 2022, Andreas Rheinhardt wrote:
>
>> Martin Storsjö:
>>> Also trim off delay samples at the start instead of adjusting pts
>>> to compensate for them; this avoids unwanted offsets if working
>>> with raw samples without considering their pts.
>>> ---
>>> libavcodec/libfdk-aacdec.c | 80 +++++++++++++++++++++++++++++++-------
>>> 1 file changed, 65 insertions(+), 15 deletions(-)
>>>
>>> diff --git a/libavcodec/libfdk-aacdec.c b/libavcodec/libfdk-aacdec.c
>>> index 93b52023b0..d560e313ca 100644
>>> --- a/libavcodec/libfdk-aacdec.c
>>> +++ b/libavcodec/libfdk-aacdec.c
>>> @@ -58,7 +58,11 @@ typedef struct FDKAACDecContext {
>>> int drc_cut;
>>> int album_mode;
>>> int level_limit;
>>> - int output_delay;
>>> +#if FDKDEC_VER_AT_LEAST(2, 5) // 2.5.10
>>> + int output_delay_set;
>>> + int flush_samples;
>>> + int delay_samples;
>>> +#endif
>>> } FDKAACDecContext;
>>>
>>>
>>> @@ -123,7 +127,12 @@ static int get_stream_info(AVCodecContext *avctx)
>>> avctx->sample_rate = info->sampleRate;
>>> avctx->frame_size = info->frameSize;
>>> #if FDKDEC_VER_AT_LEAST(2, 5) // 2.5.10
>>> - s->output_delay = info->outputDelay;
>>> + if (!s->output_delay_set && info->outputDelay) {
>>> + // Set this only once.
>>> + s->flush_samples = info->outputDelay;
>>> + s->delay_samples = info->outputDelay;
>>> + s->output_delay_set = 1;
>>> + }
>>> #endif
>>>
>>> for (i = 0; i < info->numChannels; i++) {
>>> @@ -367,14 +376,31 @@ static int fdk_aac_decode_frame(AVCodecContext
>>> *avctx, void *data,
>>> int ret;
>>> AAC_DECODER_ERROR err;
>>> UINT valid = avpkt->size;
>>> + UINT flags = 0;
>>> + int input_offset = 0;
>>>
>>> - err = aacDecoder_Fill(s->handle, &avpkt->data, &avpkt->size,
>>> &valid);
>>> - if (err != AAC_DEC_OK) {
>>> - av_log(avctx, AV_LOG_ERROR, "aacDecoder_Fill() failed:
>>> %x\n", err);
>>> - return AVERROR_INVALIDDATA;
>>> + if (avpkt->size) {
>>> + err = aacDecoder_Fill(s->handle, &avpkt->data, &avpkt->size,
>>> &valid);
>>> + if (err != AAC_DEC_OK) {
>>> + av_log(avctx, AV_LOG_ERROR, "aacDecoder_Fill() failed:
>>> %x\n", err);
>>> + return AVERROR_INVALIDDATA;
>>> + }
>>> + } else {
>>> +#if FDKDEC_VER_AT_LEAST(2, 5) // 2.5.10
>>> + /* Handle decoder draining */
>>> + if (s->flush_samples > 0) {
>>> + flags |= AACDEC_FLUSH;
>>> + } else {
>>> + return AVERROR_EOF;
>>> + }
>>> +#else
>>> + return AVERROR_EOF;
>>> +#endif
>>> }
>>>
>>> - err = aacDecoder_DecodeFrame(s->handle, (INT_PCM *)
>>> s->decoder_buffer, s->decoder_buffer_size / sizeof(INT_PCM), 0);
>>> + err = aacDecoder_DecodeFrame(s->handle, (INT_PCM *)
>>> s->decoder_buffer,
>>> + s->decoder_buffer_size /
>>> sizeof(INT_PCM),
>>> + flags);
>>> if (err == AAC_DEC_NOT_ENOUGH_BITS) {
>>> ret = avpkt->size - valid;
>>> goto end;
>>> @@ -390,16 +416,36 @@ static int fdk_aac_decode_frame(AVCodecContext
>>> *avctx, void *data,
>>> goto end;
>>> frame->nb_samples = avctx->frame_size;
>>>
>>> +#if FDKDEC_VER_AT_LEAST(2, 5) // 2.5.10
>>> + if (flags & AACDEC_FLUSH) {
>>> + // Only return the right amount of samples at the end; if
>>> calling the
>>> + // decoder with AACDEC_FLUSH, it will keep returning frames
>>> indefinitely.
>>> + frame->nb_samples = FFMIN(s->flush_samples, frame->nb_samples);
>>> + av_log(s, AV_LOG_DEBUG, "Returning %d/%d delayed samples.\n",
>>> + frame->nb_samples, s->flush_samples);
>>> + s->flush_samples -= frame->nb_samples;
>>> + } else {
>>> + // Trim off samples from the start to compensate for extra
>>> decoder
>>> + // delay. We could also just adjust the pts, but this avoids
>>> + // including the extra samples in the output altogether.
>>> + if (s->delay_samples) {
>>> + int drop_samples = FFMIN(s->delay_samples,
>>> frame->nb_samples);
>>> + av_log(s, AV_LOG_DEBUG, "Dropping %d/%d delayed
>>> samples.\n",
>>> + drop_samples, s->delay_samples);
>>> + s->delay_samples -= drop_samples;
>>> + frame->nb_samples -= drop_samples;
>>> + input_offset = drop_samples * avctx->channels;
>>> + if (frame->nb_samples <= 0)
>>> + return 0;
>>> + }
>>> + }
>>> +#endif
>>> +
>>> if ((ret = ff_get_buffer(avctx, frame, 0)) < 0)
>>> goto end;
>>>
>>> - if (frame->pts != AV_NOPTS_VALUE)
>>> - frame->pts -= av_rescale_q(s->output_delay,
>>> - (AVRational){1, avctx->sample_rate},
>>> - avctx->time_base);
>>> -
>>> - memcpy(frame->extended_data[0], s->decoder_buffer,
>>> - avctx->channels * avctx->frame_size *
>>> + memcpy(frame->extended_data[0], s->decoder_buffer + input_offset,
>>> + avctx->channels * frame->nb_samples *
>>> av_get_bytes_per_sample(avctx->sample_fmt));
>>>
>>> *got_frame_ptr = 1;
>>> @@ -432,7 +478,11 @@ const AVCodec ff_libfdk_aac_decoder = {
>>> .decode = fdk_aac_decode_frame,
>>> .close = fdk_aac_decode_close,
>>> .flush = fdk_aac_decode_flush,
>>> - .capabilities = AV_CODEC_CAP_DR1 | AV_CODEC_CAP_CHANNEL_CONF,
>>> + .capabilities = AV_CODEC_CAP_DR1 | AV_CODEC_CAP_CHANNEL_CONF
>>> +#if FDKDEC_VER_AT_LEAST(2, 5) // 2.5.10
>>> + | AV_CODEC_CAP_DELAY
>>> +#endif
>>> + ,
>>> .priv_class = &fdk_aac_dec_class,
>>> .caps_internal = FF_CODEC_CAP_INIT_THREADSAFE |
>>> FF_CODEC_CAP_INIT_CLEANUP,
>>>
>>
>> When I use the libfdk-aac decoder I get the exact number of samples like
>> with the native aac decoder (namely number of frames * 1024, as
>> expected). What makes you believe this is necessary?
>
> The fdk-aac decoder can have, depending on combination of options, some
> amount of extra internal delay, that the libavcodec internal aac decoder
> doesn't have. (It's also possible to set the options in a state where
> the fdk-aac decoder doesn't induce any extra delay.)
>
> Currently, we compensate for that extra delay by just offsetting pts
> backwards, so for a stream with N packets, we return samples with
> timestamps [-delay,N*framesize-delay].
>
> In order not to lose data at the end, we must make the decoder flushable
> and flush up to (delay) samples at the end. And since one doesn't
> normally expect extra delay samples at the start of an AAC decoder
> output, we also trim out the same amount of samples at the start (to
> simplify for users that don't observe the pts, who otherwise are
> surprised by the stream starting from pts -delay instead of at pts 0).
>
Interesting: There is indeed a delay at the start (720 samples in a
quick test) compared to the native AAC decoder.
Furthermore, the current code is buggy, as it believes that
avcodec->time_base to be the time_base of the returned AVFrames (it is
in reality avcodec->pkt_timebase; just test with AAC-in-Matroska for this).
I haven't tested your patches, but I have now realized that there is
indeed an issue. And your patch should also fix the wrong timebase issue.
- Andreas
_______________________________________________
ffmpeg-devel mailing list
ffmpeg-devel@ffmpeg.org
https://ffmpeg.org/mailman/listinfo/ffmpeg-devel
To unsubscribe, visit link above, or email
ffmpeg-devel-request@ffmpeg.org with subject "unsubscribe".
next prev parent reply other threads:[~2022-01-21 14:42 UTC|newest]
Thread overview: 6+ messages / expand[flat|nested] mbox.gz Atom feed top
2022-01-19 20:38 [FFmpeg-devel] [PATCH 1/2] libfdk-aacdec: Add an option for setting the decoder's DRC album mode Martin Storsjö
2022-01-19 20:38 ` [FFmpeg-devel] [PATCH 2/2] libfdk-aacdec: Flush delayed samples at the end Martin Storsjö
2022-01-21 13:00 ` Andreas Rheinhardt
2022-01-21 13:58 ` Martin Storsjö
2022-01-21 14:42 ` Andreas Rheinhardt [this message]
2022-02-03 11:53 ` Martin Storsjö
Reply instructions:
You may reply publicly to this message via plain-text email
using any one of the following methods:
* Save the following mbox file, import it into your mail client,
and reply-to-all from there: mbox
Avoid top-posting and favor interleaved quoting:
https://en.wikipedia.org/wiki/Posting_style#Interleaved_style
* Reply using the --to, --cc, and --in-reply-to
switches of git-send-email(1):
git send-email \
--in-reply-to=AM7PR03MB666089896D949B4855DDAB428F5B9@AM7PR03MB6660.eurprd03.prod.outlook.com \
--to=andreas.rheinhardt@outlook.com \
--cc=ffmpeg-devel@ffmpeg.org \
/path/to/YOUR_REPLY
https://kernel.org/pub/software/scm/git/docs/git-send-email.html
* If your mail client supports setting the In-Reply-To header
via mailto: links, try the mailto: link
Git Inbox Mirror of the ffmpeg-devel mailing list - see https://ffmpeg.org/mailman/listinfo/ffmpeg-devel
This inbox may be cloned and mirrored by anyone:
git clone --mirror https://master.gitmailbox.com/ffmpegdev/0 ffmpegdev/git/0.git
# If you have public-inbox 1.1+ installed, you may
# initialize and index your mirror using the following commands:
public-inbox-init -V2 ffmpegdev ffmpegdev/ https://master.gitmailbox.com/ffmpegdev \
ffmpegdev@gitmailbox.com
public-inbox-index ffmpegdev
Example config snippet for mirrors.
AGPL code for this site: git clone https://public-inbox.org/public-inbox.git