From: Vittorio Palmisano via ffmpeg-devel <ffmpeg-devel@ffmpeg.org> To: ffmpeg-devel@ffmpeg.org Cc: Vittorio Palmisano <code@ffmpeg.org> Subject: [FFmpeg-devel] [PATCH] avfilter/af_whisper: fix srt index and int64 printf format (PR #20566) Date: Sun, 21 Sep 2025 13:24:20 -0000 Message-ID: <175846106087.25.12870891924088260781@463a07221176> (raw) PR #20566 opened by Vittorio Palmisano (vpalmisano) URL: https://code.ffmpeg.org/FFmpeg/FFmpeg/pulls/20566 Patch URL: https://code.ffmpeg.org/FFmpeg/FFmpeg/pulls/20566.patch avfilter/af_whisper: fix srt index and int64 printf format - Use PRId64 for printing int64_t values in the SRT output. - Increment the subtitle index correctly for each segment. From 8349df829eb64e972c0d58d622d4648a93cd27ef Mon Sep 17 00:00:00 2001 From: Vittorio Palmisano <vpalmisano@gmail.com> Date: Sun, 21 Sep 2025 15:19:51 +0200 Subject: [PATCH] avfilter/af_whisper: fix srt index and int64 printf format - Use PRId64 for printing int64_t values in the SRT output. - Increment the subtitle index correctly for each segment. 
--- libavfilter/af_whisper.c | 14 +++++++------- 1 file changed, 7 insertions(+), 7 deletions(-) diff --git a/libavfilter/af_whisper.c b/libavfilter/af_whisper.c index 663fe446bb..4d61cc0c9a 100644 --- a/libavfilter/af_whisper.c +++ b/libavfilter/af_whisper.c @@ -150,7 +150,7 @@ static int init(AVFilterContext *ctx) } av_log(ctx, AV_LOG_INFO, - "Whisper filter initialized: model: %s lang: %s queue: %ld ms\n", + "Whisper filter initialized: model: %s lang: %s queue: %" PRId64 " ms\n", wctx->model_path, wctx->language, wctx->queue / 1000); return 0; @@ -194,7 +194,7 @@ static void run_transcription(AVFilterContext *ctx, AVFrame *frame, int samples) const float duration = (float) samples / WHISPER_SAMPLE_RATE; av_log(ctx, AV_LOG_INFO, - "run transcription at %ld ms, %d/%d samples (%.2f seconds)...\n", + "run transcription at %" PRId64 " ms, %d/%d samples (%.2f seconds)...\n", timestamp_ms, samples, wctx->audio_buffer_fill_size, duration); struct whisper_full_params params = whisper_full_default_params(WHISPER_SAMPLING_GREEDY); @@ -228,7 +228,7 @@ static void run_transcription(AVFilterContext *ctx, AVFrame *frame, int samples) const int64_t t0_ms = whisper_full_get_segment_t0(wctx->ctx_wsp, i) * 10; const int64_t t1_ms = whisper_full_get_segment_t1(wctx->ctx_wsp, i) * 10; - av_log(ctx, AV_LOG_DEBUG, " [%ld-%ld%s]: \"%s\"\n", + av_log(ctx, AV_LOG_DEBUG, " [%" PRId64 "-%" PRId64 "%s]: \"%s\"\n", timestamp_ms + t0_ms, timestamp_ms + t1_ms, turn ? 
" (turn)" : "", text_cleaned); if (segments_text) { @@ -246,13 +246,13 @@ static void run_transcription(AVFilterContext *ctx, AVFrame *frame, int samples) if (!av_strcasecmp(wctx->format, "srt")) { buf = av_asprintf - ("%d\n%02ld:%02ld:%02ld,%03ld --> %02ld:%02ld:%02ld,%03ld\n%s\n\n", + ("%d\n%02" PRId64 ":%02" PRId64 ":%02" PRId64 ",%03" PRId64 " --> %02" PRId64 ":%02" PRId64 ":%02" PRId64 ",%03" PRId64 "\n%s\n\n", wctx->index, start_t / 3600000, (start_t / 60000) % 60, (start_t / 1000) % 60, start_t % 1000, end_t / 3600000, (end_t / 60000) % 60, (end_t / 1000) % 60, end_t % 1000, text_cleaned); } else if (!av_strcasecmp(wctx->format, "json")) { - buf = av_asprintf("{\"start\":%ld,\"end\":%ld,\"text\":\"%s\"}\n", start_t, end_t, text_cleaned); + buf = av_asprintf("{\"start\":%" PRId64 ",\"end\":%" PRId64 ",\"text\":\"%s\"}\n", start_t, end_t, text_cleaned); } else buf = av_strdup(text_cleaned); @@ -260,13 +260,13 @@ static void run_transcription(AVFilterContext *ctx, AVFrame *frame, int samples) avio_write(wctx->avio_context, buf, strlen(buf)); av_freep(&buf); } + + wctx->index++; } av_freep(&text_cleaned); } - wctx->index++; - AVDictionary **metadata = &frame->metadata; if (metadata && segments_text) { av_dict_set(metadata, "lavfi.whisper.text", segments_text, 0); -- 2.49.1 _______________________________________________ ffmpeg-devel mailing list -- ffmpeg-devel@ffmpeg.org To unsubscribe send an email to ffmpeg-devel-leave@ffmpeg.org
reply other threads:[~2025-09-21 13:25 UTC|newest] Thread overview: [no followups] expand[flat|nested] mbox.gz Atom feed
Reply instructions:

You may reply publicly to this message via plain-text email using any one of the following methods:

* Save the following mbox file, import it into your mail client, and reply-to-all from there: mbox

  Avoid top-posting and favor interleaved quoting: https://en.wikipedia.org/wiki/Posting_style#Interleaved_style

* Reply using the --to, --cc, and --in-reply-to switches of git-send-email(1):

  git send-email \
    --in-reply-to=175846106087.25.12870891924088260781@463a07221176 \
    --to=ffmpeg-devel@ffmpeg.org \
    --cc=code@ffmpeg.org \
    /path/to/YOUR_REPLY

  https://kernel.org/pub/software/scm/git/docs/git-send-email.html

* If your mail client supports setting the In-Reply-To header via mailto: links, try the mailto: link
Git Inbox Mirror of the ffmpeg-devel mailing list - see https://ffmpeg.org/mailman/listinfo/ffmpeg-devel

This inbox may be cloned and mirrored by anyone:

  git clone --mirror https://master.gitmailbox.com/ffmpegdev/0 ffmpegdev/git/0.git

  # If you have public-inbox 1.1+ installed, you may
  # initialize and index your mirror using the following commands:
  public-inbox-init -V2 ffmpegdev ffmpegdev/ https://master.gitmailbox.com/ffmpegdev \
    ffmpegdev@gitmailbox.com
  public-inbox-index ffmpegdev

Example config snippet for mirrors.

AGPL code for this site: git clone https://public-inbox.org/public-inbox.git