From: Roy Funderburk <royffmpeg@funderburk.us> To: FFmpeg development discussions and patches <ffmpeg-devel@ffmpeg.org>, Michael Niedermayer <michael@niedermayer.cc> Subject: Re: [FFmpeg-devel] [PATCH v3 2/2] avformat/avcodec: Add DTS-UHD demuxer and parser, movenc support. Date: Sun, 16 Apr 2023 21:13:35 -0700 Message-ID: <080aed51-b15f-763b-6448-3f0ad2a52a4f@funderburk.us> (raw) In-Reply-To: <20230416195546.GG275832@pb2> Demuxing of DTS-UHD input files per ETSI TS 102 114 is added as demuxer "dtsuhd". movenc supports DTS-UHD audio track. Signed-off-by: Roy Funderburk <Roy.Funderburk@xperi.com> --- Changelog | 1 + configure | 1 + doc/general_contents.texi | 1 + libavformat/Makefile | 1 + libavformat/allformats.c | 1 + libavformat/dtshddec.c | 2 +- libavformat/dtsuhddec.c | 216 ++++++++++++++++++++++++++++++++++++++ libavformat/movenc.c | 32 ++++++ libavformat/version.h | 2 +- 9 files changed, 255 insertions(+), 2 deletions(-) create mode 100644 libavformat/dtsuhddec.c diff --git a/Changelog b/Changelog index a40f32c23f..f683b49bb2 100644 --- a/Changelog +++ b/Changelog @@ -3,6 +3,7 @@ releases are sorted from youngest to oldest. 
version <next>: - libaribcaption decoder +- DTS-UHD demuxer version 6.0: - Radiance HDR image support diff --git a/configure b/configure index 033db7442d..557821ceef 100755 --- a/configure +++ b/configure @@ -3425,6 +3425,7 @@ dash_demuxer_deps="libxml2" dirac_demuxer_select="dirac_parser" dts_demuxer_select="dca_parser" dtshd_demuxer_select="dca_parser" +dtsuhd_demuxer_select="dtsuhd_parser" dv_demuxer_select="dvprofile" dv_muxer_select="dvprofile" dxa_demuxer_select="riffdec" diff --git a/doc/general_contents.texi b/doc/general_contents.texi index 2eeebd847d..e1ba9c4597 100644 --- a/doc/general_contents.texi +++ b/doc/general_contents.texi @@ -597,6 +597,7 @@ library: @item raw DNxHD @tab X @tab X @item raw DTS @tab X @tab X @item raw DTS-HD @tab @tab X +@item raw DTS-UHD @tab @tab X @item raw E-AC-3 @tab X @tab X @item raw FLAC @tab X @tab X @item raw GSM @tab @tab X diff --git a/libavformat/Makefile b/libavformat/Makefile index 048649689b..42cf19348f 100644 --- a/libavformat/Makefile +++ b/libavformat/Makefile @@ -186,6 +186,7 @@ OBJS-$(CONFIG_DSICIN_DEMUXER) += dsicin.o OBJS-$(CONFIG_DSS_DEMUXER) += dss.o OBJS-$(CONFIG_DTSHD_DEMUXER) += dtshddec.o OBJS-$(CONFIG_DTS_DEMUXER) += dtsdec.o rawdec.o +OBJS-$(CONFIG_DTSUHD_DEMUXER) += dtsuhddec.o OBJS-$(CONFIG_DTS_MUXER) += rawenc.o OBJS-$(CONFIG_DV_MUXER) += dvenc.o OBJS-$(CONFIG_DVBSUB_DEMUXER) += dvbsub.o rawdec.o diff --git a/libavformat/allformats.c b/libavformat/allformats.c index cb5b69e9cd..1b48ce6073 100644 --- a/libavformat/allformats.c +++ b/libavformat/allformats.c @@ -144,6 +144,7 @@ extern const AVInputFormat ff_dss_demuxer; extern const AVInputFormat ff_dts_demuxer; extern const FFOutputFormat ff_dts_muxer; extern const AVInputFormat ff_dtshd_demuxer; +extern const AVInputFormat ff_dtsuhd_demuxer; extern const AVInputFormat ff_dv_demuxer; extern const FFOutputFormat ff_dv_muxer; extern const AVInputFormat ff_dvbsub_demuxer; diff --git a/libavformat/dtshddec.c b/libavformat/dtshddec.c index 
a3dea0668f..6e9e78a335 100644 --- a/libavformat/dtshddec.c +++ b/libavformat/dtshddec.c @@ -46,7 +46,7 @@ typedef struct DTSHDDemuxContext { static int dtshd_probe(const AVProbeData *p) { if (AV_RB64(p->buf) == DTSHDHDR) - return AVPROBE_SCORE_MAX; + return AVPROBE_SCORE_MAX - 4; // DTSUHD (.dtsx) files also have this signature. return 0; } diff --git a/libavformat/dtsuhddec.c b/libavformat/dtsuhddec.c new file mode 100644 index 0000000000..d840c0a033 --- /dev/null +++ b/libavformat/dtsuhddec.c @@ -0,0 +1,216 @@ +/* + * DTS-UHD audio demuxer + * Copyright (c) 2023 Xperi Corporation / DTS, Inc. + * + * This file is part of FFmpeg. + * + * FFmpeg is free software; you can redistribute it and/or + * modify it under the terms of the GNU Lesser General Public + * License as published by the Free Software Foundation; either + * version 2.1 of the License, or (at your option) any later version. + * + * FFmpeg is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU + * Lesser General Public License for more details. + * + * You should have received a copy of the GNU Lesser General Public + * License along with FFmpeg; if not, write to the Free Software + * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA + */ + +/** + * @file + * Report DTS-UHD audio stream configuration and extract raw packet data. 
+ */ + +#include "internal.h" +#include "libavcodec/dtsuhd_common.h" +#include "libavcodec/put_bits.h" +#include "libavutil/intreadwrite.h" + +#define DTSUHD_BUFFER_SIZE (1024 * 1024) + +typedef struct DTSUHDDemuxContext { + size_t data_end; + struct DTSUHD *dtsuhd; + uint8_t *buf; +} DTSUHDDemuxContext; + +static int probe(const AVProbeData *p) +{ + int offset = av_dtsuhd_strmdata_payload(p->buf, p->buf_size, NULL); + int score = 0; + struct DTSUHD *h = av_dtsuhd_create(); + + if (h && offset >= 0) { + for (; offset + 4 < p->buf_size; offset++) { + if (dtsuhd_is_syncword(AV_RB32(p->buf + offset))) { + if (DTSUHD_OK == av_dtsuhd_frame(h, p->buf + offset, p->buf_size - offset, NULL, NULL)) { + score = AVPROBE_SCORE_MAX - 3; + break; + } + } + } + } + + av_dtsuhd_destroy(h); + return score; +} + +static av_cold int read_close(AVFormatContext *s) +{ + DTSUHDDemuxContext *dtsxs = s->priv_data; + + av_freep(&dtsxs->buf); + av_dtsuhd_destroy(dtsxs->dtsuhd); + dtsxs->dtsuhd = NULL; + + return 0; +} + +static int find_first_syncword(DTSUHDDemuxContext *dtsuhd, int data_start) +{ + while (data_start + 4 < DTSUHD_BUFFER_SIZE && + !dtsuhd_is_syncword(AV_RB32(dtsuhd->buf + data_start))) { + data_start++; + } + + return data_start; +} + +static int write_extradata(AVCodecParameters *par, DTSUHDDescriptorInfo *di) +{ + PutBitContext pbc; + int ret; + int size; + uint8_t udts[32]; + + init_put_bits(&pbc, udts, sizeof(udts)); + put_bits32(&pbc, 0); // udts box size + put_bits32(&pbc, AV_RB32("udts")); // udts box signature + put_bits(&pbc, 6, di->decoder_profile_code); + put_bits(&pbc, 2, di->frame_duration_code); + put_bits(&pbc, 3, di->max_payload_code); + put_bits(&pbc, 5, di->num_pres_code); + put_bits32(&pbc, di->channel_mask); + put_bits(&pbc, 1, di->base_sample_freq_code); + put_bits(&pbc, 2, di->sample_rate_mod); + put_bits(&pbc, 3, di->rep_type); + put_bits(&pbc, 3, 0); + put_bits(&pbc, 1, 0); + put_bits64(&pbc, di->num_pres_code + 1, 0); // ID Tag present for each 
presentation. + flush_put_bits(&pbc); // byte align + size = put_bytes_output(&pbc); + AV_WB32(udts, size); + + ret = ff_alloc_extradata(par, size); + if (ret < 0) + return ret; + + memcpy(par->extradata, udts, size); + + return 0; +} + +static int read_header(AVFormatContext *s) +{ + AVIOContext *pb = s->pb; + AVStream *st = avformat_new_stream(s, NULL); + DTSUHDDemuxContext *dtsuhd = s->priv_data; + DTSUHDDescriptorInfo di; + DTSUHDFrameInfo fi; + int buf_bytes; + int ret = DTSUHD_INVALID_FRAME; + int data_start; + + if (!(pb->seekable & AVIO_SEEKABLE_NORMAL)) + return AVERROR(EIO); + + dtsuhd->buf = av_malloc(DTSUHD_BUFFER_SIZE); + dtsuhd->dtsuhd = av_dtsuhd_create(); + if (!dtsuhd->buf || !dtsuhd->dtsuhd || !st) + return AVERROR(ENOMEM); + + buf_bytes = avio_read(pb, dtsuhd->buf, DTSUHD_BUFFER_SIZE); + if (buf_bytes < 0) + return buf_bytes; + + data_start = av_dtsuhd_strmdata_payload(dtsuhd->buf, buf_bytes, &dtsuhd->data_end); + if (data_start < 0) + return data_start; + + dtsuhd->data_end += data_start; + if (data_start == 0) + dtsuhd->data_end = avio_size(pb); // Not a DTSHDHDR chunk file, decode frames to end of file. + + data_start = find_first_syncword(dtsuhd, data_start); + if (avio_seek(pb, data_start, SEEK_SET) < 0) + return AVERROR(EINVAL); + + ret = av_dtsuhd_frame(dtsuhd->dtsuhd, dtsuhd->buf + data_start, + buf_bytes - data_start, &fi, &di); + if (ret != DTSUHD_OK || !di.valid) { + av_log(s, AV_LOG_ERROR, "Unable to process DTS-UHD file. 
File may be invalid.\n"); + return AVERROR_INVALIDDATA; + } + + ffstream(st)->need_parsing = AVSTREAM_PARSE_FULL_RAW; + st->codecpar->codec_type = AVMEDIA_TYPE_AUDIO; + st->codecpar->codec_id = s->iformat->raw_codec_id; + st->codecpar->ch_layout.order = AV_CHANNEL_ORDER_NATIVE; + st->codecpar->ch_layout.nb_channels = di.channel_count; + st->codecpar->ch_layout.u.mask = di.ffmpeg_channel_mask; + st->codecpar->codec_tag = AV_RL32(di.coding_name); + st->codecpar->frame_size = 512 << di.frame_duration_code; + st->codecpar->sample_rate = di.sample_rate; + +#if FF_API_OLD_CHANNEL_LAYOUT +FF_DISABLE_DEPRECATION_WARNINGS + st->codecpar->channels = di.channel_count; + st->codecpar->channel_layout = di.ffmpeg_channel_mask; +FF_ENABLE_DEPRECATION_WARNINGS +#endif + + ret = write_extradata(st->codecpar, &di); + if (ret < 0) + return ret; + + if (st->codecpar->sample_rate) + avpriv_set_pts_info(st, 64, 1, st->codecpar->sample_rate); + + return 0; +} + +static int read_packet(AVFormatContext *s, AVPacket *pkt) +{ + DTSUHDDemuxContext *dtsuhd = s->priv_data; + int64_t size, left; + int ret; + + left = dtsuhd->data_end - avio_tell(s->pb); + size = FFMIN(left, DTSUHD_MAX_FRAME_SIZE); + if (size <= 0) + return AVERROR_EOF; + + ret = av_get_packet(s->pb, pkt, size); + if (ret < 0) + return ret; + + pkt->stream_index = 0; + + return ret; +} + +AVInputFormat ff_dtsuhd_demuxer = { + .name = "dtsuhd", + .long_name = NULL_IF_CONFIG_SMALL("DTS-UHD"), + .priv_data_size = sizeof(DTSUHDDemuxContext), + .read_probe = probe, + .read_header = read_header, + .read_packet = read_packet, + .read_close = read_close, + .flags = AVFMT_GENERIC_INDEX, + .extensions = "dtsx", + .raw_codec_id = AV_CODEC_ID_DTSUHD, +}; diff --git a/libavformat/movenc.c b/libavformat/movenc.c index c370922c7d..e727407694 100644 --- a/libavformat/movenc.c +++ b/libavformat/movenc.c @@ -762,6 +762,24 @@ static int mov_write_esds_tag(AVIOContext *pb, MOVTrack *track) // Basic return update_size(pb, pos); } +static int 
mov_write_udts_tag(AVIOContext *pb, MOVTrack *track) +{ + if (track->vos_len < 12) { + av_log(pb, AV_LOG_ERROR, + "Cannot write moov atom before DTS-UHD packets." + " Set the delay_moov flag to fix this.\n"); + return AVERROR(EINVAL); + } + + /* Write vos_data if it is a udts box. */ + if (memcmp(track->vos_data + 4, "udts", 4) == 0) { + avio_write(pb, track->vos_data, track->vos_len); + return track->vos_len; + } + + return 0; +} + static int mov_pcm_le_gt16(enum AVCodecID codec_id) { return codec_id == AV_CODEC_ID_PCM_S24LE || @@ -1367,6 +1385,8 @@ static int mov_write_audio_tag(AVFormatContext *s, AVIOContext *pb, MOVMuxContex ret = mov_write_dops_tag(s, pb, track); else if (track->par->codec_id == AV_CODEC_ID_TRUEHD) ret = mov_write_dmlp_tag(s, pb, track); + else if (track->par->codec_id == AV_CODEC_ID_DTSUHD) + ret = mov_write_udts_tag(pb, track); else if (tag == MOV_MP4_IPCM_TAG || tag == MOV_MP4_FPCM_TAG) { if (track->par->ch_layout.nb_channels > 1) ret = mov_write_chnl_tag(s, pb, track); @@ -2781,6 +2801,7 @@ static int mov_write_stbl_tag(AVFormatContext *s, AVIOContext *pb, MOVMuxContext if ((track->par->codec_type == AVMEDIA_TYPE_VIDEO || track->par->codec_id == AV_CODEC_ID_TRUEHD || track->par->codec_id == AV_CODEC_ID_MPEGH_3D_AUDIO || + track->par->codec_id == AV_CODEC_ID_DTSUHD || track->par->codec_tag == MKTAG('r','t','p',' ')) && track->has_keyframes && track->has_keyframes < track->entry) mov_write_stss_tag(pb, track, MOV_SYNC_SAMPLE); @@ -5673,6 +5694,14 @@ static void mov_parse_vc1_frame(AVPacket *pkt, MOVTrack *trk) } } +static void mov_parse_dtsuhd_frame(AVPacket *pkt, MOVTrack *trk) +{ + if (pkt->size > 4 && AV_RB32(pkt->data) == 0x40411BF2) { + trk->cluster[trk->entry].flags |= MOV_SYNC_SAMPLE; + trk->has_keyframes++; + } + } + static void mov_parse_truehd_frame(AVPacket *pkt, MOVTrack *trk) { int length; @@ -6343,6 +6372,8 @@ int ff_mov_write_packet(AVFormatContext *s, AVPacket *pkt) mov_parse_vc1_frame(pkt, trk); } else if (par->codec_id == 
AV_CODEC_ID_TRUEHD) { mov_parse_truehd_frame(pkt, trk); + } else if (par->codec_id == AV_CODEC_ID_DTSUHD) { + mov_parse_dtsuhd_frame(pkt, trk); } else if (pkt->flags & AV_PKT_FLAG_KEY) { if (mov->mode == MODE_MOV && par->codec_id == AV_CODEC_ID_MPEG2VIDEO && trk->entry > 0) { // force sync sample for the first key frame @@ -7800,6 +7831,7 @@ static const AVCodecTag codec_mp4_tags[] = { { AV_CODEC_ID_AC3, MKTAG('a', 'c', '-', '3') }, { AV_CODEC_ID_EAC3, MKTAG('e', 'c', '-', '3') }, { AV_CODEC_ID_DTS, MKTAG('m', 'p', '4', 'a') }, + { AV_CODEC_ID_DTSUHD, MKTAG('d', 't', 's', 'x') }, { AV_CODEC_ID_TRUEHD, MKTAG('m', 'l', 'p', 'a') }, { AV_CODEC_ID_FLAC, MKTAG('f', 'L', 'a', 'C') }, { AV_CODEC_ID_OPUS, MKTAG('O', 'p', 'u', 's') }, diff --git a/libavformat/version.h b/libavformat/version.h index cc56b7cf5c..384cbd49cc 100644 --- a/libavformat/version.h +++ b/libavformat/version.h @@ -31,7 +31,7 @@ #include "version_major.h" -#define LIBAVFORMAT_VERSION_MINOR 4 +#define LIBAVFORMAT_VERSION_MINOR 5 #define LIBAVFORMAT_VERSION_MICRO 101 #define LIBAVFORMAT_VERSION_INT AV_VERSION_INT(LIBAVFORMAT_VERSION_MAJOR, \ -- 2.17.1 _______________________________________________ ffmpeg-devel mailing list ffmpeg-devel@ffmpeg.org https://ffmpeg.org/mailman/listinfo/ffmpeg-devel To unsubscribe, visit link above, or email ffmpeg-devel-request@ffmpeg.org with subject "unsubscribe".
next prev parent reply other threads:[~2023-04-17 4:14 UTC|newest] Thread overview: 37+ messages / expand[flat|nested] mbox.gz Atom feed top 2023-04-14 15:39 [FFmpeg-devel] [PATCH] " Roy Funderburk 2023-04-14 16:40 ` Hendrik Leppkes 2023-04-14 16:48 ` Roy Funderburk 2023-04-15 14:56 ` Michael Niedermayer 2023-04-15 20:04 ` [FFmpeg-devel] [PATCH v2] " Roy Funderburk 2023-04-16 19:55 ` Michael Niedermayer 2023-04-16 21:52 ` Roy Funderburk 2023-04-17 4:12 ` [FFmpeg-devel] [PATCH v3 1/2] " Roy Funderburk 2023-05-08 17:49 ` Roy Funderburk 2023-05-13 7:28 ` Paul B Mahol 2023-05-15 14:50 ` Roy Funderburk 2023-05-15 20:35 ` Michael Niedermayer 2023-05-15 21:14 ` Roy Funderburk 2023-06-13 14:26 ` Paul B Mahol 2023-06-13 17:43 ` Roy Funderburk 2023-06-13 18:09 ` Paul B Mahol 2023-06-13 18:20 ` Roy Funderburk 2023-06-13 19:04 ` Anton Khirnov 2023-04-17 4:13 ` Roy Funderburk [this message] 2023-06-13 18:32 ` [FFmpeg-devel] [PATCH v3 2/2] " Paul B Mahol 2023-04-15 20:20 ` [FFmpeg-devel] [PATCH] " Roy Funderburk 2023-06-13 18:35 ` Paul B Mahol 2023-06-14 0:00 ` Roy Funderburk 2023-06-14 5:37 ` Paul B Mahol 2023-06-14 6:01 ` Paul B Mahol 2023-06-14 6:06 ` Paul B Mahol 2023-06-14 6:11 ` Paul B Mahol 2023-06-14 18:24 ` Roy Funderburk 2023-06-14 20:01 ` Roy Funderburk 2023-06-15 15:46 ` Paul B Mahol 2023-06-15 18:44 ` Roy Funderburk 2023-06-18 12:18 ` Paul B Mahol 2023-06-20 17:05 ` Roy Funderburk 2023-08-17 21:47 ` Roy Funderburk 2023-08-17 22:31 ` Paul B Mahol 2023-08-17 22:51 ` Roy Funderburk 2024-01-16 21:02 ` Roy Funderburk
Reply instructions: You may reply publicly to this message via plain-text email using any one of the following methods: * Save the following mbox file, import it into your mail client, and reply-to-all from there: mbox Avoid top-posting and favor interleaved quoting: https://en.wikipedia.org/wiki/Posting_style#Interleaved_style * Reply using the --to, --cc, and --in-reply-to switches of git-send-email(1): git send-email \ --in-reply-to=080aed51-b15f-763b-6448-3f0ad2a52a4f@funderburk.us \ --to=royffmpeg@funderburk.us \ --cc=ffmpeg-devel@ffmpeg.org \ --cc=michael@niedermayer.cc \ /path/to/YOUR_REPLY https://kernel.org/pub/software/scm/git/docs/git-send-email.html * If your mail client supports setting the In-Reply-To header via mailto: links, try the mailto: link
Git Inbox Mirror of the ffmpeg-devel mailing list - see https://ffmpeg.org/mailman/listinfo/ffmpeg-devel This inbox may be cloned and mirrored by anyone: git clone --mirror https://master.gitmailbox.com/ffmpegdev/0 ffmpegdev/git/0.git # If you have public-inbox 1.1+ installed, you may # initialize and index your mirror using the following commands: public-inbox-init -V2 ffmpegdev ffmpegdev/ https://master.gitmailbox.com/ffmpegdev \ ffmpegdev@gitmailbox.com public-inbox-index ffmpegdev Example config snippet for mirrors. AGPL code for this site: git clone https://public-inbox.org/public-inbox.git