[FFmpeg-devel] [PATCH v3 2/2] avformat/avcodec: Add DTS-UHD demuxer and parser, movenc support.
Paul B Mahol
onemda at gmail.com
Tue Jun 13 21:32:18 EEST 2023
On Mon, Apr 17, 2023 at 6:14 AM Roy Funderburk <royffmpeg at funderburk.us>
wrote:
> Demuxing of DTS-UHD input files per ETSI TS 102 114 is added as
> demuxer "dtsuhd". movenc supports DTS-UHD audio track.
>
> Signed-off-by: Roy Funderburk <Roy.Funderburk at xperi.com>
> ---
> Changelog | 1 +
> configure | 1 +
> doc/general_contents.texi | 1 +
> libavformat/Makefile | 1 +
> libavformat/allformats.c | 1 +
> libavformat/dtshddec.c | 2 +-
> libavformat/dtsuhddec.c | 216 ++++++++++++++++++++++++++++++++++++++
> libavformat/movenc.c | 32 ++++++
> libavformat/version.h | 2 +-
> 9 files changed, 255 insertions(+), 2 deletions(-)
> create mode 100644 libavformat/dtsuhddec.c
>
> diff --git a/Changelog b/Changelog
> index a40f32c23f..f683b49bb2 100644
> --- a/Changelog
> +++ b/Changelog
> @@ -3,6 +3,7 @@ releases are sorted from youngest to oldest.
>
> version <next>:
> - libaribcaption decoder
> +- DTS-UHD demuxer
>
> version 6.0:
> - Radiance HDR image support
> diff --git a/configure b/configure
> index 033db7442d..557821ceef 100755
> --- a/configure
> +++ b/configure
> @@ -3425,6 +3425,7 @@ dash_demuxer_deps="libxml2"
> dirac_demuxer_select="dirac_parser"
> dts_demuxer_select="dca_parser"
> dtshd_demuxer_select="dca_parser"
> +dtsuhd_demuxer_select="dtsuhd_parser"
> dv_demuxer_select="dvprofile"
> dv_muxer_select="dvprofile"
> dxa_demuxer_select="riffdec"
> diff --git a/doc/general_contents.texi b/doc/general_contents.texi
> index 2eeebd847d..e1ba9c4597 100644
> --- a/doc/general_contents.texi
> +++ b/doc/general_contents.texi
> @@ -597,6 +597,7 @@ library:
> @item raw DNxHD @tab X @tab X
> @item raw DTS @tab X @tab X
> @item raw DTS-HD @tab @tab X
> +@item raw DTS-UHD @tab @tab
> @item raw E-AC-3 @tab X @tab X
> @item raw FLAC @tab X @tab X
> @item raw GSM @tab @tab X
> diff --git a/libavformat/Makefile b/libavformat/Makefile
> index 048649689b..42cf19348f 100644
> --- a/libavformat/Makefile
> +++ b/libavformat/Makefile
> @@ -186,6 +186,7 @@ OBJS-$(CONFIG_DSICIN_DEMUXER) += dsicin.o
> OBJS-$(CONFIG_DSS_DEMUXER) += dss.o
> OBJS-$(CONFIG_DTSHD_DEMUXER) += dtshddec.o
> OBJS-$(CONFIG_DTS_DEMUXER) += dtsdec.o rawdec.o
> +OBJS-$(CONFIG_DTSUHD_DEMUXER) += dtsuhddec.o
> OBJS-$(CONFIG_DTS_MUXER) += rawenc.o
> OBJS-$(CONFIG_DV_MUXER) += dvenc.o
> OBJS-$(CONFIG_DVBSUB_DEMUXER) += dvbsub.o rawdec.o
> diff --git a/libavformat/allformats.c b/libavformat/allformats.c
> index cb5b69e9cd..1b48ce6073 100644
> --- a/libavformat/allformats.c
> +++ b/libavformat/allformats.c
> @@ -144,6 +144,7 @@ extern const AVInputFormat ff_dss_demuxer;
> extern const AVInputFormat ff_dts_demuxer;
> extern const FFOutputFormat ff_dts_muxer;
> extern const AVInputFormat ff_dtshd_demuxer;
> +extern const AVInputFormat ff_dtsuhd_demuxer;
> extern const AVInputFormat ff_dv_demuxer;
> extern const FFOutputFormat ff_dv_muxer;
> extern const AVInputFormat ff_dvbsub_demuxer;
> diff --git a/libavformat/dtshddec.c b/libavformat/dtshddec.c
> index a3dea0668f..6e9e78a335 100644
> --- a/libavformat/dtshddec.c
> +++ b/libavformat/dtshddec.c
> @@ -46,7 +46,7 @@ typedef struct DTSHDDemuxContext {
> static int dtshd_probe(const AVProbeData *p)
> {
> if (AV_RB64(p->buf) == DTSHDHDR)
> - return AVPROBE_SCORE_MAX;
> + return AVPROBE_SCORE_MAX - 4; // DTSUHD (.dtsx) files also have this signature.
> return 0;
> }
>
> diff --git a/libavformat/dtsuhddec.c b/libavformat/dtsuhddec.c
> new file mode 100644
> index 0000000000..d840c0a033
> --- /dev/null
> +++ b/libavformat/dtsuhddec.c
> @@ -0,0 +1,216 @@
> +/*
> + * DTS-UHD audio demuxer
> + * Copyright (c) 2023 Xperi Corporation / DTS, Inc.
> + *
> + * This file is part of FFmpeg.
> + *
> + * FFmpeg is free software; you can redistribute it and/or
> + * modify it under the terms of the GNU Lesser General Public
> + * License as published by the Free Software Foundation; either
> + * version 2.1 of the License, or (at your option) any later version.
> + *
> + * FFmpeg is distributed in the hope that it will be useful,
> + * but WITHOUT ANY WARRANTY; without even the implied warranty of
> + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
> + * Lesser General Public License for more details.
> + *
> + * You should have received a copy of the GNU Lesser General Public
> + * License along with FFmpeg; if not, write to the Free Software
> + * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
> + */
> +
> +/**
> + * @file
> + * Report DTS-UHD audio stream configuration and extract raw packet data.
> + */
> +
> +#include "internal.h"
> +#include "libavcodec/dtsuhd_common.h"
> +#include "libavcodec/put_bits.h"
> +#include "libavutil/intreadwrite.h"
> +
> +#define DTSUHD_BUFFER_SIZE (1024 * 1024)
> +
> +typedef struct DTSUHDDemuxContext {
> + size_t data_end;
> + struct DTSUHD *dtsuhd;
> + uint8_t *buf;
> +} DTSUHDDemuxContext;
> +
> +static int probe(const AVProbeData *p)
> +{
> + int offset = av_dtsuhd_strmdata_payload(p->buf, p->buf_size, NULL);
> + int score = 0;
> + struct DTSUHD *h = av_dtsuhd_create();
> +
> + if (h && offset >= 0) {
> + for (; offset + 4 < p->buf_size; offset++) {
> + if (dtsuhd_is_syncword(AV_RB32(p->buf + offset))) {
> + if (DTSUHD_OK == av_dtsuhd_frame(h, p->buf + offset, p->buf_size - offset, NULL, NULL)) {
> + score = AVPROBE_SCORE_MAX - 3;
> + break;
> + }
> + }
> + }
> + }
> +
> + av_dtsuhd_destroy(h);
>
Doing allocation in probe?
How costly is this?
Probing should be very fast.
> + return score;
> +}
> +
> +static av_cold int read_close(AVFormatContext *s)
> +{
> + DTSUHDDemuxContext *dtsxs = s->priv_data;
> +
> + av_freep(&dtsxs->buf);
> + av_dtsuhd_destroy(dtsxs->dtsuhd);
> + dtsxs->dtsuhd = NULL;
> +
> + return 0;
> +}
> +
> +static int find_first_syncword(DTSUHDDemuxContext *dtsuhd, int data_start)
> +{
> + while (data_start + 4 < DTSUHD_BUFFER_SIZE &&
> + !dtsuhd_is_syncword(AV_RB32(dtsuhd->buf + data_start))) {
> + data_start++;
> + }
> +
> + return data_start;
> +}
> +
> +static int write_extradata(AVCodecParameters *par, DTSUHDDescriptorInfo *di)
> +{
> + PutBitContext pbc;
> + int ret;
> + int size;
> + uint8_t udts[32];
> +
> + init_put_bits(&pbc, udts, sizeof(udts));
> + put_bits32(&pbc, 0); // udts box size
> + put_bits32(&pbc, AV_RB32("udts")); // udts box signature
> + put_bits(&pbc, 6, di->decoder_profile_code);
> + put_bits(&pbc, 2, di->frame_duration_code);
> + put_bits(&pbc, 3, di->max_payload_code);
> + put_bits(&pbc, 5, di->num_pres_code);
> + put_bits32(&pbc, di->channel_mask);
> + put_bits(&pbc, 1, di->base_sample_freq_code);
> + put_bits(&pbc, 2, di->sample_rate_mod);
> + put_bits(&pbc, 3, di->rep_type);
> + put_bits(&pbc, 3, 0);
> + put_bits(&pbc, 1, 0);
> + put_bits64(&pbc, di->num_pres_code + 1, 0); // ID Tag present for each presentation.
> + flush_put_bits(&pbc); // byte align
> + size = put_bytes_output(&pbc);
> + AV_WB32(udts, size);
> +
> + ret = ff_alloc_extradata(par, size);
> + if (ret < 0)
> + return ret;
> +
> + memcpy(par->extradata, udts, size);
> +
> + return 0;
> +}
> +
> +static int read_header(AVFormatContext *s)
> +{
> + AVIOContext *pb = s->pb;
> + AVStream *st = avformat_new_stream(s, NULL);
> + DTSUHDDemuxContext *dtsuhd = s->priv_data;
> + DTSUHDDescriptorInfo di;
> + DTSUHDFrameInfo fi;
> + int buf_bytes;
> + int ret = DTSUHD_INVALID_FRAME;
> + int data_start;
> +
> + if (!(pb->seekable & AVIO_SEEKABLE_NORMAL))
> + return AVERROR(EIO);
> +
> + dtsuhd->buf = av_malloc(DTSUHD_BUFFER_SIZE);
> + dtsuhd->dtsuhd = av_dtsuhd_create();
> + if (!dtsuhd->buf || !dtsuhd->dtsuhd || !st)
> + return AVERROR(ENOMEM);
> +
> + buf_bytes = avio_read(pb, dtsuhd->buf, DTSUHD_BUFFER_SIZE);
> + if (buf_bytes < 0)
> + return buf_bytes;
> +
> + data_start = av_dtsuhd_strmdata_payload(dtsuhd->buf, buf_bytes, &dtsuhd->data_end);
> + if (data_start < 0)
> + return data_start;
> +
> + dtsuhd->data_end += data_start;
> + if (data_start == 0)
> + dtsuhd->data_end = avio_size(pb); // Not a DTSHDHDR chunk file, decode frames to end of file.
> +
> + data_start = find_first_syncword(dtsuhd, data_start);
> + if (avio_seek(pb, data_start, SEEK_SET) < 0)
> + return AVERROR(EINVAL);
> +
> + ret = av_dtsuhd_frame(dtsuhd->dtsuhd, dtsuhd->buf + data_start,
> + buf_bytes - data_start, &fi, &di);
> + if (ret != DTSUHD_OK || !di.valid) {
> + av_log(s, AV_LOG_ERROR, "Unable to process DTS-UHD file. File may be invalid.\n");
> + return AVERROR_INVALIDDATA;
> + }
> +
> + ffstream(st)->need_parsing = AVSTREAM_PARSE_FULL_RAW;
> + st->codecpar->codec_type = AVMEDIA_TYPE_AUDIO;
> + st->codecpar->codec_id = s->iformat->raw_codec_id;
> + st->codecpar->ch_layout.order = AV_CHANNEL_ORDER_NATIVE;
> + st->codecpar->ch_layout.nb_channels = di.channel_count;
> + st->codecpar->ch_layout.u.mask = di.ffmpeg_channel_mask;
> + st->codecpar->codec_tag = AV_RL32(di.coding_name);
> + st->codecpar->frame_size = 512 << di.frame_duration_code;
> + st->codecpar->sample_rate = di.sample_rate;
> +
> +#if FF_API_OLD_CHANNEL_LAYOUT
> +FF_DISABLE_DEPRECATION_WARNINGS
> + st->codecpar->channels = di.channel_count;
> + st->codecpar->channel_layout = di.ffmpeg_channel_mask;
> +FF_ENABLE_DEPRECATION_WARNINGS
> +#endif
> +
> + ret = write_extradata(st->codecpar, &di);
> + if (ret < 0)
> + return ret;
> +
> + if (st->codecpar->sample_rate)
> + avpriv_set_pts_info(st, 64, 1, st->codecpar->sample_rate);
> +
> + return 0;
> +}
> +
> +static int read_packet(AVFormatContext *s, AVPacket *pkt)
> +{
> + DTSUHDDemuxContext *dtsuhd = s->priv_data;
> + int64_t size, left;
> + int ret;
> +
> + left = dtsuhd->data_end - avio_tell(s->pb);
> + size = FFMIN(left, DTSUHD_MAX_FRAME_SIZE);
> + if (size <= 0)
> + return AVERROR_EOF;
> +
> + ret = av_get_packet(s->pb, pkt, size);
> + if (ret < 0)
> + return ret;
> +
> + pkt->stream_index = 0;
> +
> + return ret;
> +}
> +
> +AVInputFormat ff_dtsuhd_demuxer = {
> + .name = "dtsuhd",
> + .long_name = NULL_IF_CONFIG_SMALL("DTS-UHD"),
> + .priv_data_size = sizeof(DTSUHDDemuxContext),
> + .read_probe = probe,
> + .read_header = read_header,
> + .read_packet = read_packet,
> + .read_close = read_close,
> + .flags = AVFMT_GENERIC_INDEX,
> + .extensions = "dtsx",
> + .raw_codec_id = AV_CODEC_ID_DTSUHD,
> +};
> diff --git a/libavformat/movenc.c b/libavformat/movenc.c
> index c370922c7d..e727407694 100644
> --- a/libavformat/movenc.c
> +++ b/libavformat/movenc.c
> @@ -762,6 +762,24 @@ static int mov_write_esds_tag(AVIOContext *pb, MOVTrack *track) // Basic
> return update_size(pb, pos);
> }
>
> +static int mov_write_udts_tag(AVIOContext *pb, MOVTrack *track)
> +{
> + if (track->vos_len < 12) {
> + av_log(pb, AV_LOG_ERROR,
> + "Cannot write moov atom before DTS-UHD packets."
> + " Set the delay_moov flag to fix this.\n");
> + return AVERROR(EINVAL);
> + }
> +
> + /* Write vos_data is udts box. */
> + if (memcmp(track->vos_data + 4, "udts", 4) == 0) {
> + avio_write(pb, track->vos_data, track->vos_len);
> + return track->vos_len;
> + }
> +
> + return 0;
> +}
> +
> static int mov_pcm_le_gt16(enum AVCodecID codec_id)
> {
> return codec_id == AV_CODEC_ID_PCM_S24LE ||
> @@ -1367,6 +1385,8 @@ static int mov_write_audio_tag(AVFormatContext *s, AVIOContext *pb, MOVMuxContex
> ret = mov_write_dops_tag(s, pb, track);
> else if (track->par->codec_id == AV_CODEC_ID_TRUEHD)
> ret = mov_write_dmlp_tag(s, pb, track);
> + else if (track->par->codec_id == AV_CODEC_ID_DTSUHD)
> + ret = mov_write_udts_tag(pb, track);
> else if (tag == MOV_MP4_IPCM_TAG || tag == MOV_MP4_FPCM_TAG) {
> if (track->par->ch_layout.nb_channels > 1)
> ret = mov_write_chnl_tag(s, pb, track);
> @@ -2781,6 +2801,7 @@ static int mov_write_stbl_tag(AVFormatContext *s, AVIOContext *pb, MOVMuxContext
> if ((track->par->codec_type == AVMEDIA_TYPE_VIDEO ||
> track->par->codec_id == AV_CODEC_ID_TRUEHD ||
> track->par->codec_id == AV_CODEC_ID_MPEGH_3D_AUDIO ||
> + track->par->codec_id == AV_CODEC_ID_DTSUHD ||
> track->par->codec_tag == MKTAG('r','t','p',' ')) &&
> track->has_keyframes && track->has_keyframes < track->entry)
> mov_write_stss_tag(pb, track, MOV_SYNC_SAMPLE);
> @@ -5673,6 +5694,14 @@ static void mov_parse_vc1_frame(AVPacket *pkt, MOVTrack *trk)
> }
> }
>
> +static void mov_parse_dtsuhd_frame(AVPacket *pkt, MOVTrack *trk)
> +{
> + if (pkt->size > 4 && AV_RB32(pkt->data) == 0x40411BF2) {
> + trk->cluster[trk->entry].flags |= MOV_SYNC_SAMPLE;
> + trk->has_keyframes++;
> + }
> + }
> +
> static void mov_parse_truehd_frame(AVPacket *pkt, MOVTrack *trk)
> {
> int length;
> @@ -6343,6 +6372,8 @@ int ff_mov_write_packet(AVFormatContext *s, AVPacket *pkt)
> mov_parse_vc1_frame(pkt, trk);
> } else if (par->codec_id == AV_CODEC_ID_TRUEHD) {
> mov_parse_truehd_frame(pkt, trk);
> + } else if (par->codec_id == AV_CODEC_ID_DTSUHD) {
> + mov_parse_dtsuhd_frame(pkt, trk);
> } else if (pkt->flags & AV_PKT_FLAG_KEY) {
> if (mov->mode == MODE_MOV && par->codec_id == AV_CODEC_ID_MPEG2VIDEO &&
> trk->entry > 0) { // force sync sample for the first key frame
> @@ -7800,6 +7831,7 @@ static const AVCodecTag codec_mp4_tags[] = {
> { AV_CODEC_ID_AC3, MKTAG('a', 'c', '-', '3') },
> { AV_CODEC_ID_EAC3, MKTAG('e', 'c', '-', '3') },
> { AV_CODEC_ID_DTS, MKTAG('m', 'p', '4', 'a') },
> + { AV_CODEC_ID_DTSUHD, MKTAG('d', 't', 's', 'x') },
> { AV_CODEC_ID_TRUEHD, MKTAG('m', 'l', 'p', 'a') },
> { AV_CODEC_ID_FLAC, MKTAG('f', 'L', 'a', 'C') },
> { AV_CODEC_ID_OPUS, MKTAG('O', 'p', 'u', 's') },
> diff --git a/libavformat/version.h b/libavformat/version.h
> index cc56b7cf5c..384cbd49cc 100644
> --- a/libavformat/version.h
> +++ b/libavformat/version.h
> @@ -31,7 +31,7 @@
>
> #include "version_major.h"
>
> -#define LIBAVFORMAT_VERSION_MINOR 4
> +#define LIBAVFORMAT_VERSION_MINOR 5
> #define LIBAVFORMAT_VERSION_MICRO 101
>
> #define LIBAVFORMAT_VERSION_INT AV_VERSION_INT(LIBAVFORMAT_VERSION_MAJOR, \
> --
> 2.17.1
>
>
> _______________________________________________
> ffmpeg-devel mailing list
> ffmpeg-devel at ffmpeg.org
> https://ffmpeg.org/mailman/listinfo/ffmpeg-devel
>
> To unsubscribe, visit link above, or email
> ffmpeg-devel-request at ffmpeg.org with subject "unsubscribe".
>
More information about the ffmpeg-devel mailing list