Re: [libav-devel] [PATCH] Direct Stream Digital (DSD) decoder

Kostya Shishkov Wed, 16 Apr 2014 07:53:22 -0700

On Wed, Apr 16, 2014 at 04:13:19PM +0200, Luca Barbato wrote:
> From: Peter Ross <[email protected]>
> 
> Signed-off-by: Peter Ross <[email protected]>
> Signed-off-by: Michael Niedermayer <[email protected]>
> Signed-off-by: Jean-Baptiste Kempf <[email protected]>
> Signed-off-by: Luca Barbato <[email protected]>
> ---
> 
> The tests are missing, Vittorio willing to bake some?
> 
>  Changelog                 |   1 +
>  doc/general.texi          |   4 +
>  libavcodec/Makefile       |   8 +-
>  libavcodec/allcodecs.c    |   4 +
>  libavcodec/avcodec.h      |   4 +
>  libavcodec/codec_desc.c   |  28 +++++++
>  libavcodec/dsd_tablegen.c |  38 ++++++++++
>  libavcodec/dsd_tablegen.h |  95 ++++++++++++++++++++++++
>  libavcodec/dsddec.c       | 185 
> ++++++++++++++++++++++++++++++++++++++++++++++
>  libavcodec/utils.c        |   4 +
>  10 files changed, 370 insertions(+), 1 deletion(-)
>  create mode 100644 libavcodec/dsd_tablegen.c
>  create mode 100644 libavcodec/dsd_tablegen.h
>  create mode 100644 libavcodec/dsddec.c
> 
> diff --git a/Changelog b/Changelog
> index 55216e8..d895b94 100644
> --- a/Changelog
> +++ b/Changelog
> @@ -19,6 +19,7 @@ version <next>:
>  - LucasArts SMUSH demuxer
>  - MP2 encoding via TwoLAME
>  - asettb filter
> +- Direct Stream Digital (DSD) decoder
> 
> 
>  version 10:
> diff --git a/doc/general.texi b/doc/general.texi
> index 2612eb1..4b16075 100644
> --- a/doc/general.texi
> +++ b/doc/general.texi
> @@ -822,6 +822,10 @@ following image formats are supported:
>  @item DPCM Sol               @tab     @tab  X
>  @item DPCM Xan               @tab     @tab  X
>      @tab Used in Origin's Wing Commander IV AVI files.
> +@item DSD (Direct Stream Digitial), least significant bit first  @tab  @tab  
> X
> +@item DSD (Direct Stream Digitial), most significant bit first   @tab  @tab  
> X
> +@item DSD (Direct Stream Digitial), least significant bit first, planar  
> @tab  @tab  X
> +@item DSD (Direct Stream Digitial), most significant bit first, planar   
> @tab  @tab  X


one item should be enough

>  @item DSP Group TrueSpeech   @tab     @tab  X
>  @item DV audio               @tab     @tab  X
>  @item Enhanced AC-3          @tab  X  @tab  X
[...]
> diff --git a/libavcodec/dsd_tablegen.h b/libavcodec/dsd_tablegen.h
> new file mode 100644
> index 0000000..0bebaea
> --- /dev/null
> +++ b/libavcodec/dsd_tablegen.h
> @@ -0,0 +1,95 @@
> +/*
> + * Header file for hardcoded DSD tables
> + * based on BSD licensed dsd2pcm by Sebastian Gesemann
> + * Copyright (c) 2009, 2011 Sebastian Gesemann. All rights reserved.
> + *
> + * This file is part of Libav.
> + *
> + * Libav is free software; you can redistribute it and/or
> + * modify it under the terms of the GNU Lesser General Public
> + * License as published by the Free Software Foundation; either
> + * version 2.1 of the License, or (at your option) any later version.
> + *
> + * Libav is distributed in the hope that it will be useful,
> + * but WITHOUT ANY WARRANTY; without even the implied warranty of
> + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
> + * Lesser General Public License for more details.
> + *
> + * You should have received a copy of the GNU Lesser General Public
> + * License along with Libav; if not, write to the Free Software
> + * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 
> USA
> + */
> +
> +#ifndef AVCODEC_DSD_TABLEGEN_H
> +#define AVCODEC_DSD_TABLEGEN_H
> +
> +#include <stdint.h>
> +#include "libavutil/attributes.h"
> +
> +#define HTAPS   48                /** number of FIR constants */
> +#define CTABLES ((HTAPS + 7) / 8) /** number of "8 MACs" lookup tables */
> +
> +#if CONFIG_HARDCODED_TABLES
> +#define dsd_ctables_tableinit()
> +#include "libavcodec/dsd_tables.h"
> +#else
> +#include "libavutil/common.h"
> +
> +/*
> + * Properties of this 96-tap lowpass filter when applied on a signal
> + * with sampling rate of 44100*64 Hz:
> + *
> + * () has a delay of 17 microseconds.

()?

> + *
> + * () flat response up to 48 kHz
> + *
> + * () if you downsample afterwards by a factor of 8, the
> + *    spectrum below 70 kHz is practically alias-free.
> + *
> + * () stopband rejection is about 160 dB
> + *
> + * The coefficient tables ("ctables") take only 6 Kibi Bytes and

barf

> + * should fit into a modern processor's fast cache.
> + */
> +
> +/**
> + * The 2nd half (48 coeffs) of a 96-tap symmetric lowpass filter
> + */
> +static const double htaps[HTAPS] = {
> +     0.09950731974056658,    0.09562845727714668,    0.08819647126516944,
> +     0.07782552527068175,    0.06534876523171299,    0.05172629311427257,
> +     0.0379429484910187,     0.02490921351762261,    0.0133774746265897,
> +     0.003883043418804416,  -0.003284703416210726,  -0.008080250212687497,
> +    -0.01067241812471033,   -0.01139427235000863,   -0.0106813877974587,
> +    -0.009007905078766049,  -0.006828859761015335,  -0.004535184322001496,
> +    -0.002425035959059578,  -0.0006922187080790708,  0.0005700762133516592,
> +     0.001353838005269448,   0.001713709169690937,   0.001742046839472948,
> +     0.001545601648013235,   0.001226696225277855,   0.0008704322683580222,
> +     0.0005381636200535649,  0.000266446345425276,   7.002968738383528e-05,
> +    -5.279407053811266e-05, -0.0001140625650874684, -0.0001304796361231895,
> +    -0.0001189970287491285, -9.396247155265073e-05, -6.577634378272832e-05,
> +    -4.07492895872535e-05,  -2.17407957554587e-05,  -9.163058931391722e-06,
> +    -2.017460145032201e-06,  1.249721855219005e-06,  2.166655190537392e-06,
> +     1.930520892991082e-06,  1.319400334374195e-06,  7.410039764949091e-07,
> +     3.423230509967409e-07,  1.244182214744588e-07,  3.130441005359396e-08
> +};
> +
> +static float ctables[CTABLES][256];
> +
> +static av_cold void dsd_ctables_tableinit(void)
> +{
> +    int t, e, m, k;
> +    double acc;
> +    for (t = 0; t < CTABLES; ++t) {
> +        k = FFMIN(HTAPS - t * 8, 8);

unless one decides to switch to non-multiple-of-8 tap filter k=8 in all cases
(otherwise one can pad filter anyway and see above)

> +        for (e = 0; e < 256; ++e) {
> +            acc = 0.0;
> +            for (m = 0; m < k; ++m)
> +                acc += (((e >> (7 - m)) & 1) * 2 - 1) * htaps[t * 8 + m];
> +            ctables[CTABLES - 1 - t][e] = (float)acc;
> +        }
> +    }
> +}
> +#endif /* CONFIG_HARDCODED_TABLES */
> +
> +#endif /* AVCODEC_DSD_TABLEGEN_H */
> diff --git a/libavcodec/dsddec.c b/libavcodec/dsddec.c
> new file mode 100644
> index 0000000..6876f16
> --- /dev/null
> +++ b/libavcodec/dsddec.c
> @@ -0,0 +1,185 @@
> +/*
> + * Direct Stream Digital (DSD) decoder
> + * based on BSD licensed dsd2pcm by Sebastian Gesemann
> + * Copyright (c) 2009, 2011 Sebastian Gesemann. All rights reserved.
> + * Copyright (c) 2014 Peter Ross
> + *
> + * This file is part of Libav.
> + *
> + * Libav is free software; you can redistribute it and/or
> + * modify it under the terms of the GNU Lesser General Public
> + * License as published by the Free Software Foundation; either
> + * version 2.1 of the License, or (at your option) any later version.
> + *
> + * Libav is distributed in the hope that it will be useful,
> + * but WITHOUT ANY WARRANTY; without even the implied warranty of
> + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
> + * Lesser General Public License for more details.
> + *
> + * You should have received a copy of the GNU Lesser General Public
> + * License along with Libav; if not, write to the Free Software
> + * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 
> USA
> + */
> +
> +/**
> + * @file
> + * Direct Stream Digital (DSD) decoder
> + */
> +
> +#include "libavcodec/internal.h"
> +#include "libavcodec/mathops.h"
> +#include "avcodec.h"
> +#include "dsd_tablegen.h"
> +
> +#define FIFOSIZE 16              /** must be a power of two */
> +#define FIFOMASK (FIFOSIZE - 1)  /** bit mask for FIFO offsets */
> +
> +#if FIFOSIZE * 8 < HTAPS * 2
> +#error "FIFOSIZE too small"
> +#endif
> +
> +/*
> + * Per-channel buffer
> + */
> +typedef struct {
> +    unsigned char buf[FIFOSIZE];

uint8_t?

> +    unsigned pos;
> +} DSDContext;
> +
> +static void dsd2pcm_translate(DSDContext* s, size_t samples, int lsbf,
> +                              const uint8_t *src, ptrdiff_t src_stride,
> +                              float *dst, ptrdiff_t dst_stride)
> +{
> +    unsigned int pos, i;
> +    uint8_t *p;
> +    double sum;
> +
> +    pos = s->pos;
> +
> +    while (samples-- > 0) {

while (samples--)

it's more honest here

> +        s->buf[pos] = lsbf ? ff_reverse[*src] : *src;
> +        src += src_stride;
> +
> +        p = s->buf + ((pos - CTABLES) & FIFOMASK);
> +        *p = ff_reverse[*p];
> +
> +        sum = 0.0;
> +        for (i = 0; i < CTABLES; i++) {
> +            const uint8_t a = s->buf[(pos                     - i) & 
> FIFOMASK];
> +            const uint8_t b = s->buf[(pos - (CTABLES * 2 - 1) + i) & 
> FIFOMASK];
> +            sum += ctables[i][a] + ctables[i][b];
> +        }
> +
> +        *dst = (float)sum;
> +        dst += dst_stride;
> +
> +        pos = (pos + 1) & FIFOMASK;
> +    }
> +
> +    s->pos = pos;
> +}
> +
> +static av_cold void dsd_init_static_data(AVCodec *unused)
> +{
> +    dsd_ctables_tableinit();
> +}
> +
> +static av_cold int dsd_decode_init(AVCodecContext *avctx)
> +{
> +    DSDContext * s;
> +    int i;
> +
> +    s = av_malloc(sizeof(DSDContext) * avctx->channels);
> +    if (!s)
> +        return AVERROR(ENOMEM);
> +
> +    for (i = 0; i < avctx->channels; i++) {
> +        s[i].pos = 0;
> +        memset(s[i].buf, 0x69, sizeof(s[i].buf));
> +
> +        /* 0x69 = 01101001
> +         * This pattern "on repeat" makes a low energy 352.8 kHz tone
> +         * and a high energy 1.0584 MHz tone which should be filtered
> +         * out completely by any playback system --> silence
> +         */
> +    }
> +
> +    avctx->sample_fmt = AV_SAMPLE_FMT_FLTP;
> +    avctx->priv_data  = s;
> +    return 0;
> +}
> +
> +static av_always_inline
> +int dsd_decode_frame_internal(AVCodecContext *avctx, void *data,
> +                              int *got_frame_ptr, AVPacket *avpkt,
> +                              int lsbf, int planar)
> +{
> +    DSDContext * s = avctx->priv_data;
> +    AVFrame *frame = data;
> +    int ret, i;
> +    int src_next;
> +    int src_stride;
> +
> +    frame->nb_samples = avpkt->size / avctx->channels;
> +
> +    if (planar) {
> +        src_next   = frame->nb_samples;
> +        src_stride = 1;
> +    } else {
> +        src_next   = 1;
> +        src_stride = avctx->channels;
> +    }
> +
> +    if ((ret = ff_get_buffer(avctx, frame, 0)) < 0)
> +        return ret;
> +
> +    for (i = 0; i < avctx->channels; i++) {
> +        float *dst = ((float **)frame->extended_data)[i];
> +        dsd2pcm_translate(&s[i], frame->nb_samples, lsbf,
> +                          avpkt->data + i * src_next, src_stride,
> +                          dst, 1);
> +    }
> +
> +    *got_frame_ptr = 1;
> +    return frame->nb_samples * avctx->channels;
> +}
> +
> +static int dsd_lsbf_decode_frame(AVCodecContext *avctx, void *data,
> +                                 int *got_frame, AVPacket *avpkt)
> +{
> +    return dsd_decode_frame_internal(avctx, data, got_frame, avpkt, 1, 0);
> +}

empty line missing

> +static int dsd_msbf_decode_frame(AVCodecContext *avctx, void *data,
> +                                 int *got_frame, AVPacket *avpkt)
> +{
> +    return dsd_decode_frame_internal(avctx, data, got_frame, avpkt, 0, 0);
> +}
> +
> +static int dsd_lsbf_planar_decode_frame(AVCodecContext *avctx, void *data,
> +                                        int *got_frame, AVPacket *avpkt)
> +{
> +    return dsd_decode_frame_internal(avctx, data, got_frame, avpkt, 1, 1);
> +}
> +static int dsd_msbf_planar_decode_frame(AVCodecContext *avctx, void *data,
> +                                        int *got_frame, AVPacket *avpkt)
> +{
> +    return dsd_decode_frame_internal(avctx, data, got_frame, avpkt, 0, 1);
> +}
> +
> +#define DSD_DECODER(id_, name_, long_name_) \
> +AVCodec ff_##name_##_decoder = { \
> +    .name             = #name_, \
> +    .long_name        = NULL_IF_CONFIG_SMALL(long_name_), \
> +    .type             = AVMEDIA_TYPE_AUDIO, \
> +    .id               = AV_CODEC_ID_##id_, \
> +    .init             = dsd_decode_init, \
> +    .decode           = name_ ## _decode_frame, \
> +    .init_static_data = dsd_init_static_data, \
> +    .sample_fmts      = (const enum AVSampleFormat[]){ AV_SAMPLE_FMT_FLTP, \
> +                                                       AV_SAMPLE_FMT_NONE }, 
> \
> +};
> +
> +DSD_DECODER(DSD_LSBF, dsd_lsbf, "DSD (Direct Stream Digital), least 
> significant bit first")
> +DSD_DECODER(DSD_MSBF, dsd_msbf, "DSD (Direct Stream Digital), most 
> significant bit first")
> +DSD_DECODER(DSD_MSBF_PLANAR, dsd_msbf_planar, "DSD (Direct Stream Digital), 
> most significant bit first, planar")
> +DSD_DECODER(DSD_LSBF_PLANAR, dsd_lsbf_planar, "DSD (Direct Stream Digital), 
> least significant bit first, planar")

I wonder if it makes sense to contract it to "LSB/MSB first"

> diff --git a/libavcodec/utils.c b/libavcodec/utils.c
> index d9832e2..38a138b 100644
> --- a/libavcodec/utils.c
> +++ b/libavcodec/utils.c
> @@ -1929,6 +1929,10 @@ int av_get_exact_bits_per_sample(enum AVCodecID 
> codec_id)
>      case AV_CODEC_ID_ADPCM_G722:
>      case AV_CODEC_ID_ADPCM_YAMAHA:
>          return 4;
> +    case AV_CODEC_ID_DSD_LSBF:
> +    case AV_CODEC_ID_DSD_MSBF:
> +    case AV_CODEC_ID_DSD_LSBF_PLANAR:
> +    case AV_CODEC_ID_DSD_MSBF_PLANAR:
>      case AV_CODEC_ID_PCM_ALAW:
>      case AV_CODEC_ID_PCM_MULAW:
>      case AV_CODEC_ID_PCM_S8:
> --

in general LGTM
_______________________________________________
libav-devel mailing list
[email protected]
https://lists.libav.org/mailman/listinfo/libav-devel

Re: [libav-devel] [PATCH] Direct Stream Digital (DSD) decoder

Reply via email to