On Thu, 28 Nov 2013 15:03:04 +0100, Vittorio Giovara 
<[email protected]> wrote:
> ---
>  Changelog                  |    1 +
>  doc/filters.texi           |   19 ++
>  libavfilter/Makefile       |    1 +
>  libavfilter/allfilters.c   |    1 +
>  libavfilter/version.h      |    4 +-
>  libavfilter/vf_framepack.c |  488 ++++++++++++++++++++++++++++++++++++++++++++
>  6 files changed, 512 insertions(+), 2 deletions(-)
>  create mode 100644 libavfilter/vf_framepack.c
> 
> diff --git a/Changelog b/Changelog
> index 78b3338..5a47b18 100644
> --- a/Changelog
> +++ b/Changelog
> @@ -51,6 +51,7 @@ version 10:
>  - support for decoding through VDPAU in avconv (the -hwaccel option)
>  - remove mp3_header_(de)compress bitstream filters
>  - codec level stereoscopic metadata handling
> +- framepack filter
>  
>  
>  version 9:
> diff --git a/doc/filters.texi b/doc/filters.texi
> index b32aad1..04779bc 100644
> --- a/doc/filters.texi
> +++ b/doc/filters.texi
> @@ -1252,6 +1252,25 @@ frames with a negative PTS.
>  
>  @end table
>  
> +@section framepack
> +
> +Packs two different video streams into a stereoscopic video. The two videos
> +should have the same size and framerate; you may conveniently adjust those
> +values with the @ref{scale} and @ref{fps} filters. If one video lasts longer
> +than the other, the last frame is repeated.
> +
> +This filter also sets proper signalling on supported codecs.
> +
> +This filter accepts the following named parameters:
> +@table @option
> +
> +@item format
> +Desired framepacking format. Supported values are @var{2d} (default),
> +@var{sbs}, @var{sbsqnx}, @var{tab}, @var{lines}, @var{columns}, @var{frameseq}, @var{check}.
> +See a detailed format description in @file{libavutil/stereo3d.h}.
> +
> +@end table
> +
>  @anchor{frei0r}
>  @section frei0r
>  
> diff --git a/libavfilter/Makefile b/libavfilter/Makefile
> index 96fa8c0..92c1561 100644
> --- a/libavfilter/Makefile
> +++ b/libavfilter/Makefile
> @@ -54,6 +54,7 @@ OBJS-$(CONFIG_FADE_FILTER)                   += vf_fade.o
>  OBJS-$(CONFIG_FIELDORDER_FILTER)             += vf_fieldorder.o
>  OBJS-$(CONFIG_FORMAT_FILTER)                 += vf_format.o
>  OBJS-$(CONFIG_FPS_FILTER)                    += vf_fps.o
> +OBJS-$(CONFIG_FRAMEPACK_FILTER)              += vf_framepack.o
>  OBJS-$(CONFIG_FREI0R_FILTER)                 += vf_frei0r.o
>  OBJS-$(CONFIG_GRADFUN_FILTER)                += vf_gradfun.o
>  OBJS-$(CONFIG_HFLIP_FILTER)                  += vf_hflip.o
> diff --git a/libavfilter/allfilters.c b/libavfilter/allfilters.c
> index f041f5c..9702a0a 100644
> --- a/libavfilter/allfilters.c
> +++ b/libavfilter/allfilters.c
> @@ -74,6 +74,7 @@ void avfilter_register_all(void)
>      REGISTER_FILTER(FIELDORDER,     fieldorder,     vf);
>      REGISTER_FILTER(FORMAT,         format,         vf);
>      REGISTER_FILTER(FPS,            fps,            vf);
> +    REGISTER_FILTER(FRAMEPACK,      framepack,      vf);
>      REGISTER_FILTER(FREI0R,         frei0r,         vf);
>      REGISTER_FILTER(GRADFUN,        gradfun,        vf);
>      REGISTER_FILTER(HFLIP,          hflip,          vf);
> diff --git a/libavfilter/version.h b/libavfilter/version.h
> index bc079b4..3f7d9dc 100644
> --- a/libavfilter/version.h
> +++ b/libavfilter/version.h
> @@ -30,8 +30,8 @@
>  #include "libavutil/avutil.h"
>  
>  #define LIBAVFILTER_VERSION_MAJOR  3
> -#define LIBAVFILTER_VERSION_MINOR  11
> -#define LIBAVFILTER_VERSION_MICRO  1
> +#define LIBAVFILTER_VERSION_MINOR  12
> +#define LIBAVFILTER_VERSION_MICRO  0
>  
>  #define LIBAVFILTER_VERSION_INT AV_VERSION_INT(LIBAVFILTER_VERSION_MAJOR, \
>                                                 LIBAVFILTER_VERSION_MINOR, \
> diff --git a/libavfilter/vf_framepack.c b/libavfilter/vf_framepack.c
> new file mode 100644
> index 0000000..35f5656
> --- /dev/null
> +++ b/libavfilter/vf_framepack.c
> @@ -0,0 +1,488 @@
> +/*
> + * Copyright (c) 2013 Vittorio Giovara
> + *
> + * This file is part of Libav.
> + *
> + * Libav is free software; you can redistribute it and/or
> + * modify it under the terms of the GNU Lesser General Public
> + * License as published by the Free Software Foundation; either
> + * version 2.1 of the License, or (at your option) any later version.
> + *
> + * Libav is distributed in the hope that it will be useful,
> + * but WITHOUT ANY WARRANTY; without even the implied warranty of
> + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
> + * Lesser General Public License for more details.
> + *
> + * You should have received a copy of the GNU Lesser General Public
> + * License along with Libav; if not, write to the Free Software
> + * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
> + */
> +
> +/**
> + * @file
> + * Generate a frame packed video, by combining two views in a single surface.
> + */
> +
> +#include "libavutil/common.h"
> +#include "libavutil/opt.h"
> +#include "libavutil/pixdesc.h"
> +#include "libavutil/rational.h"
> +#include "libavutil/stereo3d.h"
> +
> +#include "avfilter.h"
> +#include "formats.h"
> +#include "internal.h"
> +#include "video.h"
> +
> +#define LEFT_VIEW  0
> +#define RIGHT_VIEW 1
> +
> +typedef struct FramepackContext {
> +    const AVClass *class;
> +
> +    const AVPixFmtDescriptor *pix_desc; ///< agreed pixel format
> +
> +    enum AVStereo3DType format;         ///< frame packed output
> +
> +    AVFrame *left;                      ///< left input frame
> +    AVFrame *right;                     ///< right input frame

You should be able to simplify the code by using an array[2] indexed with
LEFT_VIEW/RIGHT_VIEW.
> +} FramepackContext;
> +
> +static const enum AVPixelFormat formats_supported[] = {
> +    AV_PIX_FMT_YUV420P,  AV_PIX_FMT_YUV422P,  AV_PIX_FMT_YUV444P,
> +    AV_PIX_FMT_YUV410P,  AV_PIX_FMT_YUVA420P, AV_PIX_FMT_YUVJ420P,
> +    AV_PIX_FMT_YUVJ422P, AV_PIX_FMT_YUVJ444P, AV_PIX_FMT_YUVJ440P,
> +    AV_PIX_FMT_NONE
> +};
> +
> +static int query_formats(AVFilterContext *ctx)
> +{
> +    ff_set_common_formats(ctx, ff_make_format_list(formats_supported));
> +    return 0;
> +}
> +
> +static av_cold void framepack_uninit(AVFilterContext *ctx)
> +{
> +    FramepackContext *s = ctx->priv;
> +
> +    // clean any leftover frame
> +    av_frame_free(&s->left);
> +    av_frame_free(&s->right);
> +
> +    av_opt_free(s);

Not needed; lavfi does that for you.

> +}
> +
> +static int config_input_left(AVFilterLink *inlink)
> +{
> +    FramepackContext *s = inlink->dst->priv;
> +
> +    // save pixel format which has to match the other one
> +    s->pix_desc = av_pix_fmt_desc_get(inlink->format);
> +
> +    return 0;
> +}
> +
> +static int config_input_right(AVFilterLink *inlink)
> +{
> +    FramepackContext *s = inlink->dst->priv;
> +    const AVPixFmtDescriptor *right_desc = 
> av_pix_fmt_desc_get(inlink->format);
> +
> +    if(!s->pix_desc || !right_desc)
> +        return AVERROR_BUG;
> +
> +    // check input format
> +    if (s->pix_desc != right_desc) {
> +        av_log(inlink->dst, AV_LOG_ERROR,
> +               "Left and right color spaces differ (%s vs %s).\n",
> +               s->pix_desc->name, right_desc->name);
> +        return AVERROR_INVALIDDATA;
> +    }

The inputs should be treated symmetrically, there is no guarantee in which order
they are initialized.  And the check is not needed anyway,
ff_set_common_formats() makes sure the formats are the same on all pads.

> +
> +    return 0;
> +}
> +
> +static int config_output(AVFilterLink *outlink)
> +{
> +    AVFilterContext *ctx = outlink->src;
> +    FramepackContext *s  = outlink->src->priv;
> +
> +    int width            = ctx->inputs[LEFT_VIEW]->w;
> +    int height           = ctx->inputs[LEFT_VIEW]->h;
> +    AVRational time_base = ctx->inputs[LEFT_VIEW]->time_base;
> +
> +    // check size and fps match on the other input
> +    if (width  != ctx->inputs[RIGHT_VIEW]->w ||
> +        height != ctx->inputs[RIGHT_VIEW]->h) {
> +        av_log(ctx, AV_LOG_ERROR,
> +               "Left and right sizes differ (%dx%d vs %dx%d).\n",
> +               width, height,
> +               ctx->inputs[RIGHT_VIEW]->w, ctx->inputs[RIGHT_VIEW]->h);
> +        return AVERROR_INVALIDDATA;
> +    } else if (av_cmp_q(time_base, ctx->inputs[RIGHT_VIEW]->time_base) != 0) 
> {
> +        av_log(ctx, AV_LOG_ERROR,
> +               "Left and right framerates differ (%d/%d vs %d/%d).\n",
> +               time_base.num, time_base.den,
> +               ctx->inputs[RIGHT_VIEW]->time_base.num,
> +               ctx->inputs[RIGHT_VIEW]->time_base.den);
> +        return AVERROR_INVALIDDATA;
> +    }
> +
> +    // modify output properties as needed
> +    switch (s->format) {
> +    case AV_STEREO3D_2D:
> +        av_log(ctx, AV_LOG_WARNING,
> +               "No frame packing mode selected, setting metadata only.\n");
> +        break;
> +    case AV_STEREO3D_FRAMESEQUENCE:
> +        time_base.den *= 2;
> +        break;
> +    case AV_STEREO3D_COLUMNS:
> +    case AV_STEREO3D_SIDEBYSIDE:
> +    case AV_STEREO3D_SIDEBYSIDE_QUINCUNX:
> +        width *= 2;
> +        break;
> +    case AV_STEREO3D_LINES:
> +    case AV_STEREO3D_TOPBOTTOM:
> +        height *= 2;
> +        break;
> +    case AV_STEREO3D_CHECKERBOARD:
> +        // same w/h/tb
> +        break;
> +    }
> +
> +    outlink->w         = width;
> +    outlink->h         = height;
> +    outlink->time_base = time_base;
> +
> +    return 0;
> +}
> +
> +static void pack_sidebyside_frame(FramepackContext *s,
> +                                  AVFrame *dst,
> +                                  int interleaved)
> +{
> +    int plane, i;
> +    int length = s->left->width;
> +    int lines  = s->left->height;
> +
> +    for (plane = 0; plane < s->pix_desc->nb_components; plane++) {
> +        const uint8_t *leftp  = s->left->data[plane];
> +        const uint8_t *rightp = s->right->data[plane];
> +        uint8_t *dstp         = dst->data[plane];
> +
> +        if (plane == 1 || plane == 2) {
> +            length = -(-s->left->width  >> s->pix_desc->log2_chroma_w);
> +            lines  = -(-s->left->height >> s->pix_desc->log2_chroma_h);
> +        }
> +
> +        if (!interleaved) {
> +            for (i = 0; i < lines; i++) {
> +                memcpy(dstp, leftp, length);
> +                memcpy(dstp + length, rightp, length);
> +
> +                dstp   += dst->linesize[plane];
> +                leftp  += s->left->linesize[plane];
> +                rightp += s->right->linesize[plane];
> +            }

Can't av_image_copy() handle the non-interleaved case?

> +        } else {
> +            for (i = 0; i < lines; i++) {
> +                int j;
> +                int k = 0;
> +
> +                for (j = 0; j < length; j++) {
> +                    dstp[k++] = leftp[j];
> +                    dstp[k++] = rightp[j];
> +                }
> +
> +                dstp   += dst->linesize[plane];
> +                leftp  += s->left->linesize[plane];
> +                rightp += s->right->linesize[plane];
> +            }
> +        }
> +    }
> +
> +    return;
> +}
> +
> +static void pack_topbottom_frame(FramepackContext *s,
> +                                 AVFrame *dst,
> +                                 int interleaved)
> +{
> +    int plane, i;
> +    int step   = interleaved ? 2 : 1;
> +    int length = s->left->width;
> +    int lines  = s->left->height;
> +
> +    for (plane = 0; plane < s->pix_desc->nb_components; plane++) {
> +        const uint8_t *srcp;
> +        uint8_t *dstp;
> +
> +        if (plane == 1 || plane == 2) {
> +            length = -(-s->left->width  >> s->pix_desc->log2_chroma_w);
> +            lines  = -(-s->left->height >> s->pix_desc->log2_chroma_h);
> +        }
> +
> +        // copy first frame line by line
> +        srcp = s->left->data[plane];
> +        dstp = dst->data[plane];
> +        for (i = 0; i < lines; i ++) {
> +            memcpy(dstp, srcp, length);
> +            dstp += dst->linesize[plane] * step;
> +            srcp += s->left->linesize[plane];
> +        }
> +
> +        // copy second frame line by line
> +        srcp = s->right->data[plane];
> +        if (interleaved) {
> +            // reset destination pointer and offset one line
> +            dstp = dst->data[plane] + dst->linesize[plane];
> +        }
> +        for (i = 0; i < lines; i ++) {
> +            memcpy(dstp, srcp, length);
> +            dstp += dst->linesize[plane] * step;
> +            srcp += s->right->linesize[plane];
> +        }
> +    }

Can't this be replaced by av_image_copy()?

> +
> +    return;
> +}
> +
> +static void pack_checkerboard_frame(FramepackContext *s, AVFrame *dst)
> +{
> +    int plane, i;
> +    int length = s->left->width;
> +    int lines  = s->left->height;
> +
> +    for (plane = 0; plane < s->pix_desc->nb_components; plane++) {
> +        const uint8_t *leftp  = s->left->data[plane];
> +        const uint8_t *rightp = s->right->data[plane];
> +        uint8_t *dstp         = dst->data[plane];
> +
> +        if (plane == 1 || plane == 2) {
> +            length = -(-s->left->width  >> s->pix_desc->log2_chroma_w);
> +            lines  = -(-s->left->height >> s->pix_desc->log2_chroma_h);
> +        }
> +
> +        // alternatively copy one pixel, changing source at each line
> +        for (i = 0; i < lines; i++) {
> +            int k;
> +            for (k = 0; k < length; k += 2) {
> +                dstp[k]     = i % 2 ? rightp[k] : leftp[k];
> +                dstp[k + 1] = i % 2 ? leftp[k + 1] : rightp[k + 1];
> +            }

This code looks shady. Should k not run over input length * 2? Or does this
packing lose half the resolution?

> +
> +            dstp   += dst->linesize[plane];
> +            leftp  += s->left->linesize[plane];
> +            rightp += s->right->linesize[plane];
> +        }
> +    }
> +
> +    return;
> +}
> +
> +static int set_side_data(AVFrame *out, enum AVStereo3DType format)
> +{
> +    AVStereo3D *stereo = av_stereo3d_create_side_data(out);
> +    if (!stereo)
> +        return AVERROR(ENOMEM);
> +
> +    stereo->type = format;
> +
> +    return 0;
> +}
> +
> +
> +static av_always_inline void pack_frame(FramepackContext *s, AVFrame *dst)
> +{
> +    switch (s->format) {
> +    case AV_STEREO3D_COLUMNS:
> +        pack_sidebyside_frame(s, dst, 1);
> +        break;
> +    case AV_STEREO3D_SIDEBYSIDE:
> +    case AV_STEREO3D_SIDEBYSIDE_QUINCUNX:
> +        pack_sidebyside_frame(s, dst, 0);
> +        break;
> +    case AV_STEREO3D_LINES:
> +        pack_topbottom_frame(s, dst, 1);
> +        break;
> +    case AV_STEREO3D_TOPBOTTOM:
> +        pack_topbottom_frame(s, dst, 0);
> +        break;
> +    case AV_STEREO3D_CHECKERBOARD:
> +        pack_checkerboard_frame(s, dst);
> +        break;
> +    }
> +
> +    return;
> +}
> +
> +static int filter_frame_left(AVFilterLink *inlink, AVFrame *frame)
> +{
> +    FramepackContext *s = inlink->dst->priv;
> +
> +    s->left = frame;
> +
> +    return 0;
> +}
> +
> +static int filter_frame_right(AVFilterLink *inlink, AVFrame *frame)
> +{
> +    FramepackContext *s = inlink->dst->priv;
> +
> +    s->right = frame;
> +
> +    return 0;
> +}
> +
> +static int request_frame(AVFilterLink *outlink)
> +{
> +    AVFilterContext *ctx = outlink->src;
> +    FramepackContext *s = ctx->priv;
> +    int ret, retl, retr;
> +    AVFrame *out;
> +    static uint64_t double_pts;

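static? Really? =p
A function-level static is shared by every instance of the filter; since it is
assigned from s->left->pts before each use, a plain local variable would do.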

> +
> +    /* get a frame on the left input, on EOF reuse previous */
> +    if (!s->left) {
> +        retl = ff_request_frame(ctx->inputs[LEFT_VIEW]);
> +        if (retl < 0 && retl != AVERROR_EOF)
> +            return retl;
> +    }
> +    /* get a new frame on the right input, on EOF reuse previous */
> +    if (!s->right) {
> +        retr = ff_request_frame(ctx->inputs[RIGHT_VIEW]);
> +        if (retr < 0 && retr != AVERROR_EOF)
> +            return retr;
> +    }
> +    /* when both return values are EOF, it means that both
> +     * videos are fully processed and we can stop */
> +    if (retl == retr && retl == AVERROR_EOF)
> +        return retl;
> +
> +    if (s->format == AV_STEREO3D_FRAMESEQUENCE) {
> +        AVFrame *cur;
> +        int i;
> +        double_pts = s->left->pts;
> +
> +        for (i = 0; i < 2; i++) {
> +            cur = i == 0 ? s->left : s->right;
> +            out = av_frame_clone(cur);
> +            if (!out)
> +                return AVERROR(ENOMEM);
> +
> +            out->pts = double_pts++;
> +            ret = set_side_data(out, s->format);
> +            if (ret < 0)
> +                return ret;
> +
> +            ret = ff_filter_frame(outlink, out);
> +            if (ret < 0)
> +                return ret;
> +        }
> +        if (retl != AVERROR_EOF)
> +            av_frame_free(&s->left);
> +        if (retr != AVERROR_EOF)
> +            av_frame_free(&s->right);
> +        return ret;
> +    } else if (s->format == AV_STEREO3D_2D) {
> +        out = av_frame_clone(s->left);

How is that supposed to work?
The caller connects two streams, but only the left one is actually read?
Looks awkward/hacky to me, perhaps it'd be better to have a separate filter.

> +        if (!out)
> +            return AVERROR(ENOMEM);
> +    } else {
> +        out = ff_get_video_buffer(outlink, outlink->w, outlink->h);
> +        if (!out)
> +            return AVERROR(ENOMEM);
> +
> +        pack_frame(s, out);
> +    }
> +
> +    ret = av_frame_copy_props(out, s->left);
> +    if (ret < 0)
> +        return ret;
> +
> +    ret = set_side_data(out, s->format);
> +    if (ret < 0)
> +        return ret;
> +
> +    ret = ff_filter_frame(outlink, out);
> +    if (ret < 0)
> +        return ret;
> +
> +    // cleanup keeping a valid frame on EOF
> +    if (retl != AVERROR_EOF)
> +        av_frame_free(&s->left);
> +    if (retr != AVERROR_EOF)
> +        av_frame_free(&s->right);

You could move the cleanup before ff_filter_frame(), then just return the
result of ff_filter_frame().

-- 
Anton Khirnov
_______________________________________________
libav-devel mailing list
[email protected]
https://lists.libav.org/mailman/listinfo/libav-devel

Reply via email to