Re: [libav-devel] [PATCH 2/8] lavc: add an option for exporting cropping information to the caller

wm4 Fri, 30 Dec 2016 01:43:18 -0800

On Tue, 27 Dec 2016 19:31:15 +0100
Anton Khirnov <an...@khirnov.net> wrote:


> Also, add generic code for handling cropping, so the decoders can export
> just the cropping size and not bother with the rest.
> ---
>  doc/APIchanges             |   4 ++
>  libavcodec/avcodec.h       |  22 +++++++++
>  libavcodec/decode.c        | 112 ++++++++++++++++++++++++++++++++++++++++++++-
>  libavcodec/internal.h      |   6 +++
>  libavcodec/options_table.h |   1 +
>  libavcodec/version.h       |   4 +-
>  6 files changed, 146 insertions(+), 3 deletions(-)
> 
> diff --git a/doc/APIchanges b/doc/APIchanges
> index 10a2da4..a0ef198 100644
> --- a/doc/APIchanges
> +++ b/doc/APIchanges
> @@ -13,6 +13,10 @@ libavutil:     2015-08-28
>  
>  API changes, most recent first:
>  
> +2016-xx-xx - xxxxxxx - lavc 57.31.0 - avcodec.h
> +  Add AVCodecContext.apply_cropping to control whether cropping
> +  is handled by libavcodec or the caller.
> +
>  2016-xx-xx - xxxxxxx - lavu 55.30.0 - frame.h
>    Add AVFrame.crop_left/right/top/bottom fields for attaching cropping
>    information to video frames.
> diff --git a/libavcodec/avcodec.h b/libavcodec/avcodec.h
> index 95da50b..524e06a 100644
> --- a/libavcodec/avcodec.h
> +++ b/libavcodec/avcodec.h
> @@ -3112,6 +3112,28 @@ typedef struct AVCodecContext {
>       *             This field should be set before avcodec_open2() is called.
>       */
>      AVBufferRef *hw_frames_ctx;
> +
> +    /**
> +     * Video decoding only. Certain video codecs support cropping, meaning 
> that
> +     * only a sub-rectangle of the decoded frame is intended for display.  
> This
> +     * option controls how cropping is handled by libavcodec.
> +     *
> +     * When set to 1 (the default), libavcodec will apply cropping 
> internally.
> +     * I.e. it will modify the output frame width/height fields and offset 
> the
> +     * data pointers (only by as much as possible while preserving 
> alignment, or
> +     * by the full amount if the AV_CODEC_FLAG_UNALIGNED flag is set) so that
> +     * the frames output by the decoder refer only to the cropped area. The
> +     * crop_* fields of the output frames will be zero.
> +     *
> +     * When set to 0, the width/height fields of the output frames will be 
> set
> +     * to the coded dimensions and the crop_* fields will describe the 
> cropping
> +     * rectangle. Applying the cropping is left to the caller.

Maybe the doc could explain why the AVCodecContext or AVCodecParameters
width/height will not match the width/height of the AVFrame if this is
set to 0. From what I understand, containers normally use the cropped
dimensions (?).

> +     *
> +     * When hardware acceleration with opaque output frames is used, the 
> actual
> +     * value of this option is disregarded and libavcodec behaves as if it 
> was
> +     * set to 0.
> +     */

Isn't that last part an implicit API change? This would probably annoy
a lot of people.

> +    int apply_cropping;
>  } AVCodecContext;
>  
>  /**
> diff --git a/libavcodec/decode.c b/libavcodec/decode.c
> index 0fd41ab..65ee8b0 100644
> --- a/libavcodec/decode.c
> +++ b/libavcodec/decode.c
> @@ -29,6 +29,7 @@
>  #include "libavutil/frame.h"
>  #include "libavutil/hwcontext.h"
>  #include "libavutil/imgutils.h"
> +#include "libavutil/intmath.h"
>  
>  #include "avcodec.h"
>  #include "bytestream.h"
> @@ -450,6 +451,106 @@ int attribute_align_arg 
> avcodec_send_packet(AVCodecContext *avctx, const AVPacke
>      return 0;
>  }
>  
> +static int calc_cropping_offsets(size_t offsets[4], const AVFrame *frame,
> +                                 const AVPixFmtDescriptor *desc)
> +{
> +    int i, j;
> +
> +    for (i = 0; frame->data[i]; i++) {
> +        const AVComponentDescriptor *comp = NULL;
> +        int shift_x = (i == 1 || i == 2) ? desc->log2_chroma_w : 0;
> +        int shift_y = (i == 1 || i == 2) ? desc->log2_chroma_h : 0;
> +
> +        if (desc->flags & (AV_PIX_FMT_FLAG_PAL | AV_PIX_FMT_FLAG_PSEUDOPAL) 
> && i == 1) {
> +            offsets[i] = 0;
> +            break;
> +        }
> +
> +        /* find any component descriptor for this plane */
> +        for (j = 0; j < desc->nb_components; j++) {
> +            if (desc->comp[j].plane == i) {
> +                comp = &desc->comp[j];
> +                break;
> +            }
> +        }
> +        if (!comp)
> +            return AVERROR_BUG;
> +
> +        offsets[i] = (frame->crop_top  >> shift_y) * frame->linesize[i] +
> +                     (frame->crop_left >> shift_x) * comp->step;
> +    }
> +
> +    return 0;
> +}
> +
> +static int apply_cropping(AVCodecContext *avctx, AVFrame *frame)
> +{
> +    const AVPixFmtDescriptor *desc;
> +    size_t offsets[4];
> +    int i;
> +
> +    /* make sure we are noisy about decoders returning invalid cropping data 
> */
> +    if (frame->crop_left >= INT_MAX - frame->crop_right        ||
> +        frame->crop_top  >= INT_MAX - frame->crop_bottom       ||

These fields are size_t, so why INT_MAX? Sure, the frame size can't be
larger than INT_MAX anyway, but this is a good opportunity for
nitpicking.

> +        (frame->crop_left + frame->crop_right) >= frame->width ||
> +        (frame->crop_top + frame->crop_bottom) >= frame->height) {
> +        av_log(avctx, AV_LOG_WARNING,
> +               "Invalid cropping information set by a decoder: 
> %zu/%zu/%zu/%zu "
> +               "(frame size %dx%d). This is a bug, please report it\n",
> +               frame->crop_left, frame->crop_right, frame->crop_top, 
> frame->crop_bottom,
> +               frame->width, frame->height);
> +        frame->crop_left   = 0;
> +        frame->crop_right  = 0;
> +        frame->crop_top    = 0;
> +        frame->crop_bottom = 0;
> +        return 0;
> +    }
> +
> +    if (!avctx->apply_cropping)
> +        return 0;
> +
> +    desc = av_pix_fmt_desc_get(frame->format);
> +    if (!desc)
> +        return AVERROR_BUG;
> +
> +    /* Do nothing for hwaccel formats.
> +     * Bitstream formats cannot be easily handled here either (and 
> corresponding
> +     * decoders should not export any cropping anyway), so also do nothing 
> for
> +     * those. */
> +    if (desc->flags & (AV_PIX_FMT_FLAG_BITSTREAM | AV_PIX_FMT_FLAG_HWACCEL))
> +        return 0;
> +
> +    /* calculate the offsets for each plane */
> +    calc_cropping_offsets(offsets, frame, desc);
> +
> +    /* adjust the offsets to avoid breaking alignment */
> +    if (!(avctx->flags & AV_CODEC_FLAG_UNALIGNED)) {
> +        int min_log2_align = INT_MAX;
> +
> +        for (i = 0; frame->data[i]; i++) {
> +            int log2_align = offsets[i] ? av_ctz(offsets[i]) : INT_MAX;
> +            min_log2_align = FFMIN(log2_align, min_log2_align);
> +        }
> +
> +        if (min_log2_align < 5) {
> +            frame->crop_left &= ~((1 << min_log2_align) - 1);
> +            calc_cropping_offsets(offsets, frame, desc);
> +        }
> +    }
> +
> +    for (i = 0; frame->data[i]; i++)
> +        frame->data[i] += offsets[i];
> +
> +    frame->width      -= (frame->crop_left + frame->crop_right);
> +    frame->height     -= (frame->crop_top  + frame->crop_bottom);
> +    frame->crop_left   = 0;
> +    frame->crop_right  = 0;
> +    frame->crop_top    = 0;
> +    frame->crop_bottom = 0;
> +
> +    return 0;
> +}
> +
>  int attribute_align_arg avcodec_receive_frame(AVCodecContext *avctx, AVFrame 
> *frame)
>  {
>      AVCodecInternal *avci = avctx->internal;
> @@ -472,6 +573,14 @@ int attribute_align_arg 
> avcodec_receive_frame(AVCodecContext *avctx, AVFrame *fr
>              return ret;
>      }
>  
> +    if (avctx->codec_type == AVMEDIA_TYPE_VIDEO) {
> +        ret = apply_cropping(avctx, frame);
> +        if (ret < 0) {
> +            av_frame_unref(frame);
> +            return ret;
> +        }
> +    }
> +
>      avctx->frame_number++;
>  
>      return 0;
> @@ -1029,7 +1138,8 @@ int ff_get_buffer(AVCodecContext *avctx, AVFrame 
> *frame, int flags)
>      ret = avctx->get_buffer2(avctx, frame, flags);
>  
>  end:
> -    if (avctx->codec_type == AVMEDIA_TYPE_VIDEO && !override_dimensions) {
> +    if (avctx->codec_type == AVMEDIA_TYPE_VIDEO && !override_dimensions &&
> +        !(avctx->codec->caps_internal & FF_CODEC_CAP_EXPORTS_CROPPING)) {
>          frame->width  = avctx->width;
>          frame->height = avctx->height;

Hm, not sure what's happening here. The existing code looks a bit
fishy. But I guess excluding this if cropping is "properly" done is the
right thing.

>      }
> diff --git a/libavcodec/internal.h b/libavcodec/internal.h
> index 796d45f..5b82504 100644
> --- a/libavcodec/internal.h
> +++ b/libavcodec/internal.h
> @@ -53,6 +53,12 @@
>   * from the input AVPacket.
>   */
>  #define FF_CODEC_CAP_SETS_PKT_DTS           (1 << 2)
> +/**
> + * The decoder sets the cropping fields in the output frames manually.
> + * If this cap is set, the generic code will initialize output frame
> + * dimensions to coded rather than display values.
> + */
> +#define FF_CODEC_CAP_EXPORTS_CROPPING       (1 << 3)
>  
>  #ifdef DEBUG
>  #   define ff_dlog(ctx, ...) av_log(ctx, AV_LOG_DEBUG, __VA_ARGS__)
> diff --git a/libavcodec/options_table.h b/libavcodec/options_table.h
> index 4deb223..3ac53fb 100644
> --- a/libavcodec/options_table.h
> +++ b/libavcodec/options_table.h
> @@ -531,6 +531,7 @@ static const AVOption avcodec_options[] = {
>  #if FF_API_SIDEDATA_ONLY_PKT
>  {"side_data_only_packets", NULL, OFFSET(side_data_only_packets), 
> AV_OPT_TYPE_INT, { .i64 = 1 }, 0, 1, A|V|E },
>  #endif
> +{"apply_cropping", NULL, OFFSET(apply_cropping), AV_OPT_TYPE_INT, { .i64 = 1 
> }, 0, 1, V | D },
>  {NULL},
>  };
>  
> diff --git a/libavcodec/version.h b/libavcodec/version.h
> index 5b6fb6c..df0c01f 100644
> --- a/libavcodec/version.h
> +++ b/libavcodec/version.h
> @@ -28,8 +28,8 @@
>  #include "libavutil/version.h"
>  
>  #define LIBAVCODEC_VERSION_MAJOR 57
> -#define LIBAVCODEC_VERSION_MINOR 30
> -#define LIBAVCODEC_VERSION_MICRO  2
> +#define LIBAVCODEC_VERSION_MINOR 31
> +#define LIBAVCODEC_VERSION_MICRO  0
>  
>  #define LIBAVCODEC_VERSION_INT  AV_VERSION_INT(LIBAVCODEC_VERSION_MAJOR, \
>                                                 LIBAVCODEC_VERSION_MINOR, \

_______________________________________________
libav-devel mailing list
libav-devel@libav.org
https://lists.libav.org/mailman/listinfo/libav-devel

Re: [libav-devel] [PATCH 2/8] lavc: add an option for exporting cropping information to the caller

Reply via email to