On Tue, 27 Dec 2016 19:31:15 +0100
Anton Khirnov <[email protected]> wrote:
> Also, add generic code for handling cropping, so the decoders can export
> just the cropping size and not bother with the rest.
> ---
> doc/APIchanges | 4 ++
> libavcodec/avcodec.h | 22 +++++++++
> libavcodec/decode.c | 112
> ++++++++++++++++++++++++++++++++++++++++++++-
> libavcodec/internal.h | 6 +++
> libavcodec/options_table.h | 1 +
> libavcodec/version.h | 4 +-
> 6 files changed, 146 insertions(+), 3 deletions(-)
>
> diff --git a/doc/APIchanges b/doc/APIchanges
> index 10a2da4..a0ef198 100644
> --- a/doc/APIchanges
> +++ b/doc/APIchanges
> @@ -13,6 +13,10 @@ libavutil: 2015-08-28
>
> API changes, most recent first:
>
> +2016-xx-xx - xxxxxxx - lavc 57.31.0 - avcodec.h
> + Add AVCodecContext.apply_cropping to control whether cropping
> + is handled by libavcodec or the caller.
> +
> 2016-xx-xx - xxxxxxx - lavu 55.30.0 - frame.h
> Add AVFrame.crop_left/right/top/bottom fields for attaching cropping
> information to video frames.
> diff --git a/libavcodec/avcodec.h b/libavcodec/avcodec.h
> index 95da50b..524e06a 100644
> --- a/libavcodec/avcodec.h
> +++ b/libavcodec/avcodec.h
> @@ -3112,6 +3112,28 @@ typedef struct AVCodecContext {
> * This field should be set before avcodec_open2() is called.
> */
> AVBufferRef *hw_frames_ctx;
> +
> + /**
> + * Video decoding only. Certain video codecs support cropping, meaning
> that
> + * only a sub-rectangle of the decoded frame is intended for display.
> This
> + * option controls how cropping is handled by libavcodec.
> + *
> + * When set to 1 (the default), libavcodec will apply cropping
> internally.
> + * I.e. it will modify the output frame width/height fields and offset
> the
> + * data pointers (only by as much as possible while preserving
> alignment, or
> + * by the full amount if the AV_CODEC_FLAG_UNALIGNED flag is set) so that
> + * the frames output by the decoder refer only to the cropped area. The
> + * crop_* fields of the output frames will be zero.
> + *
> + * When set to 0, the width/height fields of the output frames will be
> set
> + * to the coded dimensions and the crop_* fields will describe the
> cropping
> + * rectangle. Applying the cropping is left to the caller.
Maybe this could explain why the AVCodecContext or AVCodecParameters
width/height will not match the width/height of the AVFrame if it's set
to 0. From what I understand, containers will normally use the cropped
dimensions (?).
> + *
> + * When hardware acceleration with opaque output frames is used, the
> actual
> + * value of this option is disregarded and libavcodec behaves as if it
> was
> + * set to 0.
> + */
Isn't that last part an implicit API change? This would probably annoy
a lot of people.
> + int apply_cropping;
> } AVCodecContext;
>
> /**
> diff --git a/libavcodec/decode.c b/libavcodec/decode.c
> index 0fd41ab..65ee8b0 100644
> --- a/libavcodec/decode.c
> +++ b/libavcodec/decode.c
> @@ -29,6 +29,7 @@
> #include "libavutil/frame.h"
> #include "libavutil/hwcontext.h"
> #include "libavutil/imgutils.h"
> +#include "libavutil/intmath.h"
>
> #include "avcodec.h"
> #include "bytestream.h"
> @@ -450,6 +451,106 @@ int attribute_align_arg
> avcodec_send_packet(AVCodecContext *avctx, const AVPacke
> return 0;
> }
>
> +static int calc_cropping_offsets(size_t offsets[4], const AVFrame *frame,
> + const AVPixFmtDescriptor *desc)
> +{
> + int i, j;
> +
> + for (i = 0; frame->data[i]; i++) {
> + const AVComponentDescriptor *comp = NULL;
> + int shift_x = (i == 1 || i == 2) ? desc->log2_chroma_w : 0;
> + int shift_y = (i == 1 || i == 2) ? desc->log2_chroma_h : 0;
> +
> + if (desc->flags & (AV_PIX_FMT_FLAG_PAL | AV_PIX_FMT_FLAG_PSEUDOPAL)
> && i == 1) {
> + offsets[i] = 0;
> + break;
> + }
> +
> + /* find any component descriptor for this plane */
> + for (j = 0; j < desc->nb_components; j++) {
> + if (desc->comp[j].plane == i) {
> + comp = &desc->comp[j];
> + break;
> + }
> + }
> + if (!comp)
> + return AVERROR_BUG;
> +
> + offsets[i] = (frame->crop_top >> shift_y) * frame->linesize[i] +
> + (frame->crop_left >> shift_x) * comp->step;
> + }
> +
> + return 0;
> +}
> +
> +static int apply_cropping(AVCodecContext *avctx, AVFrame *frame)
> +{
> + const AVPixFmtDescriptor *desc;
> + size_t offsets[4];
> + int i;
> +
> + /* make sure we are noisy about decoders returning invalid cropping data
> */
> + if (frame->crop_left >= INT_MAX - frame->crop_right ||
> + frame->crop_top >= INT_MAX - frame->crop_bottom ||
These fields are size_t, so why INT_MAX? Sure, the frame size can't be
larger than INT_MAX anyway, but this is a good opportunity for
nitpicking.
> + (frame->crop_left + frame->crop_right) >= frame->width ||
> + (frame->crop_top + frame->crop_bottom) >= frame->height) {
> + av_log(avctx, AV_LOG_WARNING,
> + "Invalid cropping information set by a decoder:
> %zu/%zu/%zu/%zu "
> + "(frame size %dx%d). This is a bug, please report it\n",
> + frame->crop_left, frame->crop_right, frame->crop_top,
> frame->crop_bottom,
> + frame->width, frame->height);
> + frame->crop_left = 0;
> + frame->crop_right = 0;
> + frame->crop_top = 0;
> + frame->crop_bottom = 0;
> + return 0;
> + }
> +
> + if (!avctx->apply_cropping)
> + return 0;
> +
> + desc = av_pix_fmt_desc_get(frame->format);
> + if (!desc)
> + return AVERROR_BUG;
> +
> + /* Do nothing for hwaccel formats.
> + * Bitstream formats cannot be easily handled here either (and
> corresponding
> + * decoders should not export any cropping anyway), so also do nothing
> for
> + * those. */
> + if (desc->flags & (AV_PIX_FMT_FLAG_BITSTREAM | AV_PIX_FMT_FLAG_HWACCEL))
> + return 0;
> +
> + /* calculate the offsets for each plane */
> + calc_cropping_offsets(offsets, frame, desc);
> +
> + /* adjust the offsets to avoid breaking alignment */
> + if (!(avctx->flags & AV_CODEC_FLAG_UNALIGNED)) {
> + int min_log2_align = INT_MAX;
> +
> + for (i = 0; frame->data[i]; i++) {
> + int log2_align = offsets[i] ? av_ctz(offsets[i]) : INT_MAX;
> + min_log2_align = FFMIN(log2_align, min_log2_align);
> + }
> +
> + if (min_log2_align < 5) {
> + frame->crop_left &= ~((1 << min_log2_align) - 1);
> + calc_cropping_offsets(offsets, frame, desc);
> + }
> + }
> +
> + for (i = 0; frame->data[i]; i++)
> + frame->data[i] += offsets[i];
> +
> + frame->width -= (frame->crop_left + frame->crop_right);
> + frame->height -= (frame->crop_top + frame->crop_bottom);
> + frame->crop_left = 0;
> + frame->crop_right = 0;
> + frame->crop_top = 0;
> + frame->crop_bottom = 0;
> +
> + return 0;
> +}
> +
> int attribute_align_arg avcodec_receive_frame(AVCodecContext *avctx, AVFrame
> *frame)
> {
> AVCodecInternal *avci = avctx->internal;
> @@ -472,6 +573,14 @@ int attribute_align_arg
> avcodec_receive_frame(AVCodecContext *avctx, AVFrame *fr
> return ret;
> }
>
> + if (avctx->codec_type == AVMEDIA_TYPE_VIDEO) {
> + ret = apply_cropping(avctx, frame);
> + if (ret < 0) {
> + av_frame_unref(frame);
> + return ret;
> + }
> + }
> +
> avctx->frame_number++;
>
> return 0;
> @@ -1029,7 +1138,8 @@ int ff_get_buffer(AVCodecContext *avctx, AVFrame
> *frame, int flags)
> ret = avctx->get_buffer2(avctx, frame, flags);
>
> end:
> - if (avctx->codec_type == AVMEDIA_TYPE_VIDEO && !override_dimensions) {
> + if (avctx->codec_type == AVMEDIA_TYPE_VIDEO && !override_dimensions &&
> + !(avctx->codec->caps_internal & FF_CODEC_CAP_EXPORTS_CROPPING)) {
> frame->width = avctx->width;
> frame->height = avctx->height;
Hm, not sure what's happening here. The existing code looks a bit
fishy. But I guess skipping this width/height override when the decoder
exports cropping "properly" is the right thing.
> }
> diff --git a/libavcodec/internal.h b/libavcodec/internal.h
> index 796d45f..5b82504 100644
> --- a/libavcodec/internal.h
> +++ b/libavcodec/internal.h
> @@ -53,6 +53,12 @@
> * from the input AVPacket.
> */
> #define FF_CODEC_CAP_SETS_PKT_DTS (1 << 2)
> +/**
> + * The decoder sets the cropping fields in the output frames manually.
> + * If this cap is set, the generic code will initialize output frame
> + * dimensions to coded rather than display values.
> + */
> +#define FF_CODEC_CAP_EXPORTS_CROPPING (1 << 3)
>
> #ifdef DEBUG
> # define ff_dlog(ctx, ...) av_log(ctx, AV_LOG_DEBUG, __VA_ARGS__)
> diff --git a/libavcodec/options_table.h b/libavcodec/options_table.h
> index 4deb223..3ac53fb 100644
> --- a/libavcodec/options_table.h
> +++ b/libavcodec/options_table.h
> @@ -531,6 +531,7 @@ static const AVOption avcodec_options[] = {
> #if FF_API_SIDEDATA_ONLY_PKT
> {"side_data_only_packets", NULL, OFFSET(side_data_only_packets),
> AV_OPT_TYPE_INT, { .i64 = 1 }, 0, 1, A|V|E },
> #endif
> +{"apply_cropping", NULL, OFFSET(apply_cropping), AV_OPT_TYPE_INT, { .i64 = 1
> }, 0, 1, V | D },
> {NULL},
> };
>
> diff --git a/libavcodec/version.h b/libavcodec/version.h
> index 5b6fb6c..df0c01f 100644
> --- a/libavcodec/version.h
> +++ b/libavcodec/version.h
> @@ -28,8 +28,8 @@
> #include "libavutil/version.h"
>
> #define LIBAVCODEC_VERSION_MAJOR 57
> -#define LIBAVCODEC_VERSION_MINOR 30
> -#define LIBAVCODEC_VERSION_MICRO 2
> +#define LIBAVCODEC_VERSION_MINOR 31
> +#define LIBAVCODEC_VERSION_MICRO 0
>
> #define LIBAVCODEC_VERSION_INT AV_VERSION_INT(LIBAVCODEC_VERSION_MAJOR, \
> LIBAVCODEC_VERSION_MINOR, \
_______________________________________________
libav-devel mailing list
[email protected]
https://lists.libav.org/mailman/listinfo/libav-devel