Quoting Mark Thompson (2017-01-10 00:54:37)
> Takes a raw input stream containing frames with correct timestamps but
> possibly out of order and inserts additional show-existing-frame
> packets to correct the ordering.
> ---
> More specifically, it fixes up the output of VAAPI VP9 with B-frames enabled
> to show the frames in the right order. It may be desirable to follow it with
> vp9_superframe immediately to make a complete 1 packet -> 1 frame stream.
>
>
> libavcodec/Makefile | 1 +
> libavcodec/bitstream_filters.c | 1 +
> libavcodec/vp9_reorder_bsf.c | 412
> +++++++++++++++++++++++++++++++++++++++++
> 3 files changed, 414 insertions(+)
> create mode 100644 libavcodec/vp9_reorder_bsf.c
>
> diff --git a/libavcodec/Makefile b/libavcodec/Makefile
> index 7be9c2880..6e3a5ab66 100644
> --- a/libavcodec/Makefile
> +++ b/libavcodec/Makefile
> @@ -769,6 +769,7 @@ OBJS-$(CONFIG_NOISE_BSF) += noise_bsf.o
> OBJS-$(CONFIG_NULL_BSF) += null_bsf.o
> OBJS-$(CONFIG_REMOVE_EXTRADATA_BSF) += remove_extradata_bsf.o
> OBJS-$(CONFIG_TEXT2MOVSUB_BSF) += movsub_bsf.o
> +OBJS-$(CONFIG_VP9_REORDER_BSF) += vp9_reorder_bsf.o
> OBJS-$(CONFIG_VP9_SUPERFRAME_BSF) += vp9_superframe_bsf.o
> OBJS-$(CONFIG_VP9_SUPERFRAME_SPLIT_BSF) += vp9_superframe_split_bsf.o
>
> diff --git a/libavcodec/bitstream_filters.c b/libavcodec/bitstream_filters.c
> index d46fdad81..5e3a39f4d 100644
> --- a/libavcodec/bitstream_filters.c
> +++ b/libavcodec/bitstream_filters.c
> @@ -38,6 +38,7 @@ extern const AVBitStreamFilter ff_null_bsf;
> extern const AVBitStreamFilter ff_text2movsub_bsf;
> extern const AVBitStreamFilter ff_noise_bsf;
> extern const AVBitStreamFilter ff_remove_extradata_bsf;
> +extern const AVBitStreamFilter ff_vp9_reorder_bsf;
> extern const AVBitStreamFilter ff_vp9_superframe_bsf;
> extern const AVBitStreamFilter ff_vp9_superframe_split_bsf;
>
> diff --git a/libavcodec/vp9_reorder_bsf.c b/libavcodec/vp9_reorder_bsf.c
> new file mode 100644
> index 000000000..c6d54472f
> --- /dev/null
> +++ b/libavcodec/vp9_reorder_bsf.c
> @@ -0,0 +1,412 @@
> +/*
> + * This file is part of Libav.
> + *
> + * Libav is free software; you can redistribute it and/or
> + * modify it under the terms of the GNU Lesser General Public
> + * License as published by the Free Software Foundation; either
> + * version 2.1 of the License, or (at your option) any later version.
> + *
> + * Libav is distributed in the hope that it will be useful,
> + * but WITHOUT ANY WARRANTY; without even the implied warranty of
> + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
> + * Lesser General Public License for more details.
> + *
> + * You should have received a copy of the GNU Lesser General Public
> + * License along with Libav; if not, write to the Free Software
> + * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301
> USA
> + */
> +
> +#include "libavutil/avassert.h"
> +#include "libavutil/intmath.h"
> +#include "libavutil/log.h"
> +#include "libavutil/mem.h"
> +#include "libavutil/opt.h"
> +
> +#include "bitstream.h"
> +#include "bsf.h"
> +#include "put_bits.h"
> +
> +#define FRAME_SLOTS 8
> +
> +typedef struct VP9ReorderFrame {
> + AVPacket *packet;
> + int needs_output;
> + int needs_display;
> +
> + int64_t pts;
> + int64_t sequence;
> + unsigned int slots;
> +
> + unsigned int profile;
> +
> + unsigned int show_existing_frame;
> + unsigned int frame_to_show;
> +
> + unsigned int frame_type;
> + unsigned int show_frame;
> + unsigned int refresh_frame_flags;
> +} VP9ReorderFrame;
> +
> +typedef struct VP9ReorderContext {
> + int64_t sequence;
> + VP9ReorderFrame *slot[FRAME_SLOTS];
> + VP9ReorderFrame *next_frame;
> +} VP9ReorderContext;
> +
> +static void vp9_reorder_frame_free(VP9ReorderFrame **frame)
> +{
> + if (*frame)
> + av_packet_free(&(*frame)->packet);
> + av_freep(frame);
> +}
> +
> +static void vp9_reorder_clear_slot(VP9ReorderContext *ctx, int s)
> +{
> + if (ctx->slot[s]) {
> + ctx->slot[s]->slots &= ~(1 << s);
> + if (ctx->slot[s]->slots == 0)
> + vp9_reorder_frame_free(&ctx->slot[s]);
> + else
> + ctx->slot[s] = NULL;
> + }
> +}
> +
> +static int vp9_reorder_frame_parse(AVBSFContext *bsf, VP9ReorderFrame *frame)
> +{
> + BitstreamContext bc;
> + int err;
> +
> + unsigned int frame_marker;
> + unsigned int profile_low_bit, profile_high_bit, reserved_zero;
> + unsigned int error_resilient_mode;
> + unsigned int frame_sync_code;
> +
> + err = bitstream_init8(&bc, frame->packet->data, frame->packet->size);
> + if (err)
> + return err;
> +
> + frame_marker = bitstream_read(&bc, 2);
> + if (frame_marker != 2) {
> + av_log(bsf, AV_LOG_ERROR, "Invalid frame marker: %u.\n",
> + frame_marker);
> + return AVERROR_INVALIDDATA;
> + }
> +
> + profile_low_bit = bitstream_read_bit(&bc);
> + profile_high_bit = bitstream_read_bit(&bc);
> + frame->profile = (profile_high_bit << 1) | profile_low_bit;
> + if (frame->profile == 3) {
> + reserved_zero = bitstream_read_bit(&bc);
> + if (reserved_zero != 0) {
> + av_log(bsf, AV_LOG_ERROR, "Profile reserved_zero bit set: "
> + "unsupported profile or invalid bitstream.\n");
> + return AVERROR_INVALIDDATA;
> + }
> + }
> +
> + frame->show_existing_frame = bitstream_read_bit(&bc);
> + if (frame->show_existing_frame) {
> + frame->frame_to_show = bitstream_read(&bc, 3);
> + return 0;
> + }
> +
> + frame->frame_type = bitstream_read_bit(&bc);
> + frame->show_frame = bitstream_read_bit(&bc);
> + error_resilient_mode = bitstream_read_bit(&bc);
> +
> + if (frame->frame_type == 0) {
> + frame_sync_code = bitstream_read(&bc, 24);
> + if (frame_sync_code != 0x498342) {
> + av_log(bsf, AV_LOG_ERROR, "Invalid frame sync code: %06x.\n",
> + frame_sync_code);
> + return AVERROR_INVALIDDATA;
> + }
> + frame->refresh_frame_flags = 0xff;
> + } else {
> + unsigned int intra_only;
> +
> + if (frame->show_frame == 0)
> + intra_only = bitstream_read_bit(&bc);
> + else
> + intra_only = 0;
> + if (error_resilient_mode == 0) {
> + // reset_frame_context
> + bitstream_skip(&bc, 2);
> + }
> + if (intra_only) {
> + frame_sync_code = bitstream_read(&bc, 24);
> + if (frame_sync_code != 0x498342) {
> + av_log(bsf, AV_LOG_ERROR, "Invalid frame sync code: "
> + "%06x.\n", frame_sync_code);
> + return AVERROR_INVALIDDATA;
> + }
> + if (frame->profile > 0) {
> + unsigned int color_space;
> + if (frame->profile >= 2) {
> + // ten_or_twelve_bit
> + bitstream_skip(&bc, 1);
> + }
> + color_space = bitstream_read(&bc, 3);
> + if (color_space != 7 /* CS_RGB */) {
> + // color_range
> + bitstream_skip(&bc, 1);
> + if (frame->profile == 1 || frame->profile == 3) {
> + // subsampling
> + bitstream_skip(&bc, 3);
> + }
> + } else {
> + if (frame->profile == 1 || frame->profile == 3)
> + bitstream_skip(&bc, 1);
> + }
> + }
> + frame->refresh_frame_flags = bitstream_read(&bc, 8);
> + } else {
> + frame->refresh_frame_flags = bitstream_read(&bc, 8);
> + }
> + }
> +
> + return 0;
> +}
> +
> +static int vp9_reorder_make_output(AVBSFContext *bsf,
> + AVPacket *out,
> + VP9ReorderFrame *last_frame)
> +{
> + VP9ReorderContext *ctx = bsf->priv_data;
> + VP9ReorderFrame *next_output = last_frame,
> + *next_display = last_frame, *frame;
> + int s, err;
> +
> + for (s = 0; s < FRAME_SLOTS; s++) {
> + frame = ctx->slot[s];
> + if (!frame)
> + continue;
> + if (frame->needs_output && (!next_output ||
> + frame->sequence < next_output->sequence))
> + next_output = frame;
> + if (frame->needs_display && (!next_display ||
> + frame->pts < next_display->pts))
> + next_display = frame;
> + }
> +
> + if (!next_output && !next_display)
> + return AVERROR(EAGAIN);
> +
> + if (!next_display ||
> + next_output->sequence < next_display->sequence)
> + frame = next_output;
> + else
> + frame = next_display;
> +
> + if (frame->needs_output && frame->needs_display &&
> + next_output == next_display) {
> + if (frame->needs_display) {
Isn't this always true due to containing if()?
> + av_log(bsf, AV_LOG_DEBUG, "Output and display frame "
> + "%"PRId64" (%"PRId64") in order.\n",
> + frame->sequence, frame->pts);
> + } else {
> + av_log(bsf, AV_LOG_DEBUG, "Output unshown frame "
> + "%"PRId64" (%"PRId64") in order.\n",
> + frame->sequence, frame->pts);
> + }
> +
> + av_packet_move_ref(out, frame->packet);
> +
> + frame->needs_output = frame->needs_display = 0;
> + } else if (frame->needs_output) {
> + if (frame->needs_display) {
> + av_log(bsf, AV_LOG_DEBUG, "Output frame %"PRId64" "
> + "(%"PRId64") for later display.\n",
> + frame->sequence, frame->pts);
> + } else {
> + av_log(bsf, AV_LOG_DEBUG, "Output unshown frame "
> + "%"PRId64" (%"PRId64") to keep order.\n",
> + frame->sequence, frame->pts);
> + }
> +
> + av_packet_move_ref(out, frame->packet);
> + out->pts = out->dts;
> +
> + frame->needs_output = 0;
> + } else {
> + PutBitContext pb;
> +
> + av_assert0(!frame->needs_output && frame->needs_display);
> +
> + if (frame->slots == 0) {
> + av_log(bsf, AV_LOG_ERROR, "Attempting to display frame "
> + "which is no longer available?\n");
> + frame->needs_display = 0;
> + return AVERROR_INVALIDDATA;
> + }
> +
> + s = ff_ctz(frame->slots);
> + av_assert0(s < FRAME_SLOTS);
> +
> + av_log(bsf, AV_LOG_DEBUG, "Display frame %"PRId64" "
> + "(%"PRId64") from slot %d.\n",
> + frame->sequence, frame->pts, s);
> +
> + frame->packet = av_packet_alloc();
> + if (!frame->packet)
> + return AVERROR(ENOMEM);
> +
> + err = av_new_packet(out, 2);
> + if (err < 0)
> + return err;
> +
> + init_put_bits(&pb, out->data, 2);
> +
> + // frame_marker
> + put_bits(&pb, 2, 2);
> + // profile_low_bit
> + put_bits(&pb, 1, frame->profile & 1);
> + // profile_high_bit
> + put_bits(&pb, 1, (frame->profile >> 1) & 1);
> + if (frame->profile == 3) {
> + // reserved_zero
> + put_bits(&pb, 1, 0);
> + }
> + // show_existing_frame
> + put_bits(&pb, 1, 1);
> + // frame_to_show_map_idx
> + put_bits(&pb, 3, s);
> +
> + while (put_bits_count(&pb) < 16)
> + put_bits(&pb, 1, 0);
> +
> + flush_put_bits(&pb);
> + out->pts = out->dts = frame->pts;
> +
> + frame->needs_display = 0;
> + }
> +
> + return 0;
> +}
> +
> +static int vp9_reorder_filter(AVBSFContext *bsf, AVPacket *out)
> +{
> + VP9ReorderContext *ctx = bsf->priv_data;
> + VP9ReorderFrame *frame;
> + AVPacket *in;
> + int err, s;
> +
> + if (ctx->next_frame) {
> + frame = ctx->next_frame;
> +
> + } else {
> + err = ff_bsf_get_packet(bsf, &in);
> + if (err < 0) {
> + if (err == AVERROR_EOF)
> + return vp9_reorder_make_output(bsf, out, NULL);
> + return err;
> + }
> +
> + if (in->data[in->size - 1] & 0xe0 == 0xc0) {
> + av_log(bsf, AV_LOG_ERROR, "Input in superframes is not "
> + "supported.\n");
> + return AVERROR_INVALIDDATA;
This return and the one below leak in.
> + }
> +
> + frame = av_mallocz(sizeof(*frame));
> + if (!frame)
> + return AVERROR(ENOMEM);
> +
> + frame->packet = in;
> + frame->pts = in->pts;
> + frame->sequence = ++ctx->sequence;
> + err = vp9_reorder_frame_parse(bsf, frame);
> + if (err) {
> + av_log(bsf, AV_LOG_ERROR, "Failed to parse input "
> + "frame: %d.\n", err);
> + goto fail;
> + }
> +
> + frame->needs_output = 1;
> + frame->needs_display = frame->pts != AV_NOPTS_VALUE;
> +
> + if (frame->show_existing_frame)
> + av_log(bsf, AV_LOG_DEBUG, "Show frame %"PRId64" "
> + "(%"PRId64"): show %u.\n", frame->sequence,
> + frame->pts, frame->frame_to_show);
> + else
> + av_log(bsf, AV_LOG_DEBUG, "New frame %"PRId64" "
> + "(%"PRId64"): type %u show %u refresh %02x.\n",
> + frame->sequence, frame->pts, frame->frame_type,
> + frame->show_frame, frame->refresh_frame_flags);
> +
> + ctx->next_frame = frame;
> + }
> +
> + for (s = 0; s < FRAME_SLOTS; s++) {
> + if (!(frame->refresh_frame_flags & 1 << s))
nit: I'd prefer parentheses around (4 << s)
> + continue;
> + if (ctx->slot[s] && ctx->slot[s]->needs_display &&
> + ctx->slot[s]->slots == 1 << s) {
> + // We are overwriting this slot, which is last reference
> + // to the frame previously present in it. In order to be
> + // a valid stream, that frame must already have been
> + // displayed before the pts of the current frame.
> + err = vp9_reorder_make_output(bsf, out, ctx->slot[s]);
> + if (err < 0) {
> + av_log(bsf, AV_LOG_ERROR, "Failed to create "
> + "output overwriting slot %d: %d.\n",
> + s, err);
> + // Clear the slot anyway, so we don't end up
> + // in an infinite loop.
> + vp9_reorder_clear_slot(ctx, s);
> + return AVERROR_INVALIDDATA;
> + }
> + return 0;
> + }
> + vp9_reorder_clear_slot(ctx, s);
> + }
> +
> + for (s = 0; s < FRAME_SLOTS; s++) {
> + if (!(frame->refresh_frame_flags & 1 << s))
> + continue;
> + ctx->slot[s] = frame;
> + }
> + frame->slots = frame->refresh_frame_flags;
> +
> + if (!frame->refresh_frame_flags) {
> + err = vp9_reorder_make_output(bsf, out, frame);
> + if (err < 0) {
> + av_log(bsf, AV_LOG_ERROR, "Failed to create output "
> + "for transient frame.\n");
> + ctx->next_frame = NULL;
> + return AVERROR_INVALIDDATA;
> + }
> + if (!frame->needs_display)
> + ctx->next_frame = NULL;
> + return 0;
> + }
> +
> + ctx->next_frame = NULL;
> + return AVERROR(EAGAIN);
> +
> +fail:
> + vp9_reorder_frame_free(&frame);
> + return err;
> +}
A very general observation I have is that this function has many exit
points so that it's hard to follow what happens.
But I don't have any specific suggestions how to improve that, so feel
free to ignore this comment.
--
Anton Khirnov
_______________________________________________
libav-devel mailing list
[email protected]
https://lists.libav.org/mailman/listinfo/libav-devel