On 2017/6/24 7:39, Mark Thompson wrote:
> This is able to modify some header metadata found in the SPS/VUI,
> and can also add/remove AUDs and insert user data in SEI NAL units.
> ---
>  doc/bitstream_filters.texi     |  47 +++++
>  libavcodec/Makefile            |   2 +
>  libavcodec/bitstream_filters.c |   1 +
>  libavcodec/h264_metadata_bsf.c | 462 +++++++++++++++++++++++++++++++++++++++++
>  4 files changed, 512 insertions(+)
>  create mode 100644 libavcodec/h264_metadata_bsf.c
> 
> diff --git a/doc/bitstream_filters.texi b/doc/bitstream_filters.texi
> index af14b67ad..474a9d5c1 100644
> --- a/doc/bitstream_filters.texi
> +++ b/doc/bitstream_filters.texi
> @@ -39,6 +39,53 @@ When this option is enabled, the long-term headers are removed from the
>  bitstream after extraction.
>  @end table
>  
> +@section h264_metadata
> +
> +Modify metadata attached to the H.264 stream.
> +
> +@table @option
> +@item aud
> +Insert or remove AUD NAL units in all access units of the stream.
> +
> +@table @samp
> +@item insert
> +@item remove
> +@end table
> +
> +@item sample_aspect_ratio
> +Set the sample aspect ratio in the stream in the VUI parameters.
> +
> +@item video_format
> +@item video_full_range_flag
> +Set the video format in the stream (see H.264 section E.2.1 and
> +table E-2).
> +
> +@item colour_primaries
> +@item transfer_characteristics
> +@item matrix_coefficients
> +Set the colour description in the stream (see H.264 section E.2.1
> +and tables E-3, E-4 and E-5).
> +
> +@item chroma_sample_loc_type
> +Set the chroma sample location in the stream (see H.264 section
> +E.2.1 and figure E-1).
> +
> +@item frame_rate
> +@item fixed_frame_rate_flag
> +Set the frame rate in the VUI parameters (num_units_in_tick /
> +time_scale).  Note that this is likely to be overridden by container
> +parameters when the stream is in a container.
> +
> +@item sei_user_data
> +Insert a string as SEI unregistered user data.  The argument must
> +be of the form @emph{UUID+string}, where the UUID is as hex digits
> +possibly separated by hyphens, and the string can be anything.
> +
> +For example, @samp{086f3693-b7b3-4f2c-9653-21492feee5b8+hello} will
> +insert the string ``hello'' associated with the given UUID.
> +
> +@end table
> +
>  @section h264_mp4toannexb
>  
>  @section imx_dump_header
> diff --git a/libavcodec/Makefile b/libavcodec/Makefile
> index b6c34444d..10a05adf2 100644
> --- a/libavcodec/Makefile
> +++ b/libavcodec/Makefile
> @@ -768,6 +768,8 @@ OBJS-$(CONFIG_CHOMP_BSF)                  += chomp_bsf.o
>  OBJS-$(CONFIG_DUMP_EXTRADATA_BSF)         += dump_extradata_bsf.o
>  OBJS-$(CONFIG_EXTRACT_EXTRADATA_BSF)      += extract_extradata_bsf.o    \
>                                               h2645_parse.o
> +OBJS-$(CONFIG_H264_METADATA_BSF)          += h264_metadata_bsf.o \
> +                                             cbs.o cbs_h2645.o
>  OBJS-$(CONFIG_H264_MP4TOANNEXB_BSF)       += h264_mp4toannexb_bsf.o
>  OBJS-$(CONFIG_HEVC_MP4TOANNEXB_BSF)       += hevc_mp4toannexb_bsf.o
>  OBJS-$(CONFIG_IMX_DUMP_HEADER_BSF)        += imx_dump_header_bsf.o
> diff --git a/libavcodec/bitstream_filters.c b/libavcodec/bitstream_filters.c
> index 2e423acaf..4ad50508c 100644
> --- a/libavcodec/bitstream_filters.c
> +++ b/libavcodec/bitstream_filters.c
> @@ -28,6 +28,7 @@ extern const AVBitStreamFilter ff_aac_adtstoasc_bsf;
>  extern const AVBitStreamFilter ff_chomp_bsf;
>  extern const AVBitStreamFilter ff_dump_extradata_bsf;
>  extern const AVBitStreamFilter ff_extract_extradata_bsf;
> +extern const AVBitStreamFilter ff_h264_metadata_bsf;
>  extern const AVBitStreamFilter ff_h264_mp4toannexb_bsf;
>  extern const AVBitStreamFilter ff_hevc_mp4toannexb_bsf;
>  extern const AVBitStreamFilter ff_imx_dump_header_bsf;
> diff --git a/libavcodec/h264_metadata_bsf.c b/libavcodec/h264_metadata_bsf.c
> new file mode 100644
> index 000000000..4eb58ce45
> --- /dev/null
> +++ b/libavcodec/h264_metadata_bsf.c
> @@ -0,0 +1,462 @@
> +/*
> + * This file is part of Libav.
> + *
> + * Libav is free software; you can redistribute it and/or
> + * modify it under the terms of the GNU Lesser General Public
> + * License as published by the Free Software Foundation; either
> + * version 2.1 of the License, or (at your option) any later version.
> + *
> + * Libav is distributed in the hope that it will be useful,
> + * but WITHOUT ANY WARRANTY; without even the implied warranty of
> + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
> + * Lesser General Public License for more details.
> + *
> + * You should have received a copy of the GNU Lesser General Public
> + * License along with Libav; if not, write to the Free Software
> + * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
> + */
> +
> +#include "libavutil/common.h"
> +#include "libavutil/opt.h"
> +
> +#include "bsf.h"
> +#include "cbs.h"
> +#include "cbs_h264.h"
> +#include "h264.h"
> +#include "h264_sei.h"
> +
> +enum {
> +    PASS,
> +    INSERT,
> +    REMOVE,
> +};
> +
> +typedef struct H264MetadataContext {
> +    const AVClass *class;
> +
> +    CodedBitstreamContext cbc;
> +    CodedBitstreamFragment access_unit;
> +
> +    H264RawAUD aud_nal;
> +    H264RawSEI sei_nal;
> +
> +    int aud;
> +
> +    AVRational sample_aspect_ratio;
> +
> +    int video_format;
> +    int video_full_range_flag;
> +    int colour_primaries;
> +    int transfer_characteristics;
> +    int matrix_coefficients;
> +
> +    int chroma_sample_loc_type;
> +
> +    AVRational frame_rate;
> +    int fixed_frame_rate_flag;
> +
> +    const char *sei_user_data;
> +} H264MetadataContext;
> +
> +
> +static int h264_metadata_update_sps(AVBSFContext *bsf,
> +                                    H264RawSPS *sps)
> +{
> +    H264MetadataContext *ctx = bsf->priv_data;
> +    int need_vui = 0;
> +
> +    if (ctx->sample_aspect_ratio.num && ctx->sample_aspect_ratio.den) {
> +        // Table E-1.
> +        static const AVRational sar_idc[] = {
> +            {   0,  0 }, // Unspecified (never written here).
> +            {   1,  1 }, {  12, 11 }, {  10, 11 }, {  16, 11 },
> +            {  40, 33 }, {  24, 11 }, {  20, 11 }, {  32, 11 },
> +            {  80, 33 }, {  18, 11 }, {  15, 11 }, {  64, 33 },
> +            { 160, 99 }, {   4,  3 }, {   3,  2 }, {   2,  1 },
> +        };
> +        int num, den, i;
> +
> +        av_reduce(&num, &den, ctx->sample_aspect_ratio.num,
> +                  ctx->sample_aspect_ratio.den, 65535);
> +
> +        for (i = 1; i < FF_ARRAY_ELEMS(sar_idc); i++) {
> +            if (num == sar_idc[i].num &&
> +                den == sar_idc[i].den)
> +                break;
> +        }
> +        if (i == FF_ARRAY_ELEMS(sar_idc)) {
> +            sps->vui.aspect_ratio_idc = 255;
> +            sps->vui.sar_width  = num;
> +            sps->vui.sar_height = den;
> +        } else {
> +            sps->vui.aspect_ratio_idc = i;
> +        }
> +        sps->vui.aspect_ratio_info_present_flag = 1;
> +        need_vui = 1;
> +    }
> +
> +#define SET_OR_INFER(field, value, present_flag, infer) do { \
> +        if (value >= 0) { \
> +            field = value; \
> +            need_vui = 1; \
> +        } else if (!present_flag) \
> +            field = infer; \
> +    } while (0)
> +
> +    if (ctx->video_format             >= 0 ||
> +        ctx->video_full_range_flag    >= 0 ||
> +        ctx->colour_primaries         >= 0 ||
> +        ctx->transfer_characteristics >= 0 ||
> +        ctx->matrix_coefficients      >= 0) {
> +
> +        SET_OR_INFER(sps->vui.video_format, ctx->video_format,
> +                     sps->vui.video_signal_type_present_flag, 5);
> +
> +        SET_OR_INFER(sps->vui.video_full_range_flag,
> +                     ctx->video_full_range_flag,
> +                     sps->vui.video_signal_type_present_flag, 0);
> +
> +        if (ctx->colour_primaries         >= 0 ||
> +            ctx->transfer_characteristics >= 0 ||
> +            ctx->matrix_coefficients      >= 0) {
> +
> +            SET_OR_INFER(sps->vui.colour_primaries,
> +                         ctx->colour_primaries,
> +                         sps->vui.colour_description_present_flag, 2);
> +
> +            SET_OR_INFER(sps->vui.transfer_characteristics,
> +                         ctx->transfer_characteristics,
> +                         sps->vui.colour_description_present_flag, 2);
> +
> +            SET_OR_INFER(sps->vui.matrix_coefficients,
> +                         ctx->matrix_coefficients,
> +                         sps->vui.colour_description_present_flag, 2);
> +
> +            sps->vui.colour_description_present_flag = 1;
> +        }
> +        sps->vui.video_signal_type_present_flag = 1;
> +        need_vui = 1;
> +    }
> +
> +    if (ctx->chroma_sample_loc_type >= 0) {
> +        sps->vui.chroma_sample_loc_type_top_field =
> +            ctx->chroma_sample_loc_type;
> +        sps->vui.chroma_sample_loc_type_bottom_field =
> +            ctx->chroma_sample_loc_type;
> +        sps->vui.chroma_loc_info_present_flag = 1;
> +        need_vui = 1;
> +    }
> +
> +    if (ctx->frame_rate.num && ctx->frame_rate.den) {
> +        int num, den;
> +
> +        av_reduce(&num, &den, 2 * ctx->frame_rate.num, ctx->frame_rate.den,
> +                  UINT32_MAX > INT_MAX ? UINT32_MAX : INT_MAX);
> +
> +        sps->vui.time_scale        = num;
> +        sps->vui.num_units_in_tick = den;
> +
> +        sps->vui.timing_info_present_flag = 1;
> +        need_vui = 1;
> +    }
> +    SET_OR_INFER(sps->vui.fixed_frame_rate_flag,
> +                 ctx->fixed_frame_rate_flag,
> +                 sps->vui.timing_info_present_flag, 0);
> +
> +    if (need_vui)
> +        sps->vui_parameters_present_flag = 1;
> +
> +    return 0;
> +}
> +
> +static int h264_metadata_filter(AVBSFContext *bsf, AVPacket *out)
> +{
> +    H264MetadataContext *ctx = bsf->priv_data;
> +    AVPacket *in = NULL;
> +    CodedBitstreamFragment *au = &ctx->access_unit;
> +    int err, i, j, has_sps;
> +    char *sei_udu_string = NULL;
> +
> +    err = ff_bsf_get_packet(bsf, &in);
> +    if (err < 0)
> +        goto fail;
> +
> +    err = ff_cbs_read_packet(&ctx->cbc, au, in);
> +    if (err < 0) {
> +        av_log(bsf, AV_LOG_ERROR, "Failed to read packet.\n");
> +        goto fail;
> +    }
> +
> +    if (au->nb_units == 0) {
> +        av_log(bsf, AV_LOG_ERROR, "No NAL units in packet.\n");
> +        err = AVERROR_INVALIDDATA;
> +        goto fail;
> +    }
> +
> +    // If an AUD is present, it must be the first NAL unit.
> +    if (au->units[0].type == H264_NAL_AUD) {
> +        if (ctx->aud == REMOVE)
> +            ff_cbs_delete_unit(&ctx->cbc, au, 0);
> +    } else {
> +        if (ctx->aud == INSERT) {
> +            static const int primary_pic_type_table[] = {
> +                0x084, // 2, 7
> +                0x0a5, // 0, 2, 5, 7
> +                0x0e7, // 0, 1, 2, 5, 6, 7
> +                0x210, // 4, 9
> +                0x318, // 3, 4, 8, 9
> +                0x294, // 2, 4, 7, 9
> +                0x3bd, // 0, 2, 3, 4, 5, 7, 8, 9
> +                0x3ff, // 0, 1, 2, 3, 4, 5, 6, 7, 8, 9
> +            };
> +            int primary_pic_type_mask = 0xff;
> +            H264RawAUD *aud = &ctx->aud_nal;
> +
> +            for (i = 0; i < au->nb_units; i++) {
> +                if (au->units[i].type == H264_NAL_SLICE ||
> +                    au->units[i].type == H264_NAL_IDR_SLICE) {
> +                    H264RawSlice *slice = au->units[i].content;
> +                    for (j = 0; j < FF_ARRAY_ELEMS(primary_pic_type_table); 
> j++) {
> +                         if (!(primary_pic_type_table[j] &
> +                               (1 << slice->header.slice_type)))
> +                             primary_pic_type_mask &= ~(1 << j);
> +                    }
> +                }
> +            }
> +            for (j = 0; j < FF_ARRAY_ELEMS(primary_pic_type_table); j++)
> +                if (primary_pic_type_mask & (1 << j))
> +                    break;
> +            if (j >= FF_ARRAY_ELEMS(primary_pic_type_table)) {
> +                av_log(bsf, AV_LOG_ERROR, "No usable primary_pic_type: "
> +                       "invalid slice types?\n");
> +                err = AVERROR_INVALIDDATA;
> +                goto fail;
> +            }
> +
> +            aud->nal_unit_header.nal_unit_type = H264_NAL_AUD;
> +            aud->primary_pic_type = j;
> +
> +            err = ff_cbs_insert_unit_content(&ctx->cbc, au,
> +                                             0, H264_NAL_AUD, aud);
> +            if (err) {
> +                av_log(bsf, AV_LOG_ERROR, "Failed to insert AUD.\n");
> +                goto fail;
> +            }
> +        }
> +    }
> +
> +    has_sps = 0;
> +    for (i = 0; i < au->nb_units; i++) {
> +        if (au->units[i].type == H264_NAL_SPS) {
> +            h264_metadata_update_sps(bsf, au->units[i].content);
> +            has_sps = 1;
> +        }
> +    }
> +
> +    // Only insert the SEI in access units containing SPSs.
> +    if (has_sps && ctx->sei_user_data) {
> +        H264RawSEI *sei;
> +        H264RawSEIPayload *payload;
> +        H264RawSEIUserDataUnregistered *udu;
> +        int sei_pos;
> +
> +        for (i = 0; i < au->nb_units; i++) {
> +            if (au->units[i].type == H264_NAL_SEI ||
> +                au->units[i].type == H264_NAL_SLICE ||
> +                au->units[i].type == H264_NAL_IDR_SLICE)
> +                break;
> +        }
> +        sei_pos = i;
> +
> +        if (sei_pos < au->nb_units &&
> +            au->units[sei_pos].type == H264_NAL_SEI) {
> +            sei = au->units[sei_pos].content;
> +        } else {
> +            sei = &ctx->sei_nal;
> +            memset(sei, 0, sizeof(*sei));
> +
> +            sei->nal_unit_header.nal_unit_type = H264_NAL_SEI;
> +
> +            err = ff_cbs_insert_unit_content(&ctx->cbc, au,
> +                                             sei_pos, H264_NAL_SEI, sei);
> +            if (err < 0) {
> +                av_log(bsf, AV_LOG_ERROR, "Failed to insert SEI.\n");
> +                goto fail;
> +            }
> +        }
> +
> +        payload = &sei->payload[sei->payload_count];
> +
> +        payload->payload_type = H264_SEI_TYPE_USER_DATA_UNREGISTERED;
> +        udu = &payload->user_data_unregistered;
> +
> +        for (i = j = 0; j < 32 && ctx->sei_user_data[i]; i++) {
> +            int c, v;
> +            c = ctx->sei_user_data[i];
> +            if (c == '-')
> +                continue;
> +            else if (c >= '0' && c <= '9')
> +                v = c - '0';
> +            else if (c >= 'A' && c <= 'F')
> +                v = c - 'A' + 10;
> +            else if (c >= 'a' && c <= 'f')
> +                v = c - 'a' + 10;
> +            else
> +                goto invalid_user_data;

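How about simplifying the hex-digit parsing with the helpers from
libavutil/avstring.h? Something like:

            if (c == '-') {
                continue;
            } else if (av_isxdigit(c)) {
                c = av_tolower(c);
                v = (c <= '9' ? c - '0' : c - 'a' + 10);
            } else {
                goto invalid_user_data;
            }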

> +            if (i & 1)
> +                udu->uuid_iso_iec_11578[j / 2] |= v;
> +            else
> +                udu->uuid_iso_iec_11578[j / 2] = v << 4;
> +            ++j;
> +        }
> +        if (j == 32 && ctx->sei_user_data[i] == '+') {
> +            sei_udu_string = av_strdup(ctx->sei_user_data + i + 1);
> +            if (!sei_udu_string) {
> +                err = AVERROR(ENOMEM);
> +                goto sei_fail;
> +            }
> +
> +            udu->data = sei_udu_string;
> +            udu->data_length = strlen(sei_udu_string);
> +
> +            payload->payload_size = 16 + udu->data_length;
> +
> +        } else {
> +        invalid_user_data:
> +            av_log(bsf, AV_LOG_ERROR, "Invalid user data: "
> +                   "must be \"UUID+string\".\n");
> +            err = AVERROR(EINVAL);
> +        sei_fail:
> +            memset(payload, 0, sizeof(&payload));
> +            goto fail;
> +        }
> +
> +        ++sei->payload_count;
> +    }
> +
> +    err = ff_cbs_write_packet(&ctx->cbc, out, au);
> +    if (err < 0) {
> +        av_log(bsf, AV_LOG_ERROR, "Failed to write packet.\n");
> +        goto fail;
> +    }
> +
> +    err = av_packet_copy_props(out, in);
> +    if (err < 0)
> +        goto fail;
> +
> +    err = 0;
> +fail:
> +    ff_cbs_fragment_uninit(&ctx->cbc, au);
> +    av_freep(&sei_udu_string);
> +
> +    av_packet_free(&in);
> +
> +    return err;
> +}
> +
> +static int h264_metadata_init(AVBSFContext *bsf)
> +{
> +    H264MetadataContext *ctx = bsf->priv_data;
> +    CodedBitstreamFragment *au = &ctx->access_unit;
> +    int err, i;
> +
> +    err = ff_cbs_init(&ctx->cbc, AV_CODEC_ID_H264, bsf);
> +    if (err < 0)
> +        return err;
> +
> +    if (bsf->par_in->extradata) {
> +        err = ff_cbs_read_extradata(&ctx->cbc, au, bsf->par_in);
> +        if (err < 0) {
> +            av_log(bsf, AV_LOG_ERROR, "Failed to read extradata.\n");
> +            return err;
> +        }
> +
> +        for (i = 0; i < au->nb_units; i++) {
> +            if (au->units[i].type == H264_NAL_SPS)
> +                h264_metadata_update_sps(bsf, au->units[i].content);
> +        }
> +
> +        err = ff_cbs_write_extradata(&ctx->cbc, bsf->par_out, au);
> +        if (err < 0) {
> +            av_log(bsf, AV_LOG_ERROR, "Failed to write extradata.\n");
> +            return err;
> +        }
> +
> +        ff_cbs_fragment_uninit(&ctx->cbc, au);
> +    }
> +
> +    return 0;
> +}
> +
> +static void h264_metadata_close(AVBSFContext *bsf)
> +{
> +    H264MetadataContext *ctx = bsf->priv_data;
> +    ff_cbs_close(&ctx->cbc);
> +}
> +
> +#define OFFSET(x) offsetof(H264MetadataContext, x)
> +static const AVOption h264_metadata_options[] = {
> +    { "aud", "Access Unit Delimiter NAL units",
> +        OFFSET(aud), AV_OPT_TYPE_INT,
> +        { .i64 = PASS }, PASS, REMOVE, 0, "aud" },
> +    { "pass",   NULL, 0, AV_OPT_TYPE_CONST, { .i64 = PASS   }, .unit = "aud" 
> },
> +    { "insert", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = INSERT }, .unit = "aud" 
> },
> +    { "remove", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = REMOVE }, .unit = "aud" 
> },
> +
> +    { "sample_aspect_ratio", "Set sample aspect ratio (table E-1)",
> +        OFFSET(sample_aspect_ratio), AV_OPT_TYPE_RATIONAL,
> +        { .i64 = 0 }, 0, 65535 },
> +
> +    { "video_format", "Set video format (table E-2)",
> +        OFFSET(video_format), AV_OPT_TYPE_INT,
> +        { .i64 = -1 }, -1, 7 },
> +    { "video_full_range_flag", "Set video full range flag",
> +        OFFSET(video_full_range_flag), AV_OPT_TYPE_INT,
> +        { .i64 = -1 }, -1, 1 },
> +    { "colour_primaries", "Set colour primaries (table E-3)",
> +        OFFSET(colour_primaries), AV_OPT_TYPE_INT,
> +        { .i64 = -1 }, -1, 255 },
> +    { "transfer_characteristics", "Set transfer characteristics (table E-4)",
> +        OFFSET(transfer_characteristics), AV_OPT_TYPE_INT,
> +        { .i64 = -1 }, -1, 255 },
> +    { "matrix_coefficients", "Set matrix coefficients (table E-5)",
> +        OFFSET(matrix_coefficients), AV_OPT_TYPE_INT,
> +        { .i64 = -1 }, -1, 255 },
> +
> +    { "chroma_sample_loc_type", "Set chroma sample location type (figure 
> E-1)",
> +        OFFSET(chroma_sample_loc_type), AV_OPT_TYPE_INT,
> +        { .i64 = -1 }, -1, 6 },
> +
> +    { "frame_rate", "Set VUI frame rate (num_units_in_tick / time_scale)",
> +        OFFSET(frame_rate), AV_OPT_TYPE_RATIONAL,
> +        { .i64 = 0 }, 0, UINT_MAX },
> +    { "fixed_frame_rate_flag", "Set VUI fixed frame rate flag",
> +        OFFSET(fixed_frame_rate_flag), AV_OPT_TYPE_INT,
> +        { .i64 = -1 }, -1, 1 },
> +
> +    { "sei_user_data", "Insert SEI user data (UUID+string)",
> +        OFFSET(sei_user_data), AV_OPT_TYPE_STRING, { .str = NULL } },
> +
> +    { NULL }
> +};
> +
> +static const AVClass h264_metadata_class = {
> +    .class_name = "h264_metadata_bsf",
> +    .item_name  = av_default_item_name,
> +    .option     = h264_metadata_options,
> +    .version    = LIBAVCODEC_VERSION_MAJOR,
> +};
> +
> +static const enum AVCodecID h264_metadata_codec_ids[] = {
> +    AV_CODEC_ID_H264, AV_CODEC_ID_NONE,
> +};
> +
> +const AVBitStreamFilter ff_h264_metadata_bsf = {
> +    .name           = "h264_metadata",
> +    .priv_data_size = sizeof(H264MetadataContext),
> +    .priv_class     = &h264_metadata_class,
> +    .init           = &h264_metadata_init,
> +    .close          = &h264_metadata_close,
> +    .filter         = &h264_metadata_filter,
> +    .codec_ids      = h264_metadata_codec_ids,
> +};
> 
_______________________________________________
libav-devel mailing list
[email protected]
https://lists.libav.org/mailman/listinfo/libav-devel

Reply via email to