doxygen/5.0/libaomdec_8c_source.html

/*

 * Copyright (c) 2010, Google, Inc.

 *

 * This file is part of FFmpeg.

 *

 * FFmpeg is free software; you can redistribute it and/or

 * modify it under the terms of the GNU Lesser General Public

 * License as published by the Free Software Foundation; either

 * version 2.1 of the License, or (at your option) any later version.

 *

 * FFmpeg is distributed in the hope that it will be useful,

 * but WITHOUT ANY WARRANTY; without even the implied warranty of

 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU

 * Lesser General Public License for more details.

 *

 * You should have received a copy of the GNU Lesser General Public

 * License along with FFmpeg; if not, write to the Free Software

 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA

 */


/**

 * @file

 * AV1 decoder support via libaom

 */


#include <aom/aom_decoder.h>

#include <aom/aomdx.h>


#include "libavutil/common.h"

#include "libavutil/cpu.h"

#include "libavutil/imgutils.h"


#include "avcodec.h"

#include "internal.h"

#include "profiles.h"


typedef struct AV1DecodeContext {

    struct aom_codec_ctx decoder;

} AV1DecodeContext;


static av_cold int aom_init(AVCodecContext *avctx,

                            const struct aom_codec_iface *iface)

{

    AV1DecodeContext *ctx           = avctx->priv_data;

    struct aom_codec_dec_cfg deccfg = {

        .threads = FFMIN(avctx->thread_count ? avctx->thread_count : av_cpu_count(), 16)

    };


    av_log(avctx, AV_LOG_INFO, "%s\n", aom_codec_version_str());

    av_log(avctx, AV_LOG_VERBOSE, "%s\n", aom_codec_build_config());


    if (aom_codec_dec_init(&ctx->decoder, iface, &deccfg, 0) != AOM_CODEC_OK) {

        const char *error = aom_codec_error(&ctx->decoder);

        av_log(avctx, AV_LOG_ERROR, "Failed to initialize decoder: %s\n",

               error);

        return AVERROR(EINVAL);

    }


    return 0;

}


static void image_copy_16_to_8(AVFrame *pic, struct aom_image *img)

{

    const AVPixFmtDescriptor *desc = av_pix_fmt_desc_get(pic->format);

    int i;


    for (i = 0; i < desc->nb_components; i++) {

        int w = img->d_w;

        int h = img->d_h;

        int x, y;


        if (i) {

            w = (w + img->x_chroma_shift) >> img->x_chroma_shift;

            h = (h + img->y_chroma_shift) >> img->y_chroma_shift;

        }


        for (y = 0; y < h; y++) {

            uint16_t *src = (uint16_t *)(img->planes[i] + y * img->stride[i]);

            uint8_t *dst = pic->data[i] + y * pic->linesize[i];

            for (x = 0; x < w; x++)

                *dst++ = *src++;

        }

    }

}


// returns 0 on success, AVERROR_INVALIDDATA otherwise

static int set_pix_fmt(AVCodecContext *avctx, struct aom_image *img)

{

    static const enum AVColorRange color_ranges[] = {

        AVCOL_RANGE_MPEG, AVCOL_RANGE_JPEG

    };

    avctx->color_range = color_ranges[img->range];

    avctx->color_primaries = img->cp;

    avctx->colorspace  = img->mc;

    avctx->color_trc   = img->tc;


    switch (img->fmt) {

    case AOM_IMG_FMT_I420:

    case AOM_IMG_FMT_I42016:

        if (img->bit_depth == 8) {

            avctx->pix_fmt = img->monochrome ?

                             AV_PIX_FMT_GRAY8 : AV_PIX_FMT_YUV420P;

            avctx->profile = FF_PROFILE_AV1_MAIN;

            return 0;

        } else if (img->bit_depth == 10) {

            avctx->pix_fmt = img->monochrome ?

                             AV_PIX_FMT_GRAY10 : AV_PIX_FMT_YUV420P10;

            avctx->profile = FF_PROFILE_AV1_MAIN;

            return 0;

        } else if (img->bit_depth == 12) {

            avctx->pix_fmt = img->monochrome ?

                             AV_PIX_FMT_GRAY12 : AV_PIX_FMT_YUV420P12;

            avctx->profile = FF_PROFILE_AV1_PROFESSIONAL;

            return 0;

        } else {

            return AVERROR_INVALIDDATA;

        }

    case AOM_IMG_FMT_I422:

    case AOM_IMG_FMT_I42216:

        if (img->bit_depth == 8) {

            avctx->pix_fmt = AV_PIX_FMT_YUV422P;

            avctx->profile = FF_PROFILE_AV1_PROFESSIONAL;

            return 0;

        } else if (img->bit_depth == 10) {

            avctx->pix_fmt = AV_PIX_FMT_YUV422P10;

            avctx->profile = FF_PROFILE_AV1_PROFESSIONAL;

            return 0;

        } else if (img->bit_depth == 12) {

            avctx->pix_fmt = AV_PIX_FMT_YUV422P12;

            avctx->profile = FF_PROFILE_AV1_PROFESSIONAL;

            return 0;

        } else {

            return AVERROR_INVALIDDATA;

        }

    case AOM_IMG_FMT_I444:

    case AOM_IMG_FMT_I44416:

        if (img->bit_depth == 8) {

            avctx->pix_fmt = AV_PIX_FMT_YUV444P;

            avctx->profile = FF_PROFILE_AV1_HIGH;

            return 0;

        } else if (img->bit_depth == 10) {

            avctx->pix_fmt = AV_PIX_FMT_YUV444P10;

            avctx->profile = FF_PROFILE_AV1_HIGH;

            return 0;

        } else if (img->bit_depth == 12) {

            avctx->pix_fmt = AV_PIX_FMT_YUV444P12;

            avctx->profile = FF_PROFILE_AV1_PROFESSIONAL;

            return 0;

        } else {

            return AVERROR_INVALIDDATA;

        }


    default:

        return AVERROR_INVALIDDATA;

    }

}


static int aom_decode(AVCodecContext *avctx, void *data, int *got_frame,

                      AVPacket *avpkt)

{

    AV1DecodeContext *ctx = avctx->priv_data;

    AVFrame *picture      = data;

    const void *iter      = NULL;

    struct aom_image *img;

    int ret;


    if (aom_codec_decode(&ctx->decoder, avpkt->data, avpkt->size, NULL) !=

        AOM_CODEC_OK) {

        const char *error  = aom_codec_error(&ctx->decoder);

        const char *detail = aom_codec_error_detail(&ctx->decoder);


        av_log(avctx, AV_LOG_ERROR, "Failed to decode frame: %s\n", error);

        if (detail)

            av_log(avctx, AV_LOG_ERROR, "  Additional information: %s\n",

                   detail);

        return AVERROR_INVALIDDATA;

    }


    if ((img = aom_codec_get_frame(&ctx->decoder, &iter))) {

        if (img->d_w > img->w || img->d_h > img->h) {

            av_log(avctx, AV_LOG_ERROR, "Display dimensions %dx%d exceed storage %dx%d\n",

                   img->d_w, img->d_h, img->w, img->h);

            return AVERROR_EXTERNAL;

        }


        if ((ret = set_pix_fmt(avctx, img)) < 0) {

            av_log(avctx, AV_LOG_ERROR, "Unsupported output colorspace (%d) / bit_depth (%d)\n",

                   img->fmt, img->bit_depth);

            return ret;

        }


        if ((int)img->d_w != avctx->width || (int)img->d_h != avctx->height) {

            av_log(avctx, AV_LOG_INFO, "dimension change! %dx%d -> %dx%d\n",

                   avctx->width, avctx->height, img->d_w, img->d_h);

            ret = ff_set_dimensions(avctx, img->d_w, img->d_h);

            if (ret < 0)

                return ret;

        }

        if ((ret = ff_get_buffer(avctx, picture, 0)) < 0)

            return ret;


#ifdef AOM_CTRL_AOMD_GET_FRAME_FLAGS

        {

            aom_codec_frame_flags_t flags;

            ret = aom_codec_control(&ctx->decoder, AOMD_GET_FRAME_FLAGS, &flags);

            if (ret == AOM_CODEC_OK) {

                picture->key_frame = !!(flags & AOM_FRAME_IS_KEY);

                if (flags & (AOM_FRAME_IS_KEY | AOM_FRAME_IS_INTRAONLY))

                    picture->pict_type = AV_PICTURE_TYPE_I;

                else if (flags & AOM_FRAME_IS_SWITCH)

                    picture->pict_type = AV_PICTURE_TYPE_SP;

                else

                    picture->pict_type = AV_PICTURE_TYPE_P;

            }

        }

#endif


        av_reduce(&picture->sample_aspect_ratio.num,

                  &picture->sample_aspect_ratio.den,

                  picture->height * img->r_w,

                  picture->width * img->r_h,

                  INT_MAX);

        ff_set_sar(avctx, picture->sample_aspect_ratio);


        if ((img->fmt & AOM_IMG_FMT_HIGHBITDEPTH) && img->bit_depth == 8)

            image_copy_16_to_8(picture, img);

        else {

            const uint8_t *planes[4] = { img->planes[0], img->planes[1], img->planes[2] };

            const int      stride[4] = { img->stride[0], img->stride[1], img->stride[2] };


            av_image_copy(picture->data, picture->linesize, planes,

                          stride, avctx->pix_fmt, img->d_w, img->d_h);

        }

        *got_frame = 1;

    }

    return avpkt->size;

}


static av_cold int aom_free(AVCodecContext *avctx)

{

    AV1DecodeContext *ctx = avctx->priv_data;

    aom_codec_destroy(&ctx->decoder);

    return 0;

}


static av_cold int av1_init(AVCodecContext *avctx)

{

    return aom_init(avctx, aom_codec_av1_dx());

}


const AVCodec ff_libaom_av1_decoder = {

    .name           = "libaom-av1",

    .long_name      = NULL_IF_CONFIG_SMALL("libaom AV1"),

    .type           = AVMEDIA_TYPE_VIDEO,

    .id             = AV_CODEC_ID_AV1,

    .priv_data_size = sizeof(AV1DecodeContext),

    .init           = av1_init,

    .close          = aom_free,

    .decode         = aom_decode,

    .capabilities   = AV_CODEC_CAP_OTHER_THREADS | AV_CODEC_CAP_DR1,

    .caps_internal  = FF_CODEC_CAP_AUTO_THREADS,

    .profiles       = NULL_IF_CONFIG_SMALL(ff_av1_profiles),

    .wrapper_name   = "libaom",

};