doxygen/3.4/msvideo1enc_8c_source.html

 /*

  * Microsoft Video-1 Encoder

  * Copyright (c) 2009 Konstantin Shishkov

  *

  * This file is part of FFmpeg.

  *

  * FFmpeg is free software; you can redistribute it and/or

  * modify it under the terms of the GNU Lesser General Public

  * License as published by the Free Software Foundation; either

  * version 2.1 of the License, or (at your option) any later version.

  *

  * FFmpeg is distributed in the hope that it will be useful,

  * but WITHOUT ANY WARRANTY; without even the implied warranty of

  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU

  * Lesser General Public License for more details.

  *

  * You should have received a copy of the GNU Lesser General Public

  * License along with FFmpeg; if not, write to the Free Software

  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA

  */


 /**

  * @file

  * Microsoft Video-1 encoder

  */


 #include "avcodec.h"

 #include "internal.h"

 #include "bytestream.h"

 #include "libavutil/lfg.h"

 #include "elbg.h"

 #include "libavutil/imgutils.h"

 /**

  * Encoder context

  */

 typedef struct Msvideo1EncContext {

     AVCodecContext *avctx;

     AVLFG rnd;

     uint8_t *prev;


     int block[16*3];

     int block2[16*3];

     int codebook[8*3];

     int codebook2[8*3];

     int output[16*3];

     int output2[16*3];

     int avg[3];

     int bestpos;

     int keyint;

 } Msvideo1EncContext;


 enum MSV1Mode{

     MODE_SKIP = 0,

     MODE_FILL,

     MODE_2COL,

     MODE_8COL,

 };


 #define SKIP_PREFIX 0x8400

 #define SKIPS_MAX 0x03FF

 #define MKRGB555(in, off) (((in)[off] << 10) | ((in)[(off) + 1] << 5) | ((in)[(off) + 2]))


 static const int remap[16] = { 0, 1, 4, 5, 2, 3, 6, 7, 8, 9, 12, 13, 10, 11, 14, 15 };


 static int encode_frame(AVCodecContext *avctx, AVPacket *pkt,

                                const AVFrame *pict, int *got_packet)

 {

     Msvideo1EncContext * const c = avctx->priv_data;

     const AVFrame *p = pict;

     uint16_t *src;

     uint8_t *prevptr;

     uint8_t *dst, *buf;

     int keyframe = 0;

     int no_skips = 1;

     int i, j, k, x, y, ret;

     int skips = 0;

     int quality = 24;


     if ((ret = ff_alloc_packet2(avctx, pkt, avctx->width*avctx->height*9 + AV_INPUT_BUFFER_MIN_SIZE, 0)) < 0)

         return ret;

     dst= buf= pkt->data;


     if(!c->prev)

         c->prev = av_malloc(avctx->width * 3 * (avctx->height + 3));

     prevptr = c->prev + avctx->width * 3 * (FFALIGN(avctx->height, 4) - 1);

     src = (uint16_t*)(p->data[0] + p->linesize[0]*(FFALIGN(avctx->height, 4) - 1));

     if(c->keyint >= avctx->keyint_min)

         keyframe = 1;


     for(y = 0; y < avctx->height; y += 4){

         for(x = 0; x < avctx->width; x += 4){

             int bestmode = MODE_SKIP;

             int bestscore = INT_MAX;

             int flags = 0;

             int score;


             for(j = 0; j < 4; j++){

                 for(i = 0; i < 4; i++){

                     uint16_t val = src[x + i - j*p->linesize[0]/2];

                     for(k = 0; k < 3; k++){

                         c->block[(i + j*4)*3 + k] =

                         c->block2[remap[i + j*4]*3 + k] = (val >> (10-k*5)) & 0x1F;

                     }

                 }

             }

             if(!keyframe){

                 bestscore = 0;

                 for(j = 0; j < 4; j++){

                     for(i = 0; i < 4*3; i++){

                         int t = prevptr[x*3 + i - j*3*avctx->width] - c->block[i + j*4*3];

                         bestscore += t*t;

                     }

                 }

                 bestscore /= quality;

             }

             // try to find optimal value to fill whole 4x4 block

             score = 0;

             avpriv_init_elbg(c->block, 3, 16, c->avg, 1, 1, c->output, &c->rnd);

             avpriv_do_elbg  (c->block, 3, 16, c->avg, 1, 1, c->output, &c->rnd);

             if(c->avg[0] == 1) // red component = 1 will be written as skip code

                 c->avg[0] = 0;

             for(j = 0; j < 4; j++){

                 for(i = 0; i < 4; i++){

                     for(k = 0; k < 3; k++){

                         int t = c->avg[k] - c->block[(i+j*4)*3+k];

                         score += t*t;

                     }

                 }

             }

             score /= quality;

             score += 2;

             if(score < bestscore){

                 bestscore = score;

                 bestmode = MODE_FILL;

             }

             // search for optimal filling of 2-color block

             score = 0;

             avpriv_init_elbg(c->block, 3, 16, c->codebook, 2, 1, c->output, &c->rnd);

             avpriv_do_elbg  (c->block, 3, 16, c->codebook, 2, 1, c->output, &c->rnd);

             // last output value should be always 1, swap codebooks if needed

             if(!c->output[15]){

                 for(i = 0; i < 3; i++)

                     FFSWAP(uint8_t, c->codebook[i], c->codebook[i+3]);

                 for(i = 0; i < 16; i++)

                     c->output[i] ^= 1;

             }

             for(j = 0; j < 4; j++){

                 for(i = 0; i < 4; i++){

                     for(k = 0; k < 3; k++){

                         int t = c->codebook[c->output[i+j*4]*3 + k] - c->block[i*3+k+j*4*3];

                         score += t*t;

                     }

                 }

             }

             score /= quality;

             score += 6;

             if(score < bestscore){

                 bestscore = score;

                 bestmode = MODE_2COL;

             }

             // search for optimal filling of 2-color 2x2 subblocks

             score = 0;

             for(i = 0; i < 4; i++){

                 avpriv_init_elbg(c->block2 + i*4*3, 3, 4, c->codebook2 + i*2*3, 2, 1, c->output2 + i*4, &c->rnd);

                 avpriv_do_elbg  (c->block2 + i*4*3, 3, 4, c->codebook2 + i*2*3, 2, 1, c->output2 + i*4, &c->rnd);

             }

             // last value should be always 1, swap codebooks if needed

             if(!c->output2[15]){

                 for(i = 0; i < 3; i++)

                     FFSWAP(uint8_t, c->codebook2[i+18], c->codebook2[i+21]);

                 for(i = 12; i < 16; i++)

                     c->output2[i] ^= 1;

             }

             for(j = 0; j < 4; j++){

                 for(i = 0; i < 4; i++){

                     for(k = 0; k < 3; k++){

                         int t = c->codebook2[(c->output2[remap[i+j*4]] + (i&2) + (j&2)*2)*3+k] - c->block[i*3+k + j*4*3];

                         score += t*t;

                     }

                 }

             }

             score /= quality;

             score += 18;

             if(score < bestscore){

                 bestscore = score;

                 bestmode = MODE_8COL;

             }


             if(bestmode == MODE_SKIP){

                 skips++;

                 no_skips = 0;

             }

             if((bestmode != MODE_SKIP && skips) || skips == SKIPS_MAX){

                 bytestream_put_le16(&dst, skips | SKIP_PREFIX);

                 skips = 0;

             }


             switch(bestmode){

             case MODE_FILL:

                 bytestream_put_le16(&dst, MKRGB555(c->avg,0) | 0x8000);

                 for(j = 0; j < 4; j++)

                     for(i = 0; i < 4; i++)

                         for(k = 0; k < 3; k++)

                             prevptr[x*3 + i*3 + k - j*3*avctx->width] = c->avg[k];

                 break;

             case MODE_2COL:

                 for(j = 0; j < 4; j++){

                     for(i = 0; i < 4; i++){

                         flags |= (c->output[i + j*4]^1) << (i + j*4);

                         for(k = 0; k < 3; k++)

                             prevptr[x*3 + i*3 + k - j*3*avctx->width] = c->codebook[c->output[i + j*4]*3 + k];

                     }

                 }

                 bytestream_put_le16(&dst, flags);

                 bytestream_put_le16(&dst, MKRGB555(c->codebook, 0));

                 bytestream_put_le16(&dst, MKRGB555(c->codebook, 3));

                 break;

             case MODE_8COL:

                 for(j = 0; j < 4; j++){

                     for(i = 0; i < 4; i++){

                         flags |= (c->output2[remap[i + j*4]]^1) << (i + j*4);

                         for(k = 0; k < 3; k++)

                             prevptr[x*3 + i*3 + k - j*3*avctx->width] = c->codebook2[(c->output2[remap[i+j*4]] + (i&2) + (j&2)*2)*3 + k];

                     }

                 }

                 bytestream_put_le16(&dst, flags);

                 bytestream_put_le16(&dst, MKRGB555(c->codebook2, 0) | 0x8000);

                 for(i = 3; i < 24; i += 3)

                     bytestream_put_le16(&dst, MKRGB555(c->codebook2, i));

                 break;

             }

         }

         src     -= p->linesize[0] << 1;

         prevptr -= avctx->width * 3 * 4;

     }

     if(skips)

         bytestream_put_le16(&dst, skips | SKIP_PREFIX);

     //EOF

     bytestream_put_byte(&dst, 0);

     bytestream_put_byte(&dst, 0);


     if(no_skips)

         keyframe = 1;

     if(keyframe)

         c->keyint = 0;

     else

         c->keyint++;

     if (keyframe) pkt->flags |= AV_PKT_FLAG_KEY;

     pkt->size = dst - buf;

     *got_packet = 1;


     return 0;

 }


 /**

  * init encoder

  */

 static av_cold int encode_init(AVCodecContext *avctx)

 {

     Msvideo1EncContext * const c = avctx->priv_data;


     c->avctx = avctx;

     if (av_image_check_size(avctx->width, avctx->height, 0, avctx) < 0) {

         return -1;

     }

     if((avctx->width&3) || (avctx->height&3)){

         av_log(avctx, AV_LOG_ERROR, "width and height must be multiples of 4\n");

         return -1;

     }


     avctx->bits_per_coded_sample = 16;


     c->keyint = avctx->keyint_min;

     av_lfg_init(&c->rnd, 1);


     return 0;

 }


 /**

  * Uninit encoder

  */

 static av_cold int encode_end(AVCodecContext *avctx)

 {

     Msvideo1EncContext * const c = avctx->priv_data;


     av_freep(&c->prev);


     return 0;

 }


 AVCodec ff_msvideo1_encoder = {

     .name           = "msvideo1",

     .long_name = NULL_IF_CONFIG_SMALL("Microsoft Video-1"),

     .type           = AVMEDIA_TYPE_VIDEO,

     .id             = AV_CODEC_ID_MSVIDEO1,

     .priv_data_size = sizeof(Msvideo1EncContext),

     .init           = encode_init,

     .encode2        = encode_frame,

     .close          = encode_end,

     .pix_fmts = (const enum AVPixelFormat[]){AV_PIX_FMT_RGB555, AV_PIX_FMT_NONE},

 };

encode_init
static av_cold int encode_init(AVCodecContext *avctx)
init encoder
Definition: msvideo1enc.c:260

AVLFG
Definition: lfg.h:27

MODE_2COL
Definition: msvideo1enc.c:55

val
const char const char void * val
Definition: avisynth_c.h:771

AVFrame
This structure describes decoded (raw) audio or video data.
Definition: frame.h:201

AV_PIX_FMT_NONE
Definition: pixfmt.h:61

imgutils.h
misc image utilities

Msvideo1EncContext::output2
int output2[16 *3]
Definition: msvideo1enc.c:46

init
static av_cold int init(AVCodecContext *avctx)
Definition: avrndec.c:35

AVPacket::size
int size
Definition: avcodec.h:1680

pkt
static AVPacket pkt
Definition: demuxing_decoding.c:54

src
#define src
Definition: vp8dsp.c:254

AVCodec
AVCodec.
Definition: avcodec.h:3739

AV_CODEC_ID_MSVIDEO1
Definition: avcodec.h:266

ff_alloc_packet2
int ff_alloc_packet2(AVCodecContext *avctx, AVPacket *avpkt, int64_t size, int64_t min_size)
Check AVPacket size and/or allocate data.
Definition: encode.c:32

uint8_t
uint8_t
Definition: audio_convert.c:194

av_cold
#define av_cold
Definition: attributes.h:82

av_malloc
#define av_malloc(s)
Definition: tableprint_vlc.h:31

Msvideo1EncContext::keyint
int keyint
Definition: msvideo1enc.c:49

avpriv_do_elbg
int avpriv_do_elbg(int *points, int dim, int numpoints, int *codebook, int numCB, int max_steps, int *closest_cb, AVLFG *rand_state)
Implementation of the Enhanced LBG Algorithm Based on the paper "Neural Networks 14:1219-1237" that c...
Definition: elbg.c:371

AVPacket::data
uint8_t * data
Definition: avcodec.h:1679

flags
static int flags
Definition: log.c:57

Msvideo1EncContext::output
int output[16 *3]
Definition: msvideo1enc.c:45

AVCodecContext::bits_per_coded_sample
int bits_per_coded_sample
bits per sample/pixel from the demuxer (needed for huffyuv).
Definition: avcodec.h:3157

AV_INPUT_BUFFER_MIN_SIZE
#define AV_INPUT_BUFFER_MIN_SIZE
minimum encoding buffer size Used to avoid some checks during header writing.
Definition: avcodec.h:784

FFALIGN
#define FFALIGN(x, a)
Definition: macros.h:48

av_log
#define av_log(a,...)
Definition: tableprint_vlc.h:28

MODE_SKIP
Definition: msvideo1enc.c:53

AV_PKT_FLAG_KEY
#define AV_PKT_FLAG_KEY
The packet contains a keyframe.
Definition: avcodec.h:1711

MODE_FILL
Definition: msvideo1enc.c:54

AV_LOG_ERROR
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
Definition: log.h:176

encode_frame
static int encode_frame(AVCodecContext *avctx, AVPacket *pkt, const AVFrame *pict, int *got_packet)
Definition: msvideo1enc.c:65

SKIP_PREFIX
#define SKIP_PREFIX
Definition: msvideo1enc.c:59

NULL_IF_CONFIG_SMALL
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification. ...
Definition: internal.h:179

AVCodec::name
const char * name
Name of the codec implementation.
Definition: avcodec.h:3746

Msvideo1EncContext::codebook
int codebook[8 *3]
Definition: msvideo1enc.c:43

Msvideo1EncContext::block2
int block2[16 *3]
Definition: msvideo1enc.c:42

bytestream.h

AVPacket::flags
int flags
A combination of AV_PKT_FLAG values.
Definition: avcodec.h:1685

av_image_check_size
int av_image_check_size(unsigned int w, unsigned int h, int log_offset, void *log_ctx)
Check if the given dimension of an image is valid, meaning that all bytes of the image can be address...
Definition: imgutils.c:281

AVCodecContext::width
int width
picture width / height.
Definition: avcodec.h:1948

MODE_8COL
Definition: msvideo1enc.c:56

lfg.h

AVCodecContext::height
int height
Definition: avcodec.h:1948

avpriv_init_elbg
int avpriv_init_elbg(int *points, int dim, int numpoints, int *codebook, int numCB, int max_steps, int *closest_cb, AVLFG *rand_state)
Initialize the **codebook vector for the elbg algorithm.
Definition: elbg.c:337

avcodec.h
Libavcodec external API header.

remap
static const int remap[16]
Definition: msvideo1enc.c:63

encode_end
static av_cold int encode_end(AVCodecContext *avctx)
Uninit encoder.
Definition: msvideo1enc.c:286

AVFrame::linesize
int linesize[AV_NUM_DATA_POINTERS]
For video, size in bytes of each picture line.
Definition: frame.h:232

Msvideo1EncContext::codebook2
int codebook2[8 *3]
Definition: msvideo1enc.c:44

AVCodecContext
main external API structure.
Definition: avcodec.h:1761

buf
void * buf
Definition: avisynth_c.h:690

MSV1Mode
MSV1Mode
Definition: msvideo1enc.c:52

ff_msvideo1_encoder
AVCodec ff_msvideo1_encoder
Definition: msvideo1enc.c:295

av_lfg_init
av_cold void av_lfg_init(AVLFG *c, unsigned int seed)
Definition: lfg.c:32

SKIPS_MAX
#define SKIPS_MAX
Definition: msvideo1enc.c:60

pix_fmts
static enum AVPixelFormat pix_fmts[]
Definition: libkvazaar.c:266

AVFrame::data
uint8_t * data[AV_NUM_DATA_POINTERS]
pointer to the picture/channel planes.
Definition: frame.h:215

Msvideo1EncContext::block
int block[16 *3]
Definition: msvideo1enc.c:41

internal.h
common internal api header.

Msvideo1EncContext::bestpos
int bestpos
Definition: msvideo1enc.c:48

c
static double c[64]
Definition: vsrc_mptestsrc.c:87

AV_PIX_FMT_RGB555
#define AV_PIX_FMT_RGB555
Definition: pixfmt.h:367

Msvideo1EncContext::rnd
AVLFG rnd
Definition: msvideo1enc.c:38

AVCodecContext::priv_data
void * priv_data
Definition: avcodec.h:1803

elbg.h

Msvideo1EncContext::avctx
AVCodecContext * avctx
Definition: msvideo1enc.c:37

Msvideo1EncContext
Encoder context.
Definition: msvideo1enc.c:36

Msvideo1EncContext::avg
int avg[3]
Definition: msvideo1enc.c:47

MKRGB555
#define MKRGB555(in, off)
Definition: msvideo1enc.c:61

av_freep
#define av_freep(p)
Definition: tableprint_vlc.h:35

AVMEDIA_TYPE_VIDEO
Definition: avutil.h:201

Msvideo1EncContext::prev
uint8_t * prev
Definition: msvideo1enc.c:39

FFSWAP
#define FFSWAP(type, a, b)
Definition: common.h:99

AVPixelFormat
AVPixelFormat
Pixel format.
Definition: pixfmt.h:60

AVPacket
This structure stores compressed data.
Definition: avcodec.h:1656

AVCodecContext::keyint_min
int keyint_min
minimum GOP size
Definition: avcodec.h:2435