doxygen/3.1/idctdsp__alpha_8c_source.html

 /*

  * Copyright (c) 2002 Falk Hueffner <falk@debian.org>

  *

  * This file is part of FFmpeg.

  *

  * FFmpeg is free software; you can redistribute it and/or

  * modify it under the terms of the GNU Lesser General Public

  * License as published by the Free Software Foundation; either

  * version 2.1 of the License, or (at your option) any later version.

  *

  * FFmpeg is distributed in the hope that it will be useful,

  * but WITHOUT ANY WARRANTY; without even the implied warranty of

  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU

  * Lesser General Public License for more details.

  *

  * You should have received a copy of the GNU Lesser General Public

  * License along with FFmpeg; if not, write to the Free Software

  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA

  */


 #include "libavutil/attributes.h"

 #include "libavcodec/idctdsp.h"

 #include "idctdsp_alpha.h"

 #include "asm.h"


 /* Prototypes for the MVI put/add "pixels clamped" routines.  They are not

    defined in this file (going by the _asm suffix they are presumably the

    hand-written assembler versions -- confirm against the build).

    ff_idctdsp_init_alpha() installs them into the IDCTDSPContext when

    amask(AMASK_MVI) == 0.  */

 void put_pixels_clamped_mvi_asm(const int16_t *block, uint8_t *pixels,

                                 ptrdiff_t line_size);

 void add_pixels_clamped_mvi_asm(const int16_t *block, uint8_t *pixels,

                                 ptrdiff_t line_size);


 /* File-scope (external linkage) function pointers.  ff_idctdsp_init_alpha()

    sets them to whatever c->put_pixels_clamped / c->add_pixels_clamped hold

    after the MVI check.  Their readers are not visible in this file

    (presumably the Alpha simple IDCT put/add routines -- TODO confirm).

    NOTE(review): being plain globals, they are overwritten by every call to

    ff_idctdsp_init_alpha().  */

 void (*put_pixels_clamped_axp_p)(const int16_t *block, uint8_t *pixels,

                                  ptrdiff_t line_size);

 void (*add_pixels_clamped_axp_p)(const int16_t *block, uint8_t *pixels,

                                  ptrdiff_t line_size);


 #if 0

 /* These functions were the base for the optimized assembler routines,

    and remain here for documentation purposes.  */

 /**
  * Reference C version of the "put pixels clamped" routine (compiled out;
  * kept as documentation for the assembler implementation).
  *
  * Processes 8 rows.  For each row, two 64-bit loads fetch 8 int16_t
  * coefficients from block; each group of four is clamped with
  * maxsw4(.., 0) / minsw4(.., 0x00ff00ff00ff00ff), packed with pkwb() and
  * stored with stl() to pixels and pixels + 4.
  *
  * @param block     source coefficients, 8 consumed per row
  * @param pixels    destination, 8 bytes written per row
  * @param line_size distance in bytes between consecutive destination rows
  */
 static void put_pixels_clamped_mvi(const int16_t *block, uint8_t *pixels,
                                    ptrdiff_t line_size)
 {
     const uint64_t byte_max = zap(-1, 0xaa); /* 0x00ff00ff00ff00ff */
     int rows_left;

     for (rows_left = 8; rows_left != 0; rows_left--) {
         uint64_t quad;

         /* Left four coefficients of the row. */
         quad = ldq(block);
         quad = maxsw4(quad, 0);
         quad = minsw4(quad, byte_max);
         stl(pkwb(quad), pixels);

         /* Right four coefficients of the row. */
         quad = ldq(block + 4);
         quad = maxsw4(quad, 0);
         quad = minsw4(quad, byte_max);
         stl(pkwb(quad), pixels + 4);

         /* Advance to the next output row and the next 8 coefficients. */
         block  += 8;
         pixels += line_size;
     }
 }


 /**
  * Reference C version of the "add pixels clamped" routine (compiled out;
  * kept as documentation for the assembler implementation).
  *
  * Processes 8 rows.  For each row, 8 int16_t coefficients from block are
  * added to the 8 existing bytes at pixels (widened with unpkbw()), the
  * sums are clamped with maxsw4(.., 0) / minsw4(.., 0x00ff00ff00ff00ff),
  * packed with pkwb() and written back over the same 8 bytes.
  *
  * @param block     source coefficients, 8 consumed per row
  * @param pixels    buffer that is both read and overwritten, 8 bytes per row
  * @param line_size distance in bytes between consecutive rows of pixels
  */
 void add_pixels_clamped_mvi(const int16_t *block, uint8_t *pixels,
                             ptrdiff_t line_size)
 {
     /* The constants are built by hand so that this stays a leaf function
        (mainly for the hack value ;-).  */
     const uint64_t byte_max = zap(-1, 0xaa); /* 0x00ff00ff00ff00ff */
     uint64_t sign_bits      = zap(-1, 0x33); /* 0xffff0000ffff0000 */
     int rows_left;

     sign_bits ^= sign_bits >> 1;             /* 0x8000800080008000 */

     for (rows_left = 8; rows_left != 0; rows_left--) {
         uint64_t coef_lo = ldq(block);
         uint64_t coef_hi = ldq(block + 4);
         uint64_t px_lo, px_hi;
         uint64_t sign_lo, sign_hi;

         /* Left half: signed subword add (MMX paddw).  The top bit of each
            16-bit lane is masked off before the 64-bit add and XORed back
            in afterwards, so a carry never crosses into the next lane.  */
         px_lo   = unpkbw(ldl(pixels));
         sign_lo = coef_lo & sign_bits;
         coef_lo = ((coef_lo & ~sign_bits) + px_lo) ^ sign_lo;
         /* Clamp. */
         coef_lo = minsw4(maxsw4(coef_lo, 0), byte_max);

         /* Right half: same sequence on the next four lanes. */
         px_hi   = unpkbw(ldl(pixels + 4));
         sign_hi = coef_hi & sign_bits;
         coef_hi = ((coef_hi & ~sign_bits) + px_hi) ^ sign_hi;
         coef_hi = minsw4(maxsw4(coef_hi, 0), byte_max);

         /* Both halves are stored only after both have been read. */
         stl(pkwb(coef_lo), pixels);
         stl(pkwb(coef_hi), pixels + 4);

         block  += 8;
         pixels += line_size;
     }
 }

 #endif


 /**
  * Install the Alpha-specific IDCT DSP routines into an IDCTDSPContext.
  *
  * - If amask(AMASK_MVI) reports MVI as present, the put/add pixels-clamped
  *   slots are pointed at the MVI routines.
  * - The global put_pixels_clamped_axp_p / add_pixels_clamped_axp_p pointers
  *   are then set to whatever those two slots currently hold.
  * - Unless high_bit_depth or avctx->lowres is non-zero, and provided
  *   avctx->idct_algo is FF_IDCT_AUTO or FF_IDCT_SIMPLEALPHA, the
  *   idct / idct_put / idct_add slots are set to the ff_simple_idct*_axp
  *   functions.
  *
  * @param c              context whose function pointers are updated
  * @param avctx          codec context; lowres and idct_algo are read
  * @param high_bit_depth non-zero disables the simple IDCT override
  */
 av_cold void ff_idctdsp_init_alpha(IDCTDSPContext *c, AVCodecContext *avctx,
                                    unsigned high_bit_depth)
 {
     /* amask clears all bits that correspond to present features, so a
        zero result means MVI is available.  */
     if (!amask(AMASK_MVI)) {
         c->add_pixels_clamped = add_pixels_clamped_mvi_asm;
         c->put_pixels_clamped = put_pixels_clamped_mvi_asm;
     }

     /* Publish the selected clamping routines through the file-scope
        pointers; this happens whether or not the MVI branch was taken.  */
     add_pixels_clamped_axp_p = c->add_pixels_clamped;
     put_pixels_clamped_axp_p = c->put_pixels_clamped;

     /* The simple IDCT override is skipped for high bit depth or lowres. */
     if (high_bit_depth || avctx->lowres) {
         return;
     }

     /* It is also skipped when a different IDCT algorithm was requested. */
     if (avctx->idct_algo != FF_IDCT_AUTO &&
         avctx->idct_algo != FF_IDCT_SIMPLEALPHA) {
         return;
     }

     c->idct     = ff_simple_idct_axp;
     c->idct_put = ff_simple_idct_put_axp;
     c->idct_add = ff_simple_idct_add_axp;
 }

ff_simple_idct_add_axp
void ff_simple_idct_add_axp(uint8_t *dest, int line_size, int16_t *block)
Definition: simple_idct_alpha.c:299

h
h
Definition: vp9dsp_template.c:2093

minsw4
#define minsw4(a, b)
Definition: asm.h:137

maxsw4
#define maxsw4(a, b)
Definition: asm.h:141

FF_IDCT_SIMPLEALPHA
#define FF_IDCT_SIMPLEALPHA
Definition: avcodec.h:3033

idctdsp_alpha.h

ldq
#define ldq(p)
Definition: asm.h:59

attributes.h
Macro definitions for various function/variable attributes.

block
static int16_t block[64]
Definition: dct.c:113

uint8_t
uint8_t
Definition: audio_convert.c:194

av_cold
#define av_cold
Definition: attributes.h:82

ff_simple_idct_axp
void ff_simple_idct_axp(int16_t *block)
Definition: simple_idct_alpha.c:253

IDCTDSPContext::put_pixels_clamped
void(* put_pixels_clamped)(const int16_t *block, uint8_t *pixels, ptrdiff_t line_size)
Definition: idctdsp.h:53

pkwb
#define pkwb(a)
Definition: asm.h:144

AVCodecContext::lowres
int lowres
low resolution decoding, 1-> 1/2 size, 2->1/4 size
Definition: avcodec.h:3059

AMASK_MVI
#define AMASK_MVI
Definition: asm.h:40

FF_IDCT_AUTO
#define FF_IDCT_AUTO
Definition: avcodec.h:3008

amask
#define amask
Definition: asm.h:99

put_pixels_clamped_axp_p
void(* put_pixels_clamped_axp_p)(const int16_t *block, uint8_t *pixels, ptrdiff_t line_size)
Definition: idctdsp_alpha.c:31

idctdsp.h

IDCTDSPContext::add_pixels_clamped
void(* add_pixels_clamped)(const int16_t *block, uint8_t *pixels, ptrdiff_t line_size)
Definition: idctdsp.h:59

add_pixels_clamped_mvi_asm
void add_pixels_clamped_mvi_asm(const int16_t *block, uint8_t *pixels, ptrdiff_t line_size)

ff_idctdsp_init_alpha
av_cold void ff_idctdsp_init_alpha(IDCTDSPContext *c, AVCodecContext *avctx, unsigned high_bit_depth)
Definition: idctdsp_alpha.c:108

stl
#define stl(l, p)
Definition: asm.h:76

AVCodecContext::idct_algo
int idct_algo
IDCT algorithm, see FF_IDCT_* below.
Definition: avcodec.h:3007

void
typedef void(APIENTRY *FF_PFNGLACTIVETEXTUREPROC)(GLenum texture)

put_pixels_clamped_mvi_asm
void put_pixels_clamped_mvi_asm(const int16_t *block, uint8_t *pixels, ptrdiff_t line_size)

IDCTDSPContext::idct_add
void(* idct_add)(uint8_t *dest, int line_size, int16_t *block)
block -> idct -> add dest -> clip to unsigned 8 bit -> dest.
Definition: idctdsp.h:77

IDCTDSPContext::idct_put
void(* idct_put)(uint8_t *dest, int line_size, int16_t *block)
block -> idct -> clip to unsigned 8 bit -> dest.
Definition: idctdsp.h:70

AVCodecContext
main external API structure.
Definition: avcodec.h:1649

zap
#define zap
Definition: asm.h:97

IDCTDSPContext
Definition: idctdsp.h:51

c
static double c[64]
Definition: vsrc_mptestsrc.c:87

unpkbw
#define unpkbw(a)
Definition: asm.h:146

pixels
int pixels
Definition: avisynth_c.h:298

ldl
#define ldl(p)
Definition: asm.h:64

ff_simple_idct_put_axp
void ff_simple_idct_put_axp(uint8_t *dest, int line_size, int16_t *block)
Definition: simple_idct_alpha.c:293

asm.h

add_pixels_clamped_axp_p
void(* add_pixels_clamped_axp_p)(const int16_t *block, uint8_t *pixels, ptrdiff_t line_size)
Definition: idctdsp_alpha.c:33

IDCTDSPContext::idct
void(* idct)(int16_t *block)
Definition: idctdsp.h:63