~ubuntu-branches/ubuntu/jaunty/xvidcap/jaunty-proposed

« back to all changes in this revision

Viewing changes to ffmpeg/libavcodec/dct-test.c

Committer: Bazaar Package Importer
Author(s): Christian Marillat
Date: 2004-08-29 10:53:42 UTC
Revision ID: james.westby@ubuntu.com-20040829105342-qgmnry37eadfkoxx

Tags: upstream-1.1.3

Import upstream version 1.1.3

files added:

AUTHORS

COPYING

ChangeLog

INSTALL

Makefile.am

Makefile.in

NEWS

README

TODO

Xw/Base.c

Xw/Base.h

Xw/BaseP.h

Xw/Box.c

Xw/Box.h

Xw/BoxP.h

Xw/Button.c

Xw/Button.h

Xw/ButtonP.h

Xw/Field.c

Xw/Field.h

Xw/FieldP.h

Xw/Label.c

Xw/Label.h

Xw/LabelP.h

Xw/Makefile.am

Xw/Makefile.in

Xw/README

Xw/RootIcon.c

Xw/RootIcon.h

Xw/RootIconP.h

Xw/Toggle.c

Xw/Toggle.h

Xw/ToggleP.h

Xw/simple.c

Xw/testxw.c

Xw/testxw.xbm

aclocal.m4

compile

config.h.in

configure

configure.ac

depcomp

ffmpeg

ffmpeg/.nbattrs

ffmpeg/COPYING

ffmpeg/CREDITS

ffmpeg/Changelog

ffmpeg/INSTALL

ffmpeg/Makefile

ffmpeg/README

ffmpeg/berrno.h

ffmpeg/cmdutils.c

ffmpeg/cmdutils.h

ffmpeg/configure

ffmpeg/cygwin_inttypes.h

ffmpeg/doc

ffmpeg/doc/.nbattrs

ffmpeg/doc/Makefile

ffmpeg/doc/TODO

ffmpeg/doc/faq.html

ffmpeg/doc/faq.texi

ffmpeg/doc/ffmpeg-doc.html

ffmpeg/doc/ffmpeg-doc.texi

ffmpeg/doc/ffmpeg.1

ffmpeg/doc/ffmpeg_powerpc_performance_evaluation_howto.txt

ffmpeg/doc/ffplay-doc.html

ffmpeg/doc/ffplay-doc.texi

ffmpeg/doc/ffplay.1

ffmpeg/doc/ffserver-doc.html

ffmpeg/doc/ffserver-doc.texi

ffmpeg/doc/ffserver.1

ffmpeg/doc/ffserver.conf

ffmpeg/doc/hooks.html

ffmpeg/doc/hooks.texi

ffmpeg/doc/optimization.txt

ffmpeg/doc/texi2pod.pl

ffmpeg/ffinstall.nsi

ffmpeg/ffmpeg.c

ffmpeg/ffplay.c

ffmpeg/ffserver.c

ffmpeg/ffserver.h

ffmpeg/libavcodec

ffmpeg/libavcodec/.nbattrs

ffmpeg/libavcodec/4xm.c

ffmpeg/libavcodec/Doxyfile

ffmpeg/libavcodec/Makefile

ffmpeg/libavcodec/a52dec.c

ffmpeg/libavcodec/ac3.h

ffmpeg/libavcodec/ac3dec.c

ffmpeg/libavcodec/ac3enc.c

ffmpeg/libavcodec/ac3tab.h

ffmpeg/libavcodec/adpcm.c

ffmpeg/libavcodec/allcodecs.c

ffmpeg/libavcodec/alpha

ffmpeg/libavcodec/alpha/asm.h

ffmpeg/libavcodec/alpha/dsputil_alpha.c

ffmpeg/libavcodec/alpha/dsputil_alpha_asm.S

ffmpeg/libavcodec/alpha/motion_est_alpha.c

ffmpeg/libavcodec/alpha/motion_est_mvi_asm.S

ffmpeg/libavcodec/alpha/mpegvideo_alpha.c

ffmpeg/libavcodec/alpha/regdef.h

ffmpeg/libavcodec/alpha/simple_idct_alpha.c

ffmpeg/libavcodec/amr.c

ffmpeg/libavcodec/apiexample.c

ffmpeg/libavcodec/armv4l

ffmpeg/libavcodec/armv4l/dsputil_arm.c

ffmpeg/libavcodec/armv4l/jrevdct_arm.S

ffmpeg/libavcodec/armv4l/mpegvideo_arm.c

ffmpeg/libavcodec/armv4l/simple_idct_arm.S

ffmpeg/libavcodec/asv1.c

ffmpeg/libavcodec/avcodec.c

ffmpeg/libavcodec/avcodec.h

ffmpeg/libavcodec/bswap.h

ffmpeg/libavcodec/cabac.c

ffmpeg/libavcodec/cabac.h

ffmpeg/libavcodec/cljr.c

ffmpeg/libavcodec/common.c

ffmpeg/libavcodec/common.h

ffmpeg/libavcodec/cyuv.c

ffmpeg/libavcodec/dct-test.c

ffmpeg/libavcodec/dpcm.c

ffmpeg/libavcodec/dsputil.c

ffmpeg/libavcodec/dsputil.h

ffmpeg/libavcodec/dv.c

ffmpeg/libavcodec/dvdata.h

ffmpeg/libavcodec/error_resilience.c

ffmpeg/libavcodec/eval.c

ffmpeg/libavcodec/faad.c

ffmpeg/libavcodec/fastmemcpy.h

ffmpeg/libavcodec/fdctref.c

ffmpeg/libavcodec/fft-test.c

ffmpeg/libavcodec/fft.c

ffmpeg/libavcodec/ffv1.c

ffmpeg/libavcodec/golomb.c

ffmpeg/libavcodec/golomb.h

ffmpeg/libavcodec/h263.c

ffmpeg/libavcodec/h263data.h

ffmpeg/libavcodec/h263dec.c

ffmpeg/libavcodec/h264.c

ffmpeg/libavcodec/h264data.h

ffmpeg/libavcodec/huffyuv.c

ffmpeg/libavcodec/i386

ffmpeg/libavcodec/i386/cputest.c

ffmpeg/libavcodec/i386/dsputil_mmx.c

ffmpeg/libavcodec/i386/dsputil_mmx_avg.h

ffmpeg/libavcodec/i386/dsputil_mmx_rnd.h

ffmpeg/libavcodec/i386/fdct_mmx.c

ffmpeg/libavcodec/i386/fft_sse.c

ffmpeg/libavcodec/i386/idct_mmx.c

ffmpeg/libavcodec/i386/mmx.h

ffmpeg/libavcodec/i386/motion_est_mmx.c

ffmpeg/libavcodec/i386/mpegvideo_mmx.c

ffmpeg/libavcodec/i386/mpegvideo_mmx_template.c

ffmpeg/libavcodec/i386/simple_idct_mmx.c

ffmpeg/libavcodec/imgconvert.c

ffmpeg/libavcodec/imgconvert_template.h

ffmpeg/libavcodec/imgresample.c

ffmpeg/libavcodec/indeo3.c

ffmpeg/libavcodec/indeo3data.h

ffmpeg/libavcodec/interplayvideo.c

ffmpeg/libavcodec/jfdctfst.c

ffmpeg/libavcodec/jfdctint.c

ffmpeg/libavcodec/jrevdct.c

ffmpeg/libavcodec/liba52

ffmpeg/libavcodec/liba52/a52.h

ffmpeg/libavcodec/liba52/a52_internal.h

ffmpeg/libavcodec/liba52/a52_util.h

ffmpeg/libavcodec/liba52/bit_allocate.c

ffmpeg/libavcodec/liba52/bitstream.c

ffmpeg/libavcodec/liba52/bitstream.h

ffmpeg/libavcodec/liba52/crc.c

ffmpeg/libavcodec/liba52/downmix.c

ffmpeg/libavcodec/liba52/imdct.c

ffmpeg/libavcodec/liba52/mm_accel.h

ffmpeg/libavcodec/liba52/parse.c

ffmpeg/libavcodec/liba52/resample.c

ffmpeg/libavcodec/liba52/resample_c.c

ffmpeg/libavcodec/liba52/resample_mmx.c

ffmpeg/libavcodec/liba52/tables.h

ffmpeg/libavcodec/libpostproc

ffmpeg/libavcodec/libpostproc/.nbattrs

ffmpeg/libavcodec/libpostproc/Makefile

ffmpeg/libavcodec/libpostproc/mangle.h

ffmpeg/libavcodec/libpostproc/postprocess.c

ffmpeg/libavcodec/libpostproc/postprocess.h

ffmpeg/libavcodec/libpostproc/postprocess_internal.h

ffmpeg/libavcodec/libpostproc/postprocess_template.c

ffmpeg/libavcodec/mace.c

ffmpeg/libavcodec/mdct.c

ffmpeg/libavcodec/mdec.c

ffmpeg/libavcodec/mem.c

ffmpeg/libavcodec/mjpeg.c

ffmpeg/libavcodec/mlib

ffmpeg/libavcodec/mlib/dsputil_mlib.c

ffmpeg/libavcodec/motion_est.c

ffmpeg/libavcodec/motion_est_template.c

ffmpeg/libavcodec/motion_test.c

ffmpeg/libavcodec/mp3lameaudio.c

ffmpeg/libavcodec/mpeg12.c

ffmpeg/libavcodec/mpeg12data.h

ffmpeg/libavcodec/mpeg4data.h

ffmpeg/libavcodec/mpegaudio.c

ffmpeg/libavcodec/mpegaudio.h

ffmpeg/libavcodec/mpegaudiodec.c

ffmpeg/libavcodec/mpegaudiodectab.h

ffmpeg/libavcodec/mpegaudiotab.h

ffmpeg/libavcodec/mpegvideo.c

ffmpeg/libavcodec/mpegvideo.h

ffmpeg/libavcodec/msmpeg4.c

ffmpeg/libavcodec/msmpeg4data.h

ffmpeg/libavcodec/oggvorbis.c

ffmpeg/libavcodec/oggvorbis.h

ffmpeg/libavcodec/opts.c

ffmpeg/libavcodec/pcm.c

ffmpeg/libavcodec/ppc

ffmpeg/libavcodec/ppc/dsputil_altivec.c

ffmpeg/libavcodec/ppc/dsputil_altivec.h

ffmpeg/libavcodec/ppc/dsputil_ppc.c

ffmpeg/libavcodec/ppc/dsputil_ppc.h

ffmpeg/libavcodec/ppc/fft_altivec.c

ffmpeg/libavcodec/ppc/gcc_fixes.h

ffmpeg/libavcodec/ppc/gmc_altivec.c

ffmpeg/libavcodec/ppc/idct_altivec.c

ffmpeg/libavcodec/ppc/mpegvideo_altivec.c

ffmpeg/libavcodec/ppc/mpegvideo_ppc.c

ffmpeg/libavcodec/ps2

ffmpeg/libavcodec/ps2/dsputil_mmi.c

ffmpeg/libavcodec/ps2/idct_mmi.c

ffmpeg/libavcodec/ps2/mmi.h

ffmpeg/libavcodec/ps2/mpegvideo_mmi.c

ffmpeg/libavcodec/ra144.c

ffmpeg/libavcodec/ra144.h

ffmpeg/libavcodec/ra288.c

ffmpeg/libavcodec/ra288.h

ffmpeg/libavcodec/ratecontrol.c

ffmpeg/libavcodec/raw.c

ffmpeg/libavcodec/resample.c

ffmpeg/libavcodec/roqvideo.c

ffmpeg/libavcodec/rv10.c

ffmpeg/libavcodec/sh4

ffmpeg/libavcodec/sh4/dsputil_align.c

ffmpeg/libavcodec/sh4/dsputil_sh4.c

ffmpeg/libavcodec/sh4/idct_sh4.c

ffmpeg/libavcodec/sh4/qpel.c

ffmpeg/libavcodec/simple_idct.c

ffmpeg/libavcodec/simple_idct.h

ffmpeg/libavcodec/svq1.c

ffmpeg/libavcodec/svq1_cb.h

ffmpeg/libavcodec/svq1_vlc.h

ffmpeg/libavcodec/svq3.c

ffmpeg/libavcodec/utils.c

ffmpeg/libavcodec/vcr1.c

ffmpeg/libavcodec/vp3.c

ffmpeg/libavcodec/vp3data.h

ffmpeg/libavcodec/wmadata.h

ffmpeg/libavcodec/wmadec.c

ffmpeg/libavcodec/wmv2.c

ffmpeg/libavcodec/xan.c

ffmpeg/libavcodec/xvmcvideo.c

ffmpeg/libavformat

ffmpeg/libavformat/.nbattrs

ffmpeg/libavformat/4xm.c

ffmpeg/libavformat/Makefile

ffmpeg/libavformat/allformats.c

ffmpeg/libavformat/amr.c

ffmpeg/libavformat/asf.c

ffmpeg/libavformat/au.c

ffmpeg/libavformat/audio.c

ffmpeg/libavformat/avformat.h

ffmpeg/libavformat/avi.h

ffmpeg/libavformat/avidec.c

ffmpeg/libavformat/avienc.c

ffmpeg/libavformat/avio.c

ffmpeg/libavformat/avio.h

ffmpeg/libavformat/aviobuf.c

ffmpeg/libavformat/barpainet.c

ffmpeg/libavformat/barpainet.h

ffmpeg/libavformat/beosaudio.cpp

ffmpeg/libavformat/crc.c

ffmpeg/libavformat/cutils.c

ffmpeg/libavformat/dv.c

ffmpeg/libavformat/dv1394.c

ffmpeg/libavformat/dv1394.h

ffmpeg/libavformat/dvcore.c

ffmpeg/libavformat/dvcore.h

ffmpeg/libavformat/ffm.c

ffmpeg/libavformat/file.c

ffmpeg/libavformat/flvdec.c

ffmpeg/libavformat/flvenc.c

ffmpeg/libavformat/framehook.c

ffmpeg/libavformat/framehook.h

ffmpeg/libavformat/gif.c

ffmpeg/libavformat/gifdec.c

ffmpeg/libavformat/grab.c

ffmpeg/libavformat/http.c

ffmpeg/libavformat/idroq.c

ffmpeg/libavformat/img.c

ffmpeg/libavformat/ipmovie.c

ffmpeg/libavformat/jpeg.c

ffmpeg/libavformat/mov.c

ffmpeg/libavformat/movenc.c

ffmpeg/libavformat/mp3.c

ffmpeg/libavformat/mpeg.c

ffmpeg/libavformat/mpegts.c

ffmpeg/libavformat/mpegts.h

ffmpeg/libavformat/mpegtsenc.c

ffmpeg/libavformat/mpjpeg.c

ffmpeg/libavformat/nut.c

ffmpeg/libavformat/ogg.c

ffmpeg/libavformat/os_support.c

ffmpeg/libavformat/os_support.h

ffmpeg/libavformat/png.c

ffmpeg/libavformat/pnm.c

ffmpeg/libavformat/psxstr.c

ffmpeg/libavformat/raw.c

ffmpeg/libavformat/rm.c

ffmpeg/libavformat/rtp.c

ffmpeg/libavformat/rtp.h

ffmpeg/libavformat/rtpproto.c

ffmpeg/libavformat/rtsp.c

ffmpeg/libavformat/rtsp.h

ffmpeg/libavformat/rtspcodes.h

ffmpeg/libavformat/swf.c

ffmpeg/libavformat/tcp.c

ffmpeg/libavformat/udp.c

ffmpeg/libavformat/utils.c

ffmpeg/libavformat/wav.c

ffmpeg/libavformat/wc3movie.c

ffmpeg/libavformat/yuv.c

ffmpeg/libavformat/yuv4mpeg.c

ffmpeg/output_example.c

ffmpeg/tests

ffmpeg/tests/.nbattrs

ffmpeg/tests/Makefile

ffmpeg/tests/audiogen.c

ffmpeg/tests/dsptest.c

ffmpeg/tests/ffmpeg.regression.ref

ffmpeg/tests/ffserver.regression.ref

ffmpeg/tests/lena.pnm

ffmpeg/tests/libav.regression.ref

ffmpeg/tests/regression.sh

ffmpeg/tests/rotozoom.c

ffmpeg/tests/rotozoom.regression.ref

ffmpeg/tests/server-regression.sh

ffmpeg/tests/test.conf

ffmpeg/tests/tiny_psnr.c

ffmpeg/tests/videogen.c

ffmpeg/vhook

ffmpeg/vhook/.nbattrs

ffmpeg/vhook/Makefile

ffmpeg/vhook/drawtext.c

ffmpeg/vhook/fish.c

ffmpeg/vhook/imlib2.c

ffmpeg/vhook/null.c

ffmpeg/vhook/ppm.c

ffmpeg/xvmc_render.h

getopt

getopt/README

getopt/getopt.c

getopt/getopt.h

getopt/getopt1.c

gt/COPYING.LIB

gt/Makefile.am

gt/Makefile.in

gt/README

gt/gnuavi.c

gt/gnuavi.h

gt/gnuplay.c

gt/gt.c

gt/gt.h

gt/gtapi.c

gt/gtapi.h

gt/gtatoms.h

gt/gttypes.h

gt/gtvr.c

gt/gtvr.h

gt/parse_gt.c

gt/ppm2qt.c

gt/ppm2qtvr.c

gt/sound.c

gt/sound.h

gt/video.c

gt/video.h

gt/xt.c

gt/xt.h

install-sh

man/gvidcap.man

man/index.bt

man/xvidcap.man

missing

mkinstalldirs

src/Makefile.am

src/Makefile.in

src/app_data.h

src/capture.c

src/capture.h

src/codecs.h

src/colors.c

src/colors.h

src/control.h

src/fallback.h

src/frame.c

src/frame.h

src/gtk2_control.c

src/gtk2_control.h

src/gtk2_frame.c

src/gtk2_frame.h

src/gtk2_options.c

src/gtk2_options.h

src/gtk2_support.c

src/gtk2_support.h

src/job.c

src/job.h

src/led_meter.c

src/led_meter.h

src/main.c

src/main.h

src/malloc.c

src/mkresfile.sh

src/mngutil.c

src/mngutil.h

src/options.c

src/realloc.c

src/util.c

src/util.h

src/video.c

src/video.h

src/xt_control.c

src/xt_control.h

src/xt_frame.c

src/xt_frame.h

src/xt_options.c

src/xt_options.h

src/xtoffmpeg.c

src/xtoffmpeg.h

src/xtojpg.c

src/xtojpg.h

src/xtomng.c

src/xtomng.h

src/xtopng.c

src/xtopng.h

src/xtopnm.c

src/xtopnm.h

src/xtoqtf.c

src/xtoqtf.h

src/xtoxwd.c

src/xtoxwd.h

src/xutil.c

src/xutil.h

xbm/animate.png

xbm/animate.xbm

xbm/edit.png

xbm/edit.xbm

xbm/help.xbm

xbm/mkvideo.xbm

xbm/move.png

xbm/move.xbm

xbm/next.png

xbm/next.xbm

xbm/pause.png

xbm/pause.xbm

xbm/prev.png

xbm/prev.xbm

xbm/record.png

xbm/record.xbm

xbm/record_off.png

xbm/record_on.png

xbm/select.png

xbm/select.xbm

xbm/step.png

xbm/step.xbm

xbm/stop.png

xbm/stop.xbm

Show diffs side-by-side

added added

removed removed

ffmpeg/libavcodec/dct-test.c

/**
 * @file dct-test.c
 * Started from sample code by Juan J. Sierralta P.
 */

#include <stdlib.h>

#include <stdio.h>

#include <string.h>

#include <sys/time.h>

#include <unistd.h>

#include "dsputil.h"

#include "i386/mmx.h"

#include "simple_idct.h"

#ifndef MAX

#define MAX(a, b) (((a) > (b)) ? (a) : (b))

#endif

/* reference fdct/idct */

extern void fdct(DCTELEM *block);

extern void idct(DCTELEM *block);

extern void init_fdct();

extern void j_rev_dct(DCTELEM *data);

extern void ff_mmx_idct(DCTELEM *data);

extern void ff_mmxext_idct(DCTELEM *data);

extern void odivx_idct_c (short *block);

#define AANSCALE_BITS 12

/*
 * One scale factor per coefficient position of the 8x8 block.
 * dct_error() divides by these values to rescale the output of
 * fdct_ifast before comparing it with the reference transform.
 */
static const unsigned short aanscales[64] = {

/* precomputed values scaled up by 14 bits */

16384, 22725, 21407, 19266, 16384, 12873, 8867, 4520,

22725, 31521, 29692, 26722, 22725, 17855, 12299, 6270,

21407, 29692, 27969, 25172, 21407, 16819, 11585, 5906,

19266, 26722, 25172, 22654, 19266, 15137, 10426, 5315,

16384, 22725, 21407, 19266, 16384, 12873, 8867, 4520,

12873, 17855, 16819, 15137, 12873, 10114, 6967, 3552,

8867, 12299, 11585, 10426, 8867, 6967, 4799, 2446,

4520, 6270, 5906, 5315, 4520, 3552, 2446, 1247

};

/*
 * Clamping lookup table, filled in by main(): entry [v + MAX_NEG_CROP]
 * holds v for v in 0..255, the first MAX_NEG_CROP entries hold 0 and the
 * last MAX_NEG_CROP entries hold 255.
 * NOTE(review): nothing in this file reads it; presumably it is referenced
 * by the transform implementations linked into the test -- confirm.
 */
uint8_t cropTbl[256 + 2 * MAX_NEG_CROP];

/* Return the current time of day, as given by gettimeofday(), in microseconds. */
int64_t gettime(void)
{
    struct timeval now;
    int64_t usec;

    gettimeofday(&now, NULL);

    /* widen the seconds before scaling so the product is computed in 64 bits */
    usec = (int64_t)now.tv_sec * 1000000;
    usec += now.tv_usec;
    return usec;
}

#define NB_ITS 20000

#define NB_ITS_SPEED 50000

/*
 * Input permutation used by dct_error() for ff_mmx_idct, ff_mmxext_idct and
 * j_rev_dct: coefficient i of the generated block is stored at position
 * idct_mmx_perm[i]. Filled in at start-up by idct_mmx_init().
 */
static short idct_mmx_perm[64];

/*
 * Input permutation used by dct_error() for ff_simple_idct_mmx: coefficient
 * i of the generated block is stored at position idct_simple_mmx_perm[i].
 */
static short idct_simple_mmx_perm[64]={

0x00, 0x08, 0x04, 0x09, 0x01, 0x0C, 0x05, 0x0D,

0x10, 0x18, 0x14, 0x19, 0x11, 0x1C, 0x15, 0x1D,

0x20, 0x28, 0x24, 0x29, 0x21, 0x2C, 0x25, 0x2D,

0x12, 0x1A, 0x16, 0x1B, 0x13, 0x1E, 0x17, 0x1F,

0x02, 0x0A, 0x06, 0x0B, 0x03, 0x0E, 0x07, 0x0F,

0x30, 0x38, 0x34, 0x39, 0x31, 0x3C, 0x35, 0x3D,

0x22, 0x2A, 0x26, 0x2B, 0x23, 0x2E, 0x27, 0x2F,

0x32, 0x3A, 0x36, 0x3B, 0x33, 0x3E, 0x37, 0x3F,

};

/*
 * Fill idct_mmx_perm[] with the input permutation that dct_error() applies
 * before calling ff_mmx_idct, ff_mmxext_idct or j_rev_dct.
 * Must be called once before dct_error(); main() does so at start-up.
 */
void idct_mmx_init(void)
{
    int i;

    /* the mmx/mmxext idct uses a reordered input, so we patch scan tables */
    for (i = 0; i < 64; i++) {
        /*
         * Bits 3-5 of the index are kept as they are; within the low three
         * bits, bit 0 moves up to bit 2 and bits 1-2 move down to bits 0-1.
         */
        idct_mmx_perm[i] = (i & 0x38) | ((i & 6) >> 1) | ((i & 1) << 2);
    }
}

/* Working buffer handed to the transform under test (transformed in place). */
static DCTELEM block[64] __attribute__ ((aligned (8)));

/* Generated test input; dct_error() later passes it to the reference transform. */
static DCTELEM block1[64] __attribute__ ((aligned (8)));

/* Copy of the generated input; only read by the disabled debug dump in dct_error(). */
static DCTELEM block_org[64] __attribute__ ((aligned (8)));

/*
 * Copy the generated input block1[] into the working buffer block[],
 * applying the input permutation that the given transform expects.
 */
static void dct_load_block(void (*fdct_func)(DCTELEM *block))
{
    int i;

    if (fdct_func == ff_mmx_idct ||
        fdct_func == j_rev_dct || fdct_func == ff_mmxext_idct) {
        for (i = 0; i < 64; i++)
            block[idct_mmx_perm[i]] = block1[i];
    } else if (fdct_func == ff_simple_idct_mmx) {
        for (i = 0; i < 64; i++)
            block[idct_simple_mmx_perm[i]] = block1[i];
    } else {
        for (i = 0; i < 64; i++)
            block[i] = block1[i];
    }
}

/*
 * Measure the accuracy and the speed of one (I)DCT implementation.
 *
 * Accuracy: NB_ITS pseudo-random blocks (srandom(0), so every run sees the
 * same data) are transformed by fdct_func and by fdct_ref, and the
 * differences are accumulated and printed on stdout.
 * Speed: fdct_func is then called in batches of NB_ITS_SPEED until at least
 * one second has elapsed, and the rate is printed.
 *
 * name      label printed in the report lines
 * is_idct   non-zero when testing an inverse transform; for test 0 the
 *           random block is then first passed through fdct() and scaled down
 * fdct_func transform under test, works in place on a 64-element block
 * fdct_ref  reference transform, works in place on a 64-element block
 * test      input pattern: 0, 1 or 2 (see help()); for any other value the
 *           accuracy test runs on all-zero blocks
 */
void dct_error(const char *name, int is_idct,
               void (*fdct_func)(DCTELEM *block),
               void (*fdct_ref)(DCTELEM *block), int test)
{
    int it, i, scale;
    int err_inf, v;
    int64_t err2, ti, ti1, it1;
    int64_t sysErr[64], sysErrMax=0;
    int maxout=0;
    int blockSumErrMax=0, blockSumErr;

    srandom(0);

    err_inf = 0;
    err2 = 0;
    for(i=0; i<64; i++) sysErr[i]=0;
    for(it=0;it<NB_ITS;it++) {
        for(i=0;i<64;i++)
            block1[i] = 0;
        switch(test){
        case 0:
            for(i=0;i<64;i++)
                block1[i] = (random() % 512) -256;
            if (is_idct){
                fdct(block1);

                for(i=0;i<64;i++)
                    block1[i]>>=3;
            }
            break;
        case 1:{
            int num= (random()%10)+1;
            for(i=0;i<num;i++) {
                /*
                 * Draw the position first and the value second. Written as a
                 * single expression the order of the two random() calls is
                 * unspecified, which made the test data compiler dependent.
                 */
                int pos = random() % 64;
                block1[pos] = (random() % 512) -256;
            }
        }break;
        case 2:
            block1[0]= (random()%4096)-2048;
            block1[63]= (block1[0]&1)^1;
            break;
        }

#if 0 // simulate mismatch control
{ int sum=0;
        for(i=0;i<64;i++)
           sum+=block1[i];

        if((sum&1)==0) block1[63]^=1;
}
#endif

        for(i=0; i<64; i++)
            block_org[i]= block1[i];

        dct_load_block(fdct_func);

#if 0 // simulate mismatch control for tested IDCT but not the ref
{ int sum=0;
        for(i=0;i<64;i++)
           sum+=block[i];

        if((sum&1)==0) block[63]^=1;
}
#endif

        fdct_func(block);
        emms(); /* for ff_mmx_idct */

        /* bring the fdct_ifast output to the scale of the reference output */
        if (fdct_func == fdct_ifast) {
            for(i=0; i<64; i++) {
                scale = 8*(1 << (AANSCALE_BITS + 11)) / aanscales[i];
                block[i] = (block[i] * scale /*+ (1<<(AANSCALE_BITS-1))*/) >> AANSCALE_BITS;
            }
        }

        fdct_ref(block1);

        blockSumErr=0;
        for(i=0;i<64;i++) {
            v = abs(block[i] - block1[i]);
            if (v > err_inf)
                err_inf = v;                    /* largest single error */
            err2 += v * v;                      /* sum of squared errors */
            sysErr[i] += block[i] - block1[i];  /* signed error per position */
            blockSumErr += v;
            if( abs(block[i])>maxout) maxout=abs(block[i]);
        }
        if(blockSumErrMax < blockSumErr) blockSumErrMax= blockSumErr;
#if 0 // print different matrix pairs
        if(blockSumErr){
            printf("\n");
            for(i=0; i<64; i++){
                if((i&7)==0) printf("\n");
                printf("%4d ", block_org[i]);
            }
            for(i=0; i<64; i++){
                if((i&7)==0) printf("\n");
                printf("%4d ", block[i] - block1[i]);
            }
        }
#endif
    }
    for(i=0; i<64; i++) sysErrMax= MAX(sysErrMax, ABS(sysErr[i]));

#if 1 // dump systematic errors
    for(i=0; i<64; i++){
        if(i%8==0) printf("\n");
        printf("%5d ", (int)sysErr[i]);
    }
    printf("\n");
#endif

    printf("%s %s: err_inf=%d err2=%0.8f syserr=%0.8f maxout=%d blockSumErr=%d\n",
           is_idct ? "IDCT" : "DCT",
           name, err_inf, (double)err2 / NB_ITS / 64.0, (double)sysErrMax / NB_ITS, maxout, blockSumErrMax);
#if 1 //Speed test
    /* speed test */
    for(i=0;i<64;i++)
        block1[i] = 0;
    switch(test){
    case 0:
        for(i=0;i<64;i++)
            block1[i] = (random() % 512) -256;
        if (is_idct){
            fdct(block1);

            for(i=0;i<64;i++)
                block1[i]>>=3;
        }
        break;
    case 1:
    case 2:
        block1[0] = (random() % 512) -256;
        block1[1] = (random() % 512) -256;
        block1[2] = (random() % 512) -256;
        block1[3] = (random() % 512) -256;
        break;
    }

    /*
     * NOTE(review): this permuted copy is overwritten by the plain copy at
     * the top of every timing iteration below, so the timed calls always
     * see block1[] in natural order -- confirm whether that is intended.
     */
    dct_load_block(fdct_func);

    ti = gettime();
    it1 = 0;
    do {
        for(it=0;it<NB_ITS_SPEED;it++) {
            /* the transform works in place, so reload the input every time */
            for(i=0; i<64; i++)
                block[i]= block1[i];
//            memcpy(block, block1, sizeof(DCTELEM) * 64);
// dont memcpy especially not fastmemcpy because it does movntq !!!
            fdct_func(block);
        }
        it1 += NB_ITS_SPEED;
        ti1 = gettime() - ti;
    } while (ti1 < 1000000);
    emms();

    /* it1 calls in ti1 microseconds -> thousands of calls per second */
    printf("%s %s: %0.1f kdct/s\n",
           is_idct ? "IDCT" : "DCT",
           name, (double)it1 * 1000.0 / (double)ti1);
#endif
}

/* 8x8 output image written by the idct248 implementation under test. */
static uint8_t img_dest[64] __attribute__ ((aligned (8)));
/* 8x8 output image written by the reference idct248_ref(). */
static uint8_t img_dest1[64] __attribute__ ((aligned (8)));


void idct248_ref(uint8_t *dest, int linesize, int16_t *block)

271

{

272

static int init;

273

static double c8[8][8];

274

static double c4[4][4];

275

double block1[64], block2[64], block3[64];

276

double s, sum, v;

277

int i, j, k;

278

279

if (!init) {

280

init = 1;

281

282

for(i=0;i<8;i++) {

283

sum = 0;

284

for(j=0;j<8;j++) {

285

s = (i==0) ? sqrt(1.0/8.0) : sqrt(1.0/4.0);

286

c8[i][j] = s * cos(M_PI * i * (j + 0.5) / 8.0);

287

sum += c8[i][j] * c8[i][j];

288

}

289

}

290

291

for(i=0;i<4;i++) {

292

sum = 0;

293

for(j=0;j<4;j++) {

294

s = (i==0) ? sqrt(1.0/4.0) : sqrt(1.0/2.0);

295

c4[i][j] = s * cos(M_PI * i * (j + 0.5) / 4.0);

296

sum += c4[i][j] * c4[i][j];

297

}

298

}

299

}

300

301

/* butterfly */

302

s = 0.5 * sqrt(2.0);

303

for(i=0;i<4;i++) {

304

for(j=0;j<8;j++) {

305

block1[8*(2*i)+j] = (block[8*(2*i)+j] + block[8*(2*i+1)+j]) * s;

306

block1[8*(2*i+1)+j] = (block[8*(2*i)+j] - block[8*(2*i+1)+j]) * s;

307

}

308

}

309

310

/* idct8 on lines */

311

for(i=0;i<8;i++) {

312

for(j=0;j<8;j++) {

313

sum = 0;

314

for(k=0;k<8;k++)

315

sum += c8[k][j] * block1[8*i+k];

316

block2[8*i+j] = sum;

317

}

318

}

319

320

/* idct4 */

321

for(i=0;i<8;i++) {

322

for(j=0;j<4;j++) {

323

/* top */

324

sum = 0;

325

for(k=0;k<4;k++)

326

sum += c4[k][j] * block2[8*(2*k)+i];

327

block3[8*(2*j)+i] = sum;

328

329

/* bottom */

330

sum = 0;

331

for(k=0;k<4;k++)

332

sum += c4[k][j] * block2[8*(2*k+1)+i];

333

block3[8*(2*j+1)+i] = sum;

334

}

335

}

336

337

/* clamp and store the result */

338

for(i=0;i<8;i++) {

339

for(j=0;j<8;j++) {

340

v = block3[8*i+j];

341

if (v < 0)

342

v = 0;

343

else if (v > 255)

344

v = 255;

345

dest[i * linesize + j] = (int)rint(v);

346

}

347

}

348

}

349

350

void idct248_error(const char *name,

351

void (*idct248_put)(uint8_t *dest, int line_size, int16_t *block))

352

{

353

int it, i, it1, ti, ti1, err_max, v;

354

355

srandom(0);

356

357

/* just one test to see if code is correct (precision is less

358

important here) */

359

err_max = 0;

360

for(it=0;it<NB_ITS;it++) {

361

362

/* XXX: use forward transform to generate values */

363

for(i=0;i<64;i++)

364

block1[i] = (random() % 256) - 128;

365

block1[0] += 1024;

366

367

for(i=0; i<64; i++)

368

block[i]= block1[i];

369

idct248_ref(img_dest1, 8, block);

370

371

for(i=0; i<64; i++)

372

block[i]= block1[i];

373

idct248_put(img_dest, 8, block);

374

375

for(i=0;i<64;i++) {

376

v = abs((int)img_dest[i] - (int)img_dest1[i]);

377

if (v == 255)

378

printf("%d %d\n", img_dest[i], img_dest1[i]);

379

if (v > err_max)

380

err_max = v;

381

}

382

#if 0

383

printf("ref=\n");

384

for(i=0;i<8;i++) {

385

int j;

386

for(j=0;j<8;j++) {

387

printf(" %3d", img_dest1[i*8+j]);

388

}

389

printf("\n");

390

}

391

392

printf("out=\n");

393

for(i=0;i<8;i++) {

394

int j;

395

for(j=0;j<8;j++) {

396

printf(" %3d", img_dest[i*8+j]);

397

}

398

printf("\n");

399

}

400

#endif

401

}

402

printf("%s %s: err_inf=%d\n",

403

1 ? "IDCT248" : "DCT248",

404

name, err_max);

405

406

ti = gettime();

407

it1 = 0;

408

do {

409

for(it=0;it<NB_ITS_SPEED;it++) {

410

for(i=0; i<64; i++)

411

block[i]= block1[i];

412

// memcpy(block, block1, sizeof(DCTELEM) * 64);

413

// dont memcpy especially not fastmemcpy because it does movntq !!!

414

idct248_put(img_dest, 8, block);

415

}

416

it1 += NB_ITS_SPEED;

417

ti1 = gettime() - ti;

418

} while (ti1 < 1000000);

419

emms();

420

421

printf("%s %s: %0.1f kdct/s\n",

422

1 ? "IDCT248" : "DCT248",

423

name, (double)it1 * 1000.0 / (double)ti1);

424

}

425

426

/*
 * Print the command-line usage summary on stdout and terminate the
 * program with exit status 1. Does not return.
 */
void help(void)
{
    printf("dct-test [-i] [<test-number>]\n"
           "test-number 0 -> test with random matrixes\n"
           " 1 -> test with random sparse matrixes\n"
           " 2 -> do 3. test from mpeg4 std\n"
           "-i test IDCT implementations\n"
           "-4 test IDCT248 implementations\n");
    exit(1);
}


int main(int argc, char **argv)

438

{

439

int test_idct = 0, test_248_dct = 0;

440

int c,i;

441

int test=1;

442

443

init_fdct();

444

idct_mmx_init();

445

446

for(i=0;i<256;i++) cropTbl[i + MAX_NEG_CROP] = i;

447

for(i=0;i<MAX_NEG_CROP;i++) {

448

cropTbl[i] = 0;

449

cropTbl[i + MAX_NEG_CROP + 256] = 255;

450

}

451

452

for(;;) {

453

c = getopt(argc, argv, "ih4");

454

if (c == -1)

455

break;

456

switch(c) {

457

case 'i':

458

test_idct = 1;

459

break;

460

case '4':

461

test_248_dct = 1;

462

break;

463

default :

464

case 'h':

465

help();

466

break;

467

}

468

}

469

470

if(optind <argc) test= atoi(argv[optind]);

471

472

printf("ffmpeg DCT/IDCT test\n");

473

474

if (test_248_dct) {

475

idct248_error("SIMPLE-C", simple_idct248_put);

476

} else {

477

if (!test_idct) {

478

dct_error("REF-DBL", 0, fdct, fdct, test); /* only to verify code ! */

479

dct_error("IJG-AAN-INT", 0, fdct_ifast, fdct, test);

480

dct_error("IJG-LLM-INT", 0, ff_jpeg_fdct_islow, fdct, test);

481

dct_error("MMX", 0, ff_fdct_mmx, fdct, test);

482

} else {

483

dct_error("REF-DBL", 1, idct, idct, test);

484

dct_error("INT", 1, j_rev_dct, idct, test);

485

dct_error("LIBMPEG2-MMX", 1, ff_mmx_idct, idct, test);

486

dct_error("LIBMPEG2-MMXEXT", 1, ff_mmxext_idct, idct, test);

487

dct_error("SIMPLE-C", 1, simple_idct, idct, test);

488

dct_error("SIMPLE-MMX", 1, ff_simple_idct_mmx, idct, test);

489

// dct_error("ODIVX-C", 1, odivx_idct_c, idct);

490

//printf(" test against odivx idct\n");

491

// dct_error("REF", 1, idct, odivx_idct_c);

492

// dct_error("INT", 1, j_rev_dct, odivx_idct_c);

493

// dct_error("MMX", 1, ff_mmx_idct, odivx_idct_c);

494

// dct_error("MMXEXT", 1, ff_mmxext_idct, odivx_idct_c);

495

// dct_error("SIMPLE-C", 1, simple_idct, odivx_idct_c);

496

// dct_error("SIMPLE-MMX", 1, ff_simple_idct_mmx, odivx_idct_c);

497

// dct_error("ODIVX-C", 1, odivx_idct_c, odivx_idct_c);

498

}

499

}

500

return 0;

501

}

Older »