~ubuntu-branches/ubuntu/raring/libjpeg-turbo/raring-security

« back to all changes in this revision

Viewing changes to jfdctfst.c

Committer: Package Import Robot
Author(s): Tom Gall
Date: 2011-09-13 03:53:56 UTC
Revision ID: package-import@ubuntu.com-20110913035356-1jybp1r6on1l3son

Tags: upstream-1.1.90+svn702

Import upstream version 1.1.90+svn702

files added:

BUILDING.txt

CMakeLists.txt

ChangeLog.txt

Makefile.am

README

README-turbo.txt

acinclude.m4

bmp.c

bmp.h

cderror.h

cdjpeg.c

cdjpeg.h

change.log

cjpeg.1

cjpeg.c

cmakescripts

cmakescripts/getdate.bat

cmakescripts/testclean.cmake

coderules.txt

configure.ac

djpeg.1

djpeg.c

doc/html

doc/html/annotated.html

doc/html/bc_s.png

doc/html/classes.html

doc/html/closed.png

doc/html/doxygen.css

doc/html/doxygen.png

doc/html/functions.html

doc/html/functions_vars.html

doc/html/group___turbo_j_p_e_g.html

doc/html/index.html

doc/html/installdox

doc/html/jquery.js

doc/html/modules.html

doc/html/nav_f.png

doc/html/nav_h.png

doc/html/open.png

doc/html/search

doc/html/search/all_64.html

doc/html/search/all_68.html

doc/html/search/all_6e.html

doc/html/search/all_6f.html

doc/html/search/all_72.html

doc/html/search/all_74.html

doc/html/search/all_77.html

doc/html/search/all_78.html

doc/html/search/all_79.html

doc/html/search/classes_74.html

doc/html/search/close.png

doc/html/search/mag_sel.png

doc/html/search/nomatches.html

doc/html/search/search.css

doc/html/search/search.js

doc/html/search/search_l.png

doc/html/search/search_m.png

doc/html/search/search_r.png

doc/html/search/variables_64.html

doc/html/search/variables_68.html

doc/html/search/variables_6e.html

doc/html/search/variables_6f.html

doc/html/search/variables_72.html

doc/html/search/variables_77.html

doc/html/search/variables_78.html

doc/html/search/variables_79.html

doc/html/structtjregion.html

doc/html/structtjscalingfactor.html

doc/html/structtjtransform.html

doc/html/tab_a.png

doc/html/tab_b.png

doc/html/tab_h.png

doc/html/tab_s.png

doc/html/tabs.css

doxygen.config

example.c

filelist.txt

install.txt

jaricom.c

java

java/CMakeLists.txt

java/MANIFEST.MF

java/Makefile.am

java/README

java/TJExample.java

java/TJUnitTest.java

java/doc

java/doc/allclasses-frame.html

java/doc/allclasses-noframe.html

java/doc/constant-values.html

java/doc/deprecated-list.html

java/doc/help-doc.html

java/doc/index-all.html

java/doc/index.html

java/doc/org

java/doc/org/libjpegturbo

java/doc/org/libjpegturbo/turbojpeg

java/doc/org/libjpegturbo/turbojpeg/TJ.html

java/doc/org/libjpegturbo/turbojpeg/TJCompressor.html

java/doc/org/libjpegturbo/turbojpeg/TJDecompressor.html

java/doc/org/libjpegturbo/turbojpeg/TJScalingFactor.html

java/doc/org/libjpegturbo/turbojpeg/TJTransform.html

java/doc/org/libjpegturbo/turbojpeg/TJTransformer.html

java/doc/org/libjpegturbo/turbojpeg/package-frame.html

java/doc/org/libjpegturbo/turbojpeg/package-summary.html

java/doc/org/libjpegturbo/turbojpeg/package-tree.html

java/doc/overview-tree.html

java/doc/package-list

java/doc/resources

java/doc/resources/inherit.gif

java/doc/serialized-form.html

java/doc/stylesheet.css

java/org

java/org/libjpegturbo

java/org/libjpegturbo/turbojpeg

java/org/libjpegturbo/turbojpeg/TJ.java

java/org/libjpegturbo/turbojpeg/TJCompressor.java

java/org/libjpegturbo/turbojpeg/TJDecompressor.java

java/org/libjpegturbo/turbojpeg/TJLoader.java

java/org/libjpegturbo/turbojpeg/TJLoader.java.in

java/org/libjpegturbo/turbojpeg/TJScalingFactor.java

java/org/libjpegturbo/turbojpeg/TJTransform.java

java/org/libjpegturbo/turbojpeg/TJTransformer.java

java/org_libjpegturbo_turbojpeg_TJ.h

java/org_libjpegturbo_turbojpeg_TJCompressor.h

java/org_libjpegturbo_turbojpeg_TJDecompressor.h

java/org_libjpegturbo_turbojpeg_TJTransformer.h

jcapimin.c

jcapistd.c

jcarith.c

jccoefct.c

jccolext.c

jccolor.c

jcdctmgr.c

jchuff.c

jchuff.h

jcinit.c

jcmainct.c

jcmarker.c

jcmaster.c

jcomapi.c

jconfig.h.in

jconfig.txt

jcparam.c

jcphuff.c

jcprepct.c

jcsample.c

jctrans.c

jdapimin.c

jdapistd.c

jdarith.c

jdatadst-tj.c

jdatadst.c

jdatasrc-tj.c

jdatasrc.c

jdcoefct.c

jdcolext.c

jdcolor.c

jdct.h

jddctmgr.c

jdhuff.c

jdhuff.h

jdinput.c

jdmainct.c

jdmarker.c

jdmaster.c

jdmerge.c

jdmrgext.c

jdphuff.c

jdpostct.c

jdsample.c

jdtrans.c

jerror.c

jerror.h

jfdctflt.c

jfdctfst.c

jfdctint.c

jidctflt.c

jidctfst.c

jidctint.c

jidctred.c

jinclude.h

jmemmgr.c

jmemnobs.c

jmemsys.h

jmorecfg.h

jpegcomp.h

jpegint.h

jpeglib.h

jpegtran.1

jpegtran.c

jquant1.c

jquant2.c

jsimd.h

jsimd_none.c

jsimddct.h

jutils.c

jversion.h

libjpeg.map.in

libjpeg.txt

rdbmp.c

rdcolmap.c

rdgif.c

rdjpgcom.1

rdjpgcom.c

rdppm.c

rdrle.c

rdswitch.c

rdtarga.c

release

release/Description.plist.in

release/Info.plist.in

release/License.rtf

release/ReadMe.rtf

release/Welcome.rtf

release/copyright

release/deb-control.tmpl

release/libjpeg-turbo.nsi.in

release/libjpeg-turbo.spec.in

release/makecygwinpkg.in

release/makedpkg.in

release/makemacpkg.in

release/makesunpkg.in

release/pkginfo.in

release/uninstall.in

sharedlib

sharedlib/CMakeLists.txt

simd

simd/CMakeLists.txt

simd/Makefile.am

simd/jcclrmmx.asm

simd/jcclrss2-64.asm

simd/jcclrss2.asm

simd/jccolmmx.asm

simd/jccolss2-64.asm

simd/jccolss2.asm

simd/jcgrammx.asm

simd/jcgrass2-64.asm

simd/jcgrass2.asm

simd/jcgrymmx.asm

simd/jcgryss2-64.asm

simd/jcgryss2.asm

simd/jcolsamp.inc

simd/jcqnt3dn.asm

simd/jcqntmmx.asm

simd/jcqnts2f-64.asm

simd/jcqnts2f.asm

simd/jcqnts2i-64.asm

simd/jcqnts2i.asm

simd/jcqntsse.asm

simd/jcsammmx.asm

simd/jcsamss2-64.asm

simd/jcsamss2.asm

simd/jdclrmmx.asm

simd/jdclrss2-64.asm

simd/jdclrss2.asm

simd/jdcolmmx.asm

simd/jdcolss2-64.asm

simd/jdcolss2.asm

simd/jdct.inc

simd/jdmermmx.asm

simd/jdmerss2-64.asm

simd/jdmerss2.asm

simd/jdmrgmmx.asm

simd/jdmrgss2-64.asm

simd/jdmrgss2.asm

simd/jdsammmx.asm

simd/jdsamss2-64.asm

simd/jdsamss2.asm

simd/jf3dnflt.asm

simd/jfmmxfst.asm

simd/jfmmxint.asm

simd/jfss2fst-64.asm

simd/jfss2fst.asm

simd/jfss2int-64.asm

simd/jfss2int.asm

simd/jfsseflt-64.asm

simd/jfsseflt.asm

simd/ji3dnflt.asm

simd/jimmxfst.asm

simd/jimmxint.asm

simd/jimmxred.asm

simd/jiss2flt-64.asm

simd/jiss2flt.asm

simd/jiss2fst-64.asm

simd/jiss2fst.asm

simd/jiss2int-64.asm

simd/jiss2int.asm

simd/jiss2red-64.asm

simd/jiss2red.asm

simd/jisseflt.asm

simd/jsimd.h

simd/jsimd_arm.c

simd/jsimd_arm_neon.S

simd/jsimd_i386.c

simd/jsimd_x86_64.c

simd/jsimdcfg.inc.h

simd/jsimdcpu.asm

simd/jsimdext.inc

simd/nasm_lt.sh

structure.txt

testimg.bmp

testimgari.jpg

testimgari.ppm

testimgcrop.jpg

testimgflt-nosimd.jpg

testimgflt.jpg

testimgflt.ppm

testimgfst.jpg

testimgfst.ppm

testimgfst100.jpg

testimgfst1_2.ppm

testimgfst1_4.ppm

testimgfst1_8.ppm

testimggray.jpg

testimgint.jpg

testimgint.ppm

testimgint1_2.ppm

testimgint1_4.ppm

testimgint1_8.ppm

testimgp.jpg

testorig.jpg

testorig.ppm

tjbench.c

tjunittest.c

tjutil.c

tjutil.h

transupp.c

transupp.h

turbojpeg-jni.c

turbojpeg-mapfile

turbojpeg-mapfile.jni

turbojpeg.c

turbojpeg.h

usage.txt

win/config.h.in

win/jconfig.h.in

win/jpeg62.def

win/jpeg7.def

win/jpeg8.def

win/jsimdcfg.inc

wizard.txt

wrbmp.c

wrgif.c

wrjpgcom.1

wrjpgcom.c

wrppm.c

wrrle.c

wrtarga.c

Show diffs side-by-side

added added

removed removed

jfdctfst.c

/*
 * jfdctfst.c
 *
 * This file is part of the Independent JPEG Group's software.
 * For conditions of distribution and use, see the accompanying README file.
 *
 * This file contains a fast, not so accurate integer implementation of the
 * forward DCT (Discrete Cosine Transform).
 *
 * A 2-D DCT can be done by 1-D DCT on each row followed by 1-D DCT
 * on each column.  Direct algorithms are also available, but they are
 * much more complex and seem not to be any faster when reduced to code.
 *
 * This implementation is based on Arai, Agui, and Nakajima's algorithm for
 * scaled DCT.  Their original paper (Trans. IEICE E-71(11):1095) is in
 * Japanese, but the algorithm is described in the Pennebaker & Mitchell
 * JPEG textbook (see REFERENCES section in file README).  The following code
 * is based directly on figure 4-8 in P&M.
 *
 * While an 8-point DCT cannot be done in less than 11 multiplies, it is
 * possible to arrange the computation so that many of the multiplies are
 * simple scalings of the final outputs.  These multiplies can then be
 * folded into the multiplications or divisions by the JPEG quantization
 * table entries.  The AA&N method leaves only 5 multiplies and 29 adds
 * to be done in the DCT itself.
 *
 * The primary disadvantage of this method is that with fixed-point math,
 * accuracy is lost due to imprecise representation of the scaled
 * quantization values.  The smaller the quantization table entry, the less
 * precise the scaled value, so this implementation does worse with high-
 * quality-setting files than with low-quality ones.
 */

#define JPEG_INTERNALS

#include "jinclude.h"

#include "jpeglib.h"

#include "jdct.h" /* Private declarations for DCT subsystem */

#ifdef DCT_IFAST_SUPPORTED

* This module is specialized to the case DCTSIZE = 8.

#if DCTSIZE != 8

Sorry, this code only copes with 8x8 DCTs. /* deliberate syntax err */

#endif

/* Scaling decisions are generally the same as in the LL&M algorithm;
 * see jfdctint.c for more details.  However, we choose to descale
 * (right shift) multiplication products as soon as they are formed,
 * rather than carrying additional fractional bits into subsequent additions.
 * This compromises accuracy slightly, but it lets us save a few shifts.
 * More importantly, 16-bit arithmetic is then adequate (for 8-bit samples)
 * everywhere except in the multiplications proper; this saves a good deal
 * of work on 16-bit-int machines.
 *
 * Again to save a few shifts, the intermediate results between pass 1 and
 * pass 2 are not upscaled, but are represented only to integral precision.
 *
 * A final compromise is to represent the multiplicative constants to only
 * 8 fractional bits, rather than 13.  This saves some shifting work on some
 * machines, and may also reduce the cost of multiplication (since there
 * are fewer one-bits in the constants).
 */

/* Number of fractional bits carried by the fixed-point multiplier constants. */
#define CONST_BITS  8

/* Some C compilers fail to reduce "FIX(constant)" at compile time, thus
 * causing a lot of useless floating-point operations at run time.
 * To get around this we use the following pre-calculated constants.
 * If you change CONST_BITS you may want to add appropriate values.
 * (With a reasonable C compiler, you can just rely on the FIX() macro...)
 *
 * For CONST_BITS == 8 each literal is the named real value multiplied by
 * 2^8 = 256 and rounded to the nearest integer (for example
 * 0.707106781 * 256 = 181.02 -> 181).  For any other CONST_BITS the
 * values are produced by FIX(), which is not defined in this file and is
 * presumably supplied by one of the included headers.
 */

#if CONST_BITS == 8
#define FIX_0_382683433  ((INT32)   98)		/* FIX(0.382683433) */
#define FIX_0_541196100  ((INT32)  139)		/* FIX(0.541196100) */
#define FIX_0_707106781  ((INT32)  181)		/* FIX(0.707106781) */
#define FIX_1_306562965  ((INT32)  334)		/* FIX(1.306562965) */
#else
#define FIX_0_382683433  FIX(0.382683433)
#define FIX_0_541196100  FIX(0.541196100)
#define FIX_0_707106781  FIX(0.707106781)
#define FIX_1_306562965  FIX(1.306562965)
#endif

/* We can gain a little more speed, with a further compromise in accuracy,
 * by omitting the addition in a descaling shift.  This yields an incorrectly
 * rounded result half the time...
 *
 * Unless USE_ACCURATE_ROUNDING is defined, any previously defined DESCALE
 * is replaced by a bare RIGHT_SHIFT, i.e. the product is truncated by the
 * shift instead of being rounded.
 */

#ifndef USE_ACCURATE_ROUNDING
#undef DESCALE
#define DESCALE(x,n)  RIGHT_SHIFT(x, n)
#endif

100

101

102

/* Multiply a DCTELEM variable by an INT32 constant, and immediately

103

* descale to yield a DCTELEM result.

104

105

106

#define MULTIPLY(var,const) ((DCTELEM) DESCALE((var) * (const), CONST_BITS))

107

108

109

110

* Perform the forward DCT on one block of samples.

111

112

113

GLOBAL(void)

114

jpeg_fdct_ifast (DCTELEM * data)

115

{

116

DCTELEM tmp0, tmp1, tmp2, tmp3, tmp4, tmp5, tmp6, tmp7;

117

DCTELEM tmp10, tmp11, tmp12, tmp13;

118

DCTELEM z1, z2, z3, z4, z5, z11, z13;

119

DCTELEM *dataptr;

120

int ctr;

121

SHIFT_TEMPS

122

123

/* Pass 1: process rows. */

124

125

dataptr = data;

126

for (ctr = DCTSIZE-1; ctr >= 0; ctr--) {

127

tmp0 = dataptr[0] + dataptr[7];

128

tmp7 = dataptr[0] - dataptr[7];

129

tmp1 = dataptr[1] + dataptr[6];

130

tmp6 = dataptr[1] - dataptr[6];

131

tmp2 = dataptr[2] + dataptr[5];

132

tmp5 = dataptr[2] - dataptr[5];

133

tmp3 = dataptr[3] + dataptr[4];

134

tmp4 = dataptr[3] - dataptr[4];

135

136

/* Even part */

137

138

tmp10 = tmp0 + tmp3; /* phase 2 */

139

tmp13 = tmp0 - tmp3;

140

tmp11 = tmp1 + tmp2;

141

tmp12 = tmp1 - tmp2;

142

143

dataptr[0] = tmp10 + tmp11; /* phase 3 */

144

dataptr[4] = tmp10 - tmp11;

145

146

z1 = MULTIPLY(tmp12 + tmp13, FIX_0_707106781); /* c4 */

147

dataptr[2] = tmp13 + z1; /* phase 5 */

148

dataptr[6] = tmp13 - z1;

149

150

/* Odd part */

151

152

tmp10 = tmp4 + tmp5; /* phase 2 */

153

tmp11 = tmp5 + tmp6;

154

tmp12 = tmp6 + tmp7;

155

156

/* The rotator is modified from fig 4-8 to avoid extra negations. */

157

z5 = MULTIPLY(tmp10 - tmp12, FIX_0_382683433); /* c6 */

158

z2 = MULTIPLY(tmp10, FIX_0_541196100) + z5; /* c2-c6 */

159

z4 = MULTIPLY(tmp12, FIX_1_306562965) + z5; /* c2+c6 */

160

z3 = MULTIPLY(tmp11, FIX_0_707106781); /* c4 */

161

162

z11 = tmp7 + z3; /* phase 5 */

163

z13 = tmp7 - z3;

164

165

dataptr[5] = z13 + z2; /* phase 6 */

166

dataptr[3] = z13 - z2;

167

dataptr[1] = z11 + z4;

168

dataptr[7] = z11 - z4;

169

170

dataptr += DCTSIZE; /* advance pointer to next row */

171

}

172

173

/* Pass 2: process columns. */

174

175

dataptr = data;

176

for (ctr = DCTSIZE-1; ctr >= 0; ctr--) {

177

tmp0 = dataptr[DCTSIZE*0] + dataptr[DCTSIZE*7];

178

tmp7 = dataptr[DCTSIZE*0] - dataptr[DCTSIZE*7];

179

tmp1 = dataptr[DCTSIZE*1] + dataptr[DCTSIZE*6];

180

tmp6 = dataptr[DCTSIZE*1] - dataptr[DCTSIZE*6];

181

tmp2 = dataptr[DCTSIZE*2] + dataptr[DCTSIZE*5];

182

tmp5 = dataptr[DCTSIZE*2] - dataptr[DCTSIZE*5];

183

tmp3 = dataptr[DCTSIZE*3] + dataptr[DCTSIZE*4];

184

tmp4 = dataptr[DCTSIZE*3] - dataptr[DCTSIZE*4];

185

186

/* Even part */

187

188

tmp10 = tmp0 + tmp3; /* phase 2 */

189

tmp13 = tmp0 - tmp3;

190

tmp11 = tmp1 + tmp2;

191

tmp12 = tmp1 - tmp2;

192

193

dataptr[DCTSIZE*0] = tmp10 + tmp11; /* phase 3 */

194

dataptr[DCTSIZE*4] = tmp10 - tmp11;

195

196

z1 = MULTIPLY(tmp12 + tmp13, FIX_0_707106781); /* c4 */

197

dataptr[DCTSIZE*2] = tmp13 + z1; /* phase 5 */

198

dataptr[DCTSIZE*6] = tmp13 - z1;

199

200

/* Odd part */

201

202

tmp10 = tmp4 + tmp5; /* phase 2 */

203

tmp11 = tmp5 + tmp6;

204

tmp12 = tmp6 + tmp7;

205

206

/* The rotator is modified from fig 4-8 to avoid extra negations. */

207

z5 = MULTIPLY(tmp10 - tmp12, FIX_0_382683433); /* c6 */

208

z2 = MULTIPLY(tmp10, FIX_0_541196100) + z5; /* c2-c6 */

209

z4 = MULTIPLY(tmp12, FIX_1_306562965) + z5; /* c2+c6 */

210

z3 = MULTIPLY(tmp11, FIX_0_707106781); /* c4 */

211

212

z11 = tmp7 + z3; /* phase 5 */

213

z13 = tmp7 - z3;

214

215

dataptr[DCTSIZE*5] = z13 + z2; /* phase 6 */

216

dataptr[DCTSIZE*3] = z13 - z2;

217

dataptr[DCTSIZE*1] = z11 + z4;

218

dataptr[DCTSIZE*7] = z11 - z4;

219

220

dataptr++; /* advance pointer to next column */

221

}

222

}

223

224

#endif /* DCT_IFAST_SUPPORTED */

Older »