~ubuntu-branches/debian/sid/v4l-utils/sid

Viewing changes to lib/libv4lconvert/jidctflt.c

Committer: Bazaar Package Importer
Author(s): Gregor Jasny
Date: 2010-05-07 20:48:34 UTC
mfrom: (1.1.2 upstream)
Revision ID: james.westby@ubuntu.com-20100507204834-ga01cxhz3fekk47r

Tags: 0.8.0-1

http://bugs.debian.org/576422

* New upstream version
* Switch to 3.0 (quilt) source format
* Re-enable pristine-tar
* Split utils package into command line and the Qt based qv4l2
(Closes: #576422)
* Update upstream URL

files added:
contrib/qv4l2-qt3

contrib/qv4l2-qt3/Makefile.install

contrib/qv4l2-qt3/ctrl-tab.cpp

contrib/qv4l2-qt3/fileopen.xpm

contrib/qv4l2-qt3/general-tab.cpp

contrib/qv4l2-qt3/general-tab.h

contrib/qv4l2-qt3/qv4l2-qt3.pro

contrib/qv4l2-qt3/qv4l2.cpp

contrib/qv4l2-qt3/qv4l2.h

debian/qv4l2.install

debian/qv4l2.links

debian/source

debian/source/format

utils/keytable/rc_keymaps

utils/keytable/rc_keymaps/a800_rc_keys

utils/keytable/rc_keymaps/adstech_dvb_t_pci

utils/keytable/rc_keymaps/af9005_rc_keys

utils/keytable/rc_keymaps/af9015_rc_keys_a_link

utils/keytable/rc_keymaps/af9015_rc_keys_avermedia

utils/keytable/rc_keymaps/af9015_rc_keys_digittrade

utils/keytable/rc_keymaps/af9015_rc_keys_leadtek

utils/keytable/rc_keymaps/af9015_rc_keys_msi

utils/keytable/rc_keymaps/af9015_rc_keys_msi_digivox_iii

utils/keytable/rc_keymaps/af9015_rc_keys_mygictv

utils/keytable/rc_keymaps/af9015_rc_keys_trekstor

utils/keytable/rc_keymaps/af9015_rc_keys_twinhan

utils/keytable/rc_keymaps/anysee_rc_keys

utils/keytable/rc_keymaps/apac_viewcomp

utils/keytable/rc_keymaps/asus_pc39

utils/keytable/rc_keymaps/ati_tv_wonder_hd_600

utils/keytable/rc_keymaps/avermedia

utils/keytable/rc_keymaps/avermedia_a16d

utils/keytable/rc_keymaps/avermedia_cardbus

utils/keytable/rc_keymaps/avermedia_dvbt

utils/keytable/rc_keymaps/avermedia_m135a

utils/keytable/rc_keymaps/avertv_303

utils/keytable/rc_keymaps/behold

utils/keytable/rc_keymaps/behold_columbus

utils/keytable/rc_keymaps/budget_ci_old

utils/keytable/rc_keymaps/cinergy

utils/keytable/rc_keymaps/cinergy_1400

utils/keytable/rc_keymaps/cinergyt2_rc_keys

utils/keytable/rc_keymaps/d680_dmb_rc_keys

utils/keytable/rc_keymaps/dib0700_rc_keys

utils/keytable/rc_keymaps/dibusb_rc_keys

utils/keytable/rc_keymaps/digitv_rc_keys

utils/keytable/rc_keymaps/dm1105_nec

utils/keytable/rc_keymaps/dntv_live_dvb_t

utils/keytable/rc_keymaps/dntv_live_dvbt_pro

utils/keytable/rc_keymaps/dtt200u_rc_keys

utils/keytable/rc_keymaps/dvico_mce_rc_keys

utils/keytable/rc_keymaps/dvico_portable_rc_keys

utils/keytable/rc_keymaps/dw210x_rc_keys

utils/keytable/rc_keymaps/em_terratec

utils/keytable/rc_keymaps/empty

utils/keytable/rc_keymaps/encore_enltv

utils/keytable/rc_keymaps/encore_enltv2

utils/keytable/rc_keymaps/encore_enltv_fm53

utils/keytable/rc_keymaps/evga_indtube

utils/keytable/rc_keymaps/eztv

utils/keytable/rc_keymaps/flydvb

utils/keytable/rc_keymaps/flyvideo

utils/keytable/rc_keymaps/fusionhdtv_mce

utils/keytable/rc_keymaps/gadmei_rm008z

utils/keytable/rc_keymaps/genius_tvgo_a11mce

utils/keytable/rc_keymaps/gotview7135

utils/keytable/rc_keymaps/haupp_rc_keys

utils/keytable/rc_keymaps/hauppauge_new

utils/keytable/rc_keymaps/iodata_bctv7e

utils/keytable/rc_keymaps/kaiomy

utils/keytable/rc_keymaps/kworld_315u

utils/keytable/rc_keymaps/kworld_plus_tv_analog

utils/keytable/rc_keymaps/manli

utils/keytable/rc_keymaps/megasky_rc_keys

utils/keytable/rc_keymaps/msi_tvanywhere

utils/keytable/rc_keymaps/msi_tvanywhere_plus

utils/keytable/rc_keymaps/nebula

utils/keytable/rc_keymaps/nec_terratec_cinergy_xs

utils/keytable/rc_keymaps/norwood

utils/keytable/rc_keymaps/npgtech

utils/keytable/rc_keymaps/opera1_rc_keys

utils/keytable/rc_keymaps/pctv_sedna

utils/keytable/rc_keymaps/pinnacle310e_rc_keys

utils/keytable/rc_keymaps/pinnacle_color

utils/keytable/rc_keymaps/pinnacle_grey

utils/keytable/rc_keymaps/pinnacle_pctv_hd

utils/keytable/rc_keymaps/pixelview

utils/keytable/rc_keymaps/pixelview_new

utils/keytable/rc_keymaps/powercolor_real_angel

utils/keytable/rc_keymaps/proteus_2309

utils/keytable/rc_keymaps/purpletv

utils/keytable/rc_keymaps/pv951

utils/keytable/rc_keymaps/rc5_hauppauge_new

utils/keytable/rc_keymaps/rc5_tv

utils/keytable/rc_keymaps/real_audio_220_32_keys

utils/keytable/rc_keymaps/tbs_nec

utils/keytable/rc_keymaps/tbs_rc_keys

utils/keytable/rc_keymaps/terratec_cinergy_xs

utils/keytable/rc_keymaps/tevii_nec

utils/keytable/rc_keymaps/tevii_rc_keys

utils/keytable/rc_keymaps/tt_1500

utils/keytable/rc_keymaps/tvwalkertwin_rc_keys

utils/keytable/rc_keymaps/videomate_s350

utils/keytable/rc_keymaps/videomate_tv_pvr

utils/keytable/rc_keymaps/vp702x_rc_keys

utils/keytable/rc_keymaps/vp7045_rc_keys

utils/keytable/rc_keymaps/winfast

utils/keytable/rc_keymaps/winfast_usbii_deluxe

utils/keytable/rc_maps.cfg.example

utils/qv4l2

utils/qv4l2/Makefile.install

utils/qv4l2/capture-win.cpp

utils/qv4l2/capture-win.h

utils/qv4l2/ctrl-tab.cpp

utils/qv4l2/exit.png

utils/qv4l2/fileclose.png

utils/qv4l2/fileopen.png

utils/qv4l2/general-tab.cpp

utils/qv4l2/general-tab.h

utils/qv4l2/qv4l2.cpp

utils/qv4l2/qv4l2.h

utils/qv4l2/qv4l2.png

utils/qv4l2/qv4l2.pro

utils/qv4l2/qv4l2.qrc

utils/qv4l2/record.png

utils/qv4l2/v4l2-api.cpp

utils/qv4l2/v4l2-api.h

utils/v4l2-compliance/v4l2-compliance.h

utils/v4l2-compliance/v4l2-test-debug.cpp

files removed:
.gitignore

include/linux/i2c-id.h

lib/libv4lconvert/.gitignore

utils/decode_tm6000/.gitignore

utils/keytable/.gitignore

utils/keytable/keycodes

utils/keytable/keycodes/a800_rc_keys

utils/keytable/keycodes/adstech_dvb_t_pci

utils/keytable/keycodes/af9005_rc_keys

utils/keytable/keycodes/af9015_rc_keys_a_link

utils/keytable/keycodes/af9015_rc_keys_avermedia

utils/keytable/keycodes/af9015_rc_keys_digittrade

utils/keytable/keycodes/af9015_rc_keys_leadtek

utils/keytable/keycodes/af9015_rc_keys_msi

utils/keytable/keycodes/af9015_rc_keys_msi_digivox_iii

utils/keytable/keycodes/af9015_rc_keys_mygictv

utils/keytable/keycodes/af9015_rc_keys_trekstor

utils/keytable/keycodes/af9015_rc_keys_twinhan

utils/keytable/keycodes/anysee_rc_keys

utils/keytable/keycodes/apac_viewcomp

utils/keytable/keycodes/asus_pc39

utils/keytable/keycodes/ati_tv_wonder_hd_600

utils/keytable/keycodes/avermedia

utils/keytable/keycodes/avermedia_a16d

utils/keytable/keycodes/avermedia_cardbus

utils/keytable/keycodes/avermedia_dvbt

utils/keytable/keycodes/avermedia_m135a

utils/keytable/keycodes/avertv_303

utils/keytable/keycodes/behold

utils/keytable/keycodes/behold_columbus

utils/keytable/keycodes/budget_ci_old

utils/keytable/keycodes/cinergy

utils/keytable/keycodes/cinergy_1400

utils/keytable/keycodes/cinergyt2_rc_keys

utils/keytable/keycodes/d680_dmb_rc_keys

utils/keytable/keycodes/dib0700_rc_keys

utils/keytable/keycodes/dibusb_rc_keys

utils/keytable/keycodes/digitv_rc_keys

utils/keytable/keycodes/dm1105_nec

utils/keytable/keycodes/dntv_live_dvb_t

utils/keytable/keycodes/dntv_live_dvbt_pro

utils/keytable/keycodes/dtt200u_rc_keys

utils/keytable/keycodes/dvico_mce_rc_keys

utils/keytable/keycodes/dvico_portable_rc_keys

utils/keytable/keycodes/dw210x_rc_keys

utils/keytable/keycodes/em_terratec

utils/keytable/keycodes/empty

utils/keytable/keycodes/encore_enltv

utils/keytable/keycodes/encore_enltv2

utils/keytable/keycodes/encore_enltv_fm53

utils/keytable/keycodes/evga_indtube

utils/keytable/keycodes/eztv

utils/keytable/keycodes/flydvb

utils/keytable/keycodes/flyvideo

utils/keytable/keycodes/fusionhdtv_mce

utils/keytable/keycodes/gadmei_rm008z

utils/keytable/keycodes/genius_tvgo_a11mce

utils/keytable/keycodes/gotview7135

utils/keytable/keycodes/haupp_rc_keys

utils/keytable/keycodes/hauppauge_new

utils/keytable/keycodes/iodata_bctv7e

utils/keytable/keycodes/kaiomy

utils/keytable/keycodes/kworld_plus_tv_analog

utils/keytable/keycodes/manli

utils/keytable/keycodes/megasky_rc_keys

utils/keytable/keycodes/msi_tvanywhere

utils/keytable/keycodes/msi_tvanywhere_plus

utils/keytable/keycodes/nebula

utils/keytable/keycodes/nec_terratec_cinergy_xs

utils/keytable/keycodes/norwood

utils/keytable/keycodes/npgtech

utils/keytable/keycodes/opera1_rc_keys

utils/keytable/keycodes/pctv_sedna

utils/keytable/keycodes/pinnacle310e_rc_keys

utils/keytable/keycodes/pinnacle_color

utils/keytable/keycodes/pinnacle_grey

utils/keytable/keycodes/pinnacle_pctv_hd

utils/keytable/keycodes/pixelview

utils/keytable/keycodes/pixelview_new

utils/keytable/keycodes/powercolor_real_angel

utils/keytable/keycodes/proteus_2309

utils/keytable/keycodes/purpletv

utils/keytable/keycodes/pv951

utils/keytable/keycodes/rc5_hauppauge_new

utils/keytable/keycodes/rc5_tv

utils/keytable/keycodes/real_audio_220_32_keys

utils/keytable/keycodes/tbs_nec

utils/keytable/keycodes/tbs_rc_keys

utils/keytable/keycodes/terratec_cinergy_xs

utils/keytable/keycodes/tevii_nec

utils/keytable/keycodes/tevii_rc_keys

utils/keytable/keycodes/tt_1500

utils/keytable/keycodes/tvwalkertwin_rc_keys

utils/keytable/keycodes/videomate_s350

utils/keytable/keycodes/videomate_tv_pvr

utils/keytable/keycodes/vp702x_rc_keys

utils/keytable/keycodes/vp7045_rc_keys

utils/keytable/keycodes/winfast

utils/keytable/keycodes/winfast_usbii_deluxe

utils/qv4l2-qt3

utils/qv4l2-qt3/.gitignore

utils/qv4l2-qt3/Makefile.install

utils/qv4l2-qt3/ctrl-tab.cpp

utils/qv4l2-qt3/fileopen.xpm

utils/qv4l2-qt3/general-tab.cpp

utils/qv4l2-qt3/general-tab.h

utils/qv4l2-qt3/qv4l2.cpp

utils/qv4l2-qt3/qv4l2.h

utils/qv4l2-qt3/qv4l2.pro

utils/qv4l2-qt4

utils/qv4l2-qt4/.gitignore

utils/qv4l2-qt4/Makefile.install

utils/qv4l2-qt4/capture-win.cpp

utils/qv4l2-qt4/capture-win.h

utils/qv4l2-qt4/ctrl-tab.cpp

utils/qv4l2-qt4/exit.png

utils/qv4l2-qt4/fileclose.png

utils/qv4l2-qt4/fileopen.png

utils/qv4l2-qt4/general-tab.cpp

utils/qv4l2-qt4/general-tab.h

utils/qv4l2-qt4/qv4l2.cpp

utils/qv4l2-qt4/qv4l2.h

utils/qv4l2-qt4/qv4l2.png

utils/qv4l2-qt4/qv4l2.pro

utils/qv4l2-qt4/qv4l2.qrc

utils/qv4l2-qt4/record.png

utils/qv4l2-qt4/v4l2-api.cpp

utils/qv4l2-qt4/v4l2-api.h

utils/rds/.gitignore

utils/v4l2-compliance/.gitignore

utils/v4l2-ctl/.gitignore

utils/v4l2-dbg/.gitignore

utils/v4l2-sysfs-path/.gitignore

utils/xc3028-firmware/.gitignore

files modified:
ChangeLog

Make.rules

Makefile

debian/changelog

debian/control

debian/copyright

debian/gbp.conf

debian/v4l-utils.install

debian/watch

include/linux/videodev2.h

lib/include/libv4l1.h

lib/include/libv4l2.h

lib/include/libv4lconvert.h

lib/libv4l1/libv4l1-priv.h

lib/libv4l1/libv4l1.c

lib/libv4l1/log.c

lib/libv4l1/v4l1compat.c

lib/libv4l2/libv4l2-priv.h

lib/libv4l2/libv4l2.c

lib/libv4l2/log.c

lib/libv4l2/v4l2convert.c

lib/libv4lconvert/bayer.c

lib/libv4lconvert/control/libv4lcontrol-priv.h

lib/libv4lconvert/control/libv4lcontrol.c

lib/libv4lconvert/control/libv4lcontrol.h

lib/libv4lconvert/cpia1.c

lib/libv4lconvert/crop.c

lib/libv4lconvert/flip.c

lib/libv4lconvert/helper.c

lib/libv4lconvert/jidctflt.c

lib/libv4lconvert/libv4lconvert-priv.h

lib/libv4lconvert/libv4lconvert.c

lib/libv4lconvert/libv4lsyscall-priv.h

lib/libv4lconvert/mr97310a.c

lib/libv4lconvert/ov511-decomp.c

lib/libv4lconvert/ov518-decomp.c

lib/libv4lconvert/pac207.c

lib/libv4lconvert/processing/autogain.c

lib/libv4lconvert/processing/gamma.c

lib/libv4lconvert/processing/libv4lprocessing-priv.h

lib/libv4lconvert/processing/libv4lprocessing.c

lib/libv4lconvert/processing/whitebalance.c

lib/libv4lconvert/rgbyuv.c

lib/libv4lconvert/sn9c10x.c

lib/libv4lconvert/sn9c2028-decomp.c

lib/libv4lconvert/sn9c20x.c

lib/libv4lconvert/spca501.c

lib/libv4lconvert/spca561-decompress.c

lib/libv4lconvert/sq905c.c

lib/libv4lconvert/stv0680.c

lib/libv4lconvert/tinyjpeg-internal.h

lib/libv4lconvert/tinyjpeg.c

lib/libv4lconvert/tinyjpeg.h

utils/Makefile

utils/keytable/Makefile

utils/keytable/gen_keytables.pl

utils/keytable/keytable.c

utils/keytable/parse.h

utils/v4l2-compliance/Makefile

utils/v4l2-compliance/v4l2-compliance.cpp

utils/v4l2-ctl/v4l2-ctl.cpp

utils/v4l2-dbg/v4l2-dbg.cpp

Show diffs side-by-side

added added

removed removed

lib/libv4lconvert/jidctflt.c

* implementation, accuracy is lost due to imprecise representation of the

* scaled quantization values. However, that problem does not arise if

* we use floating point arithmetic.

#include <stdint.h>

#include "tinyjpeg-internal.h"

#define FAST_FLOAT float

#define DCTSIZE 8

#define DCTSIZE2 (DCTSIZE*DCTSIZE)

#define DCTSIZE2 (DCTSIZE * DCTSIZE)

#define DEQUANTIZE(coef,quantval) (((FAST_FLOAT) (coef)) * (quantval))

#define DEQUANTIZE(coef, quantval) (((FAST_FLOAT) (coef)) * (quantval))

#if defined(__GNUC__) && (defined(__i686__) || defined(__x86_64__))

static inline unsigned char descale_and_clamp(int x, int shift)

{

__asm__ (

"add %3,%1\n"

"\tsar %2,%1\n"

"\tsub $-128,%1\n"

"\tcmovl %5,%1\n" /* Use the sub to compare to 0 */

"\tcmpl %4,%1\n"

"\tcmovg %4,%1\n"

: "=r"(x)

: "0"(x), "Ic"((unsigned char)shift), "ir"(1U<<(shift-1)), "r" (0xff), "r" (0)

);

return x;

__asm__ (

"add %3,%1\n"

"\tsar %2,%1\n"

"\tsub $-128,%1\n"

"\tcmovl %5,%1\n" /* Use the sub to compare to 0 */

"\tcmpl %4,%1\n"

"\tcmovg %4,%1\n"

: "=r"(x)

: "0"(x), "Ic"((unsigned char)shift), "ir" (1U << (shift - 1)), "r" (0xff), "r" (0)

);

return x;

}

100

#else

101

static inline unsigned char descale_and_clamp(int x, int shift)

102

{

103

x += (1UL<<(shift-1));

104

if (x<0)

105

x = (x >> shift) | ((~(0UL)) << (32-(shift)));

106

else

107

x >>= shift;

108

x += 128;

109

if (x>255)

110

return 255;

111

else if (x<0)

112

return 0;

113

else

114

return x;

103

x += 1UL << (shift - 1);

104

if (x < 0)

105

x = (x >> shift) | ((~(0UL)) << (32 - (shift)));

106

else

107

x >>= shift;

108

x += 128;

109

if (x > 255)

110

return 255;

111

if (x < 0)

112

return 0;

113

return x;

115

114

}

116

115

#endif

117

116

119

118

/* Perform dequantization and inverse DCT on one block of coefficients. */

120

119

121

120

122

void

123

tinyjpeg_idct_float (struct component *compptr, uint8_t *output_buf, int stride)

121

void tinyjpeg_idct_float(struct component *compptr, uint8_t *output_buf, int stride)

124

122

{

125

FAST_FLOAT tmp0, tmp1, tmp2, tmp3, tmp4, tmp5, tmp6, tmp7;

126

FAST_FLOAT tmp10, tmp11, tmp12, tmp13;

127

FAST_FLOAT z5, z10, z11, z12, z13;

128

int16_t *inptr;

129

FAST_FLOAT *quantptr;

130

FAST_FLOAT *wsptr;

131

uint8_t *outptr;

132

int ctr;

133

FAST_FLOAT workspace[DCTSIZE2]; /* buffers data between passes */

134

135

/* Pass 1: process columns from input, store into work array. */

136

137

inptr = compptr->DCT;

138

quantptr = compptr->Q_table;

139

wsptr = workspace;

140

for (ctr = DCTSIZE; ctr > 0; ctr--) {

141

/* Due to quantization, we will usually find that many of the input

142

* coefficients are zero, especially the AC terms. We can exploit this

143

* by short-circuiting the IDCT calculation for any column in which all

144

* the AC terms are zero. In that case each output is equal to the

145

* DC coefficient (with scale factor as needed).

146

* With typical images and quantization tables, half or more of the

147

* column DCT calculations can be simplified this way. */

148

149

150

if (inptr[DCTSIZE*1] == 0 && inptr[DCTSIZE*2] == 0 &&

151

inptr[DCTSIZE*3] == 0 && inptr[DCTSIZE*4] == 0 &&

152

inptr[DCTSIZE*5] == 0 && inptr[DCTSIZE*6] == 0 &&

153

inptr[DCTSIZE*7] == 0) {

154

/* AC terms all zero */

155

FAST_FLOAT dcval = DEQUANTIZE(inptr[DCTSIZE*0], quantptr[DCTSIZE*0]);

156

157

wsptr[DCTSIZE*0] = dcval;

158

wsptr[DCTSIZE*1] = dcval;

159

wsptr[DCTSIZE*2] = dcval;

160

wsptr[DCTSIZE*3] = dcval;

161

wsptr[DCTSIZE*4] = dcval;

162

wsptr[DCTSIZE*5] = dcval;

163

wsptr[DCTSIZE*6] = dcval;

164

wsptr[DCTSIZE*7] = dcval;

165

166

inptr++; /* advance pointers to next column */

167

quantptr++;

168

wsptr++;

169

continue;

170

}

171

172

/* Even part */

173

174

tmp0 = DEQUANTIZE(inptr[DCTSIZE*0], quantptr[DCTSIZE*0]);

175

tmp1 = DEQUANTIZE(inptr[DCTSIZE*2], quantptr[DCTSIZE*2]);

176

tmp2 = DEQUANTIZE(inptr[DCTSIZE*4], quantptr[DCTSIZE*4]);

177

tmp3 = DEQUANTIZE(inptr[DCTSIZE*6], quantptr[DCTSIZE*6]);

178

179

tmp10 = tmp0 + tmp2; /* phase 3 */

180

tmp11 = tmp0 - tmp2;

181

182

tmp13 = tmp1 + tmp3; /* phases 5-3 */

183

tmp12 = (tmp1 - tmp3) * ((FAST_FLOAT) 1.414213562) - tmp13; /* 2*c4 */

184

185

tmp0 = tmp10 + tmp13; /* phase 2 */

186

tmp3 = tmp10 - tmp13;

187

tmp1 = tmp11 + tmp12;

188

tmp2 = tmp11 - tmp12;

189

190

/* Odd part */

191

192

tmp4 = DEQUANTIZE(inptr[DCTSIZE*1], quantptr[DCTSIZE*1]);

193

tmp5 = DEQUANTIZE(inptr[DCTSIZE*3], quantptr[DCTSIZE*3]);

194

tmp6 = DEQUANTIZE(inptr[DCTSIZE*5], quantptr[DCTSIZE*5]);

195

tmp7 = DEQUANTIZE(inptr[DCTSIZE*7], quantptr[DCTSIZE*7]);

196

197

z13 = tmp6 + tmp5; /* phase 6 */

198

z10 = tmp6 - tmp5;

199

z11 = tmp4 + tmp7;

200

z12 = tmp4 - tmp7;

201

202

tmp7 = z11 + z13; /* phase 5 */

203

tmp11 = (z11 - z13) * ((FAST_FLOAT) 1.414213562); /* 2*c4 */

204

205

z5 = (z10 + z12) * ((FAST_FLOAT) 1.847759065); /* 2*c2 */

206

tmp10 = ((FAST_FLOAT) 1.082392200) * z12 - z5; /* 2*(c2-c6) */

207

tmp12 = ((FAST_FLOAT) -2.613125930) * z10 + z5; /* -2*(c2+c6) */

208

209

tmp6 = tmp12 - tmp7; /* phase 2 */

210

tmp5 = tmp11 - tmp6;

211

tmp4 = tmp10 + tmp5;

212

213

wsptr[DCTSIZE*0] = tmp0 + tmp7;

214

wsptr[DCTSIZE*7] = tmp0 - tmp7;

215

wsptr[DCTSIZE*1] = tmp1 + tmp6;

216

wsptr[DCTSIZE*6] = tmp1 - tmp6;

217

wsptr[DCTSIZE*2] = tmp2 + tmp5;

218

wsptr[DCTSIZE*5] = tmp2 - tmp5;

219

wsptr[DCTSIZE*4] = tmp3 + tmp4;

220

wsptr[DCTSIZE*3] = tmp3 - tmp4;

221

222

inptr++; /* advance pointers to next column */

223

quantptr++;

224

wsptr++;

225

}

226

227

/* Pass 2: process rows from work array, store into output array. */

228

/* Note that we must descale the results by a factor of 8 == 2**3. */

229

230

wsptr = workspace;

231

outptr = output_buf;

232

for (ctr = 0; ctr < DCTSIZE; ctr++) {

233

/* Rows of zeroes can be exploited in the same way as we did with columns.

234

* However, the column calculation has created many nonzero AC terms, so

235

* the simplification applies less often (typically 5% to 10% of the time).

236

* And testing floats for zero is relatively expensive, so we don't bother. */

237

238

239

/* Even part */

240

241

tmp10 = wsptr[0] + wsptr[4];

242

tmp11 = wsptr[0] - wsptr[4];

243

244

tmp13 = wsptr[2] + wsptr[6];

245

tmp12 = (wsptr[2] - wsptr[6]) * ((FAST_FLOAT) 1.414213562) - tmp13;

246

247

tmp0 = tmp10 + tmp13;

248

tmp3 = tmp10 - tmp13;

249

tmp1 = tmp11 + tmp12;

250

tmp2 = tmp11 - tmp12;

251

252

/* Odd part */

253

254

z13 = wsptr[5] + wsptr[3];

255

z10 = wsptr[5] - wsptr[3];

256

z11 = wsptr[1] + wsptr[7];

257

z12 = wsptr[1] - wsptr[7];

258

259

tmp7 = z11 + z13;

260

tmp11 = (z11 - z13) * ((FAST_FLOAT) 1.414213562);

261

262

z5 = (z10 + z12) * ((FAST_FLOAT) 1.847759065); /* 2*c2 */

263

tmp10 = ((FAST_FLOAT) 1.082392200) * z12 - z5; /* 2*(c2-c6) */

264

tmp12 = ((FAST_FLOAT) -2.613125930) * z10 + z5; /* -2*(c2+c6) */

265

266

tmp6 = tmp12 - tmp7;

267

tmp5 = tmp11 - tmp6;

268

tmp4 = tmp10 + tmp5;

269

270

/* Final output stage: scale down by a factor of 8 and range-limit */

271

272

outptr[0] = descale_and_clamp((int)(tmp0 + tmp7), 3);

273

outptr[7] = descale_and_clamp((int)(tmp0 - tmp7), 3);

274

outptr[1] = descale_and_clamp((int)(tmp1 + tmp6), 3);

275

outptr[6] = descale_and_clamp((int)(tmp1 - tmp6), 3);

276

outptr[2] = descale_and_clamp((int)(tmp2 + tmp5), 3);

277

outptr[5] = descale_and_clamp((int)(tmp2 - tmp5), 3);

278

outptr[4] = descale_and_clamp((int)(tmp3 + tmp4), 3);

279

outptr[3] = descale_and_clamp((int)(tmp3 - tmp4), 3);

280

281

282

wsptr += DCTSIZE; /* advance pointer to next row */

283

outptr += stride;

284

}

123

FAST_FLOAT tmp0, tmp1, tmp2, tmp3, tmp4, tmp5, tmp6, tmp7;

124

FAST_FLOAT tmp10, tmp11, tmp12, tmp13;

125

FAST_FLOAT z5, z10, z11, z12, z13;

126

int16_t *inptr;

127

FAST_FLOAT *quantptr;

128

FAST_FLOAT *wsptr;

129

uint8_t *outptr;

130

int ctr;

131

FAST_FLOAT workspace[DCTSIZE2]; /* buffers data between passes */

132

133

/* Pass 1: process columns from input, store into work array. */

134

135

inptr = compptr->DCT;

136

quantptr = compptr->Q_table;

137

wsptr = workspace;

138

for (ctr = DCTSIZE; ctr > 0; ctr--) {

139

/* Due to quantization, we will usually find that many of the input

140

* coefficients are zero, especially the AC terms. We can exploit this

141

* by short-circuiting the IDCT calculation for any column in which all

142

* the AC terms are zero. In that case each output is equal to the

143

* DC coefficient (with scale factor as needed).

144

* With typical images and quantization tables, half or more of the

145

* column DCT calculations can be simplified this way. */

146

147

148

if (inptr[DCTSIZE*1] == 0 && inptr[DCTSIZE*2] == 0 &&

149

inptr[DCTSIZE*3] == 0 && inptr[DCTSIZE*4] == 0 &&

150

inptr[DCTSIZE*5] == 0 && inptr[DCTSIZE*6] == 0 &&

151

inptr[DCTSIZE*7] == 0) {

152

/* AC terms all zero */

153

FAST_FLOAT dcval = DEQUANTIZE(inptr[DCTSIZE*0], quantptr[DCTSIZE*0]);

154

155

wsptr[DCTSIZE*0] = dcval;

156

wsptr[DCTSIZE*1] = dcval;

157

wsptr[DCTSIZE*2] = dcval;

158

wsptr[DCTSIZE*3] = dcval;

159

wsptr[DCTSIZE*4] = dcval;

160

wsptr[DCTSIZE*5] = dcval;

161

wsptr[DCTSIZE*6] = dcval;

162

wsptr[DCTSIZE*7] = dcval;

163

164

inptr++; /* advance pointers to next column */

165

quantptr++;

166

wsptr++;

167

continue;

168

}

169

170

/* Even part */

171

172

tmp0 = DEQUANTIZE(inptr[DCTSIZE*0], quantptr[DCTSIZE*0]);

173

tmp1 = DEQUANTIZE(inptr[DCTSIZE*2], quantptr[DCTSIZE*2]);

174

tmp2 = DEQUANTIZE(inptr[DCTSIZE*4], quantptr[DCTSIZE*4]);

175

tmp3 = DEQUANTIZE(inptr[DCTSIZE*6], quantptr[DCTSIZE*6]);

176

177

tmp10 = tmp0 + tmp2; /* phase 3 */

178

tmp11 = tmp0 - tmp2;

179

180

tmp13 = tmp1 + tmp3; /* phases 5-3 */

181

tmp12 = (tmp1 - tmp3) * ((FAST_FLOAT) 1.414213562) - tmp13; /* 2*c4 */

182

183

tmp0 = tmp10 + tmp13; /* phase 2 */

184

tmp3 = tmp10 - tmp13;

185

tmp1 = tmp11 + tmp12;

186

tmp2 = tmp11 - tmp12;

187

188

/* Odd part */

189

190

tmp4 = DEQUANTIZE(inptr[DCTSIZE*1], quantptr[DCTSIZE*1]);

191

tmp5 = DEQUANTIZE(inptr[DCTSIZE*3], quantptr[DCTSIZE*3]);

192

tmp6 = DEQUANTIZE(inptr[DCTSIZE*5], quantptr[DCTSIZE*5]);

193

tmp7 = DEQUANTIZE(inptr[DCTSIZE*7], quantptr[DCTSIZE*7]);

194

195

z13 = tmp6 + tmp5; /* phase 6 */

196

z10 = tmp6 - tmp5;

197

z11 = tmp4 + tmp7;

198

z12 = tmp4 - tmp7;

199

200

tmp7 = z11 + z13; /* phase 5 */

201

tmp11 = (z11 - z13) * ((FAST_FLOAT) 1.414213562); /* 2*c4 */

202

203

z5 = (z10 + z12) * ((FAST_FLOAT) 1.847759065); /* 2*c2 */

204

tmp10 = ((FAST_FLOAT) 1.082392200) * z12 - z5; /* 2*(c2-c6) */

205

tmp12 = ((FAST_FLOAT) -2.613125930) * z10 + z5; /* -2*(c2+c6) */

206

207

tmp6 = tmp12 - tmp7; /* phase 2 */

208

tmp5 = tmp11 - tmp6;

209

tmp4 = tmp10 + tmp5;

210

211

wsptr[DCTSIZE*0] = tmp0 + tmp7;

212

wsptr[DCTSIZE*7] = tmp0 - tmp7;

213

wsptr[DCTSIZE*1] = tmp1 + tmp6;

214

wsptr[DCTSIZE*6] = tmp1 - tmp6;

215

wsptr[DCTSIZE*2] = tmp2 + tmp5;

216

wsptr[DCTSIZE*5] = tmp2 - tmp5;

217

wsptr[DCTSIZE*4] = tmp3 + tmp4;

218

wsptr[DCTSIZE*3] = tmp3 - tmp4;

219

220

inptr++; /* advance pointers to next column */

221

quantptr++;

222

wsptr++;

223

}

224

225

/* Pass 2: process rows from work array, store into output array. */

226

/* Note that we must descale the results by a factor of 8 == 2**3. */

227

228

wsptr = workspace;

229

outptr = output_buf;

230

for (ctr = 0; ctr < DCTSIZE; ctr++) {

231

/* Rows of zeroes can be exploited in the same way as we did with columns.

232

* However, the column calculation has created many nonzero AC terms, so

233

* the simplification applies less often (typically 5% to 10% of the time).

234

* And testing floats for zero is relatively expensive, so we don't bother. */

235

236

237

/* Even part */

238

239

tmp10 = wsptr[0] + wsptr[4];

240

tmp11 = wsptr[0] - wsptr[4];

241

242

tmp13 = wsptr[2] + wsptr[6];

243

tmp12 = (wsptr[2] - wsptr[6]) * ((FAST_FLOAT) 1.414213562) - tmp13;

244

245

tmp0 = tmp10 + tmp13;

246

tmp3 = tmp10 - tmp13;

247

tmp1 = tmp11 + tmp12;

248

tmp2 = tmp11 - tmp12;

249

250

/* Odd part */

251

252

z13 = wsptr[5] + wsptr[3];

253

z10 = wsptr[5] - wsptr[3];

254

z11 = wsptr[1] + wsptr[7];

255

z12 = wsptr[1] - wsptr[7];

256

257

tmp7 = z11 + z13;

258

tmp11 = (z11 - z13) * ((FAST_FLOAT) 1.414213562);

259

260

z5 = (z10 + z12) * ((FAST_FLOAT) 1.847759065); /* 2*c2 */

261

tmp10 = ((FAST_FLOAT) 1.082392200) * z12 - z5; /* 2*(c2-c6) */

262

tmp12 = ((FAST_FLOAT) -2.613125930) * z10 + z5; /* -2*(c2+c6) */

263

264

tmp6 = tmp12 - tmp7;

265

tmp5 = tmp11 - tmp6;

266

tmp4 = tmp10 + tmp5;

267

268

/* Final output stage: scale down by a factor of 8 and range-limit */

269

270

outptr[0] = descale_and_clamp((int)(tmp0 + tmp7), 3);

271

outptr[7] = descale_and_clamp((int)(tmp0 - tmp7), 3);

272

outptr[1] = descale_and_clamp((int)(tmp1 + tmp6), 3);

273

outptr[6] = descale_and_clamp((int)(tmp1 - tmp6), 3);

274

outptr[2] = descale_and_clamp((int)(tmp2 + tmp5), 3);

275

outptr[5] = descale_and_clamp((int)(tmp2 - tmp5), 3);

276

outptr[4] = descale_and_clamp((int)(tmp3 + tmp4), 3);

277

outptr[3] = descale_and_clamp((int)(tmp3 - tmp4), 3);

278

279

280

wsptr += DCTSIZE; /* advance pointer to next row */

281

outptr += stride;

282

}

285

283

}

286

284

Older »