~ubuntu-branches/debian/sid/mjpegtools/sid

« back to all changes in this revision

Viewing changes to y4mdenoise/implementation.html

Committer: Package Import Robot
Author(s): Reinhard Tartler
Date: 2012-09-02 16:29:46 UTC
Revision ID: package-import@ubuntu.com-20120902162946-i1zpl8cjngq9hd6w

Tags: upstream-2.0.0+debian

Import upstream version 2.0.0+debian

files added:

AUTHORS

BUGS

CHANGES

COPYING

ChangeLog

HINTS

INSTALL

INSTALL.real

Makefile.am

Makefile.in

NEWS

PLANS

README

README.AltiVec

README.DV

README.avilib

README.glav

README.lavpipe

README.transist

TODO

acinclude.m4

aclocal.m4

aenc

aenc/Makefile.am

aenc/Makefile.in

aenc/README

aenc/common.c

aenc/common.h

aenc/encode.c

aenc/encoder.h

aenc/fft.c

aenc/musicin.c

aenc/psy.c

aenc/table_absthr.h

aenc/table_alloc.h

aenc/table_cb.h

aenc/table_enwindow.h

aenc/table_th.h

aenc/tables.c

aenc/tonal.c

aenc/wav_io.c

aenc/wav_io.h

autogen.sh

compile

config.guess

config.h.in

config.sub

configure

configure.ac

cpuinfo.sh

depcomp

docs

docs/FAQ.txt

docs/Makefile.am

docs/Makefile.in

docs/authors.sgml

docs/jpeg2yuv.1

docs/lav2mpeg.1

docs/lav2wav.1

docs/lav2yuv.1

docs/lavpipe.1

docs/lavplay.1

docs/lavrec.1

docs/lavtools.sgml

docs/lavtrans.1

docs/mjpeg-howto.info

docs/mjpegtools.1

docs/mp2enc.1

docs/mpeg2enc.1

docs/mplex.1

docs/pgmtoy4m.1

docs/png2yuv.1

docs/pnmtoy4m.1

docs/ppmtoy4m.1

docs/y4mcolorbars.1

docs/y4mdenoise.1

docs/y4mtopnm.1

docs/y4mtoppm.1

docs/y4munsharp.1

docs/yuv2lav.1

docs/yuv4mpeg.5

docs/yuvdenoise.1

docs/yuvfps.1

docs/yuvinactive.1

docs/yuvkineco.1

docs/yuvmedianfilter.1

docs/yuvplay.1

docs/yuvscaler.1

docs/yuvycsnoise.1

install-sh

lavtools

lavtools/Makefile.am

lavtools/Makefile.in

lavtools/audiolib.c

lavtools/audiolib.h

lavtools/avilib.c

lavtools/avilib.h

lavtools/colorspace.c

lavtools/colorspace.h

lavtools/editlist.c

lavtools/editlist.h

lavtools/frequencies.c

lavtools/frequencies.h

lavtools/glav.c

lavtools/glav.h

lavtools/glav_main.c

lavtools/jpeg2yuv.c

lavtools/jpegutils.c

lavtools/jpegutils.h

lavtools/lav2wav.c

lavtools/lav2yuv.c

lavtools/lav_common.c

lavtools/lav_common.h

lavtools/lav_io.c

lavtools/lav_io.h

lavtools/lavaddwav.c

lavtools/lavinfo.c

lavtools/lavpipe.c

lavtools/lavplay.c

lavtools/lavrec.c

lavtools/lavtrans.c

lavtools/lavvideo.c

lavtools/liblavplay.c

lavtools/liblavplay.h

lavtools/liblavrec.c

lavtools/liblavrec.h

lavtools/matteblend.flt.c

lavtools/mjpeg_simd_helper.c

lavtools/multiblend.flt.c

lavtools/pipelist.c

lavtools/pipelist.h

lavtools/png2yuv.c

lavtools/pnmtoy4m.c

lavtools/ppmtoy4m.c

lavtools/subsample.c

lavtools/subsample.h

lavtools/testrec.c

lavtools/transist.flt.c

lavtools/y4mcolorbars.c

lavtools/y4mstabilizer.c

lavtools/y4mtopnm.c

lavtools/y4mtoppm.c

lavtools/ypipe.c

lavtools/yuv2lav.c

lavtools/yuvfps.c

lavtools/yuvinactive.c

lavtools/yuvplay.c

ltmain.sh

missing

mjpeg_howto.txt

mjpegtools.pc

mjpegtools.pc.in

mjpegtools.spec

mjpegtools.spec.in

mpeg2enc

mpeg2enc/ChangeLog

mpeg2enc/INSTALL

mpeg2enc/Makefile.am

mpeg2enc/Makefile.in

mpeg2enc/NOTES

mpeg2enc/README

mpeg2enc/TODO

mpeg2enc/channel.hh

mpeg2enc/conform.cc

mpeg2enc/elemstrmwriter.cc

mpeg2enc/elemstrmwriter.hh

mpeg2enc/encoderparams.cc

mpeg2enc/encoderparams.hh

mpeg2enc/encodertypes.h

mpeg2enc/fdct.c

mpeg2enc/fdct_mmx.c

mpeg2enc/fdct_x86.c

mpeg2enc/idct.c

mpeg2enc/idct_mmx.c

mpeg2enc/imageplanes.cc

mpeg2enc/imageplanes.hh

mpeg2enc/macroblock.cc

mpeg2enc/macroblock.hh

mpeg2enc/motionest.cc

mpeg2enc/mpeg2coder.cc

mpeg2enc/mpeg2coder.hh

mpeg2enc/mpeg2enc.cc

mpeg2enc/mpeg2encoder.cc

mpeg2enc/mpeg2encoder.hh

mpeg2enc/mpeg2encoptions.cc

mpeg2enc/mpeg2encoptions.hh

mpeg2enc/mpeg2encparams.h

mpeg2enc/mpeg2syntaxcodes.h

mpeg2enc/ontheflyratectlpass1.cc

mpeg2enc/ontheflyratectlpass1.hh

mpeg2enc/ontheflyratectlpass2.cc

mpeg2enc/ontheflyratectlpass2.hh

mpeg2enc/picture.cc

mpeg2enc/picture.hh

mpeg2enc/picturereader.cc

mpeg2enc/picturereader.hh

mpeg2enc/predcomp_mmx.c

mpeg2enc/predcomp_mmxe.c

mpeg2enc/predict.cc

mpeg2enc/predict_mmx.c

mpeg2enc/predict_ref.c

mpeg2enc/predict_ref.h

mpeg2enc/predict_x86.c

mpeg2enc/putpic.cc

mpeg2enc/quant_mmx.c

mpeg2enc/quantize.cc

mpeg2enc/quantize.hh

mpeg2enc/quantize_precomp.h

mpeg2enc/quantize_ref.c

mpeg2enc/quantize_ref.h

mpeg2enc/quantize_x86.c

mpeg2enc/rate_complexity_model.cc

mpeg2enc/rate_complexity_model.hh

mpeg2enc/ratectl.cc

mpeg2enc/ratectl.hh

mpeg2enc/seqencoder.cc

mpeg2enc/seqencoder.hh

mpeg2enc/seqstats.cc

mpeg2enc/seqstats.hh

mpeg2enc/simd.h

mpeg2enc/stats.cc

mpeg2enc/streamstate.cc

mpeg2enc/streamstate.h

mpeg2enc/synchrolib.cc

mpeg2enc/synchrolib.h

mpeg2enc/syntaxconsts.h

mpeg2enc/tables.c

mpeg2enc/tables.h

mpeg2enc/transfrm.cc

mpeg2enc/transfrm_ref.c

mpeg2enc/transfrm_ref.h

mpeg2enc/transfrm_x86.c

mplex

mplex/COPYING

mplex/Doxyfile

mplex/INSTRUCT

mplex/Makefile.am

mplex/Makefile.in

mplex/README

mplex/TODO

mplex/ac3strm_in.cpp

mplex/audiostrm.hpp

mplex/audiostrm_out.cpp

mplex/aunit.hpp

mplex/aunitbuffer.hpp

mplex/bits.cpp

mplex/bits.hpp

mplex/decodebufmodel.cpp

mplex/decodebufmodel.hpp

mplex/dtsstrm_in.cpp

mplex/inputstrm.cpp

mplex/inputstrm.hpp

mplex/interact.cpp

mplex/interact.hpp

mplex/lpcmstrm_in.cpp

mplex/main.cpp

mplex/mpastrm_in.cpp

mplex/mpeg_systems_paper_0.99.ps.gz

mplex/mplexconsts.hpp

mplex/multiplexor.cpp

mplex/multiplexor.hpp

mplex/outputstrm.hpp

mplex/padstrm.cpp

mplex/padstrm.hpp

mplex/stillsstream.cpp

mplex/stillsstream.hpp

mplex/stream_params.cpp

mplex/stream_params.hpp

mplex/subpstream.cpp

mplex/systems.cpp

mplex/systems.hpp

mplex/videostrm.hpp

mplex/videostrm_in.cpp

mplex/videostrm_out.cpp

scripts

scripts/Makefile.am

scripts/Makefile.in

scripts/anytovcd.sh

scripts/aufnahme

scripts/berechne

scripts/codiere

scripts/frameber

scripts/lav2avi.sh

scripts/lav2mpeg

scripts/lavtc.sh

scripts/makePLI.py

scripts/mpegtranscode

utils

utils/Makefile.am

utils/Makefile.in

utils/altivec

utils/altivec/Makefile.am

utils/altivec/Makefile.in

utils/altivec/README

utils/altivec/add_pred.c

utils/altivec/altivec_conf.h

utils/altivec/altivec_motion.h

utils/altivec/altivec_predict.h

utils/altivec/altivec_quantize.h

utils/altivec/altivec_transform.h

utils/altivec/amber.c

utils/altivec/amber.h

utils/altivec/benchmark.c

utils/altivec/benchmark.h

utils/altivec/bsad.c

utils/altivec/bsumsq.c

utils/altivec/bsumsq_sub22.c

utils/altivec/build_sub22_mests.c

utils/altivec/build_sub44_mests.c

utils/altivec/detect.c

utils/altivec/fdct.c

utils/altivec/fdct_idct.c

utils/altivec/field_dct_best.c

utils/altivec/find_best_one_pel.c

utils/altivec/idct.c

utils/altivec/iquant_intra.c

utils/altivec/iquant_non_intra.c

utils/altivec/motion.c

utils/altivec/pred_comp.c

utils/altivec/quant_non_intra.c

utils/altivec/quant_weight_coeff_sum.c

utils/altivec/quantize.c

utils/altivec/sad_00.c

utils/altivec/sad_01.c

utils/altivec/sad_10.c

utils/altivec/sad_11.c

utils/altivec/sub_mean_reduction.c

utils/altivec/sub_mean_reduction_ppc.S

utils/altivec/sub_pred.c

utils/altivec/subsample_image.c

utils/altivec/sumsq.c

utils/altivec/sumsq_sub22.c

utils/altivec/variance.c

utils/altivec/vectorize.h

utils/altivec/verify.h

utils/cpu_accel.c

utils/cpu_accel.h

utils/cpuinfo.c

utils/fastintfns.h

utils/format_codes.h

utils/mjpeg_logging.c

utils/mjpeg_logging.h

utils/mjpeg_types.h

utils/mmx.h

utils/mmxsse

utils/mmxsse/Makefile.am

utils/mmxsse/Makefile.in

utils/mmxsse/build_sub22_mests.c

utils/mmxsse/build_sub44_mests.c

utils/mmxsse/find_best_one_pel.c

utils/mmxsse/mblock_bsad_mmx.c

utils/mmxsse/mblock_bsumsq_mmx.c

utils/mmxsse/mblock_sad_mmx.c

utils/mmxsse/mblock_sad_mmxe.c

utils/mmxsse/mblock_sub44_sads_x86.c

utils/mmxsse/mblock_sub44_sads_x86.h

utils/mmxsse/mblock_sub44_sads_x86_h.c

utils/mmxsse/mblock_sumsq_mmx.c

utils/mmxsse/mmxsse_motion.h

utils/mmxsse/motion.c

utils/motionsearch.c

utils/motionsearch.h

utils/mpegconsts.c

utils/mpegconsts.h

utils/mpegtimecode.c

utils/mpegtimecode.h

utils/videodev_mjpeg.h

utils/yuv4mpeg.c

utils/yuv4mpeg.h

utils/yuv4mpeg_intern.h

utils/yuv4mpeg_ratio.c

y4mdenoise

y4mdenoise/Allocator.hh

y4mdenoise/BitmapRegion2D.hh

y4mdenoise/DoublyLinkedList.hh

y4mdenoise/Limits.hh

y4mdenoise/Makefile.am

y4mdenoise/Makefile.in

y4mdenoise/MotionSearcher.hh

y4mdenoise/PlacementAllocator.hh

y4mdenoise/ReferenceFrame.hh

y4mdenoise/Region2D.hh

y4mdenoise/SearchBorder.hh

y4mdenoise/SearchWindow.hh

y4mdenoise/Set.hh

y4mdenoise/SetRegion2D.hh

y4mdenoise/SkipList.hh

y4mdenoise/Status_t.h

y4mdenoise/TemplateLib.hh

y4mdenoise/VariableSizeAllocator.hh

y4mdenoise/Vector.hh

y4mdenoise/implementation.html

y4mdenoise/main.c

y4mdenoise/newdenoise.cc

y4mdenoise/newdenoise.hh

y4mdenoise/regiontest.cc

y4munsharp

y4munsharp/Makefile.am

y4munsharp/Makefile.in

y4munsharp/y4munsharp.c

y4mutils

y4mutils/Makefile.am

y4mutils/Makefile.in

y4mutils/pgmtoy4m.c

y4mutils/qttoy4m.c

y4mutils/y4mblack.c

y4mutils/y4mhist.c

y4mutils/y4minterlace.c

y4mutils/y4mivtc.c

y4mutils/y4mshift.c

y4mutils/y4mspatialfilter.c

y4mutils/y4mtoqt.c

y4mutils/y4mtoyuv.c

y4mutils/yuv4mpeg.c

y4mutils/yuvmedianfilter.c

y4mutils/yuyvtoy4m.c

yuvcorrect

yuvcorrect/Makefile.am

yuvcorrect/Makefile.in

yuvcorrect/yuvcorrect.c

yuvcorrect/yuvcorrect.h

yuvcorrect/yuvcorrect_functions.c

yuvcorrect/yuvcorrect_tune.c

yuvdeinterlace

yuvdeinterlace/Makefile.am

yuvdeinterlace/Makefile.in

yuvdeinterlace/yuvdeinterlace.cc

yuvdenoise

yuvdenoise/Makefile.am

yuvdenoise/Makefile.in

yuvdenoise/main.c

yuvfilters

yuvfilters/ChangeLog

yuvfilters/Makefile.am

yuvfilters/Makefile.in

yuvfilters/README.2-3pulldown

yuvfilters/TODO

yuvfilters/addtask.c

yuvfilters/alloctask.c

yuvfilters/initframe.c

yuvfilters/main.c

yuvfilters/putframe.c

yuvfilters/yuvfilters.h

yuvfilters/yuvkineco.c

yuvfilters/yuvstdin.c

yuvfilters/yuvstdout.c

yuvfilters/yuvycsnoise.c

yuvscaler

yuvscaler/Makefile.am

yuvscaler/Makefile.in

yuvscaler/yuvscaler.c

yuvscaler/yuvscaler.h

yuvscaler/yuvscaler_bicubic.c

yuvscaler/yuvscaler_implementation.txt

yuvscaler/yuvscaler_resample.c

Show diffs side-by-side

added added

removed removed

y4mdenoise/implementation.html

<html>

<title>Design and implementation of the new denoiser</title>

<center><h1>Design and implementation of the new denoiser</h1></center>

<p>In theory, the design of the denoiser is pretty simple; getting it

to perform was the hard part.

<p>It maintains a list of the last several frames, called <i>reference

frames</i>. Each reference frame is composed of <i>reference

pixels</i>, which accumulate the values of several pixels.

Every time a pixel in one frame is proven to be a moved instance of a

pixel in another frame, the reference-pixel incorporates its value,

and produces an average value for the pixel. The oldest reference

frame, therefore, gets a pretty good idea of the real value of every

pixel, but of course output is delayed by the number of reference

frames.

<p>It compares every pixel in the current frame with all pixels

in the previous frame, within a given search-radius, and any pixels

that are equal within the given error tolerance are assumed to be the

same pixel. It builds contiguous regions of matched pixels, with

the motion vector that's common to the region.

<p>If there are too many matches for a particular area of the image, or

if the largest contiguous match in the area is too large, it's applied

to the image right then, and then searching continues. Applying a

region means to flood-fill the region (to make it the largest size

possible, and to flesh out its borders to pixel accuracy), then

hooking up the corresponding reference-frame pixels to the new frame

at their new location, and incorporating the values of all the new

pixels into the corresponding reference pixels. Doing this before

the end of searching the frame means the affected areas don't have

to be part of the search any more, helping to reduce the amount of

work needed to search the rest of the frame.

<p>At the end of the frame, matches are applied to the new frame, from

the largest to the smallest, discounting any areas that have

already been resolved. Any new-frame pixels not resolved by now

are considered to be new information, and a new reference-pixel is

generated for each one.

<p>The search is not actually done one pixel at a time; it's done in

terms of pixel groups. An entire pixel-group has to match for any

match to be found, but all possible pixel-groups are tested (i.e. all

possible overlaps are checked). Using pixel-groups helps to establish

a minimum standard for what may be considered a match, in order to

avoid finding lots of really small (and really useless) matches.

The flood-fill still extends the matches out to pixel accuracy,

so the only details that can't be found by motion-detection are the

ones smaller than a pixel-group, which is not a bad sacrifice for

performance's sake.

<p><br>Table of contents:

<ul>

<li><a href="#Overview">Overview</a>

<li><a href="#Implementation">Implementation</a>

<ul>

<li><a href="#ImplementationSkipList">SkipList, Set</a>

<li><a href="#ImplementationRegion2D">Region2D, SetRegion2D,

BitmapRegion2D</a>

<li><a href="#ImplementationReferenceFrame">Pixel, ReferencePixel,

ReferenceFrame</a>

<li><a href="#ImplementationMotionSearcher">MotionSearcher,

SearchWindow, SearchBorder</a>

<ul>

<li><a href="#ImplementationMotionSearcherVersion1">Version 1</a>

<li><a href="#ImplementationMotionSearcherVersion2">Version 2</a>

</ul>

</ul>

<li><a href="#FutureExtensions">Future Extensions</a>

</ul>

<a name="Overview"><h1>Overview</h1></a>

<p><tt>main.c</tt> parses command-line options and the YUV stream header.

<tt>newdenoise.cc</tt> converts between YUV format and the denoiser's

internal format, and calls the denoiser. <tt>MotionSearcher.hh</tt> is

the denoiser's top-level file. <tt>SearchWindow.hh</tt> and

<tt>SearchBorder.hh</tt> are two high-level pieces of the denoiser that

were broken out into their own classes, for use in other contexts.

<tt>ReferenceFrame.hh</tt> contains the definitions for pixels,

reference pixels, and reference frames.

<tt>Region2D.hh</tt> is the base class for 2-dimensional region classes;

<tt>SetRegion2D.hh</tt> implements a region using a Set of horizontal

extents, and <tt>BitmapRegion2D.hh</tt> uses an array of integers to

implement a bitmap. <tt>Set.hh</tt> is much like the STL "set" class,

except that it's based on <tt>SkipList.hh</tt>. <tt>Allocator.hh</tt>,

<tt>DoublyLinkedList.hh</tt>, <tt>Limits.hh</tt>, <tt>Status_t.h</tt>, and

<tt>TemplateLib.hh</tt> contain other basic definitions, most of which

should be standardly available; I'm just not sure they're standardly

available on all supported platforms.

<p>The denoiser classes are highly templated and highly reconfigurable;

<tt>newdenoise.cc</tt> uses them in a way suited to YUV420P video.

Intensity pixels are one 8-bit unsigned integer, color pixels are

two 8-bit unsigned integers, intensity pixel-groups are 4x2, color

pixel-groups are 2x2, intensity is denoised separately from color, and

the search-radius used for color is proportional to the relative size

of the intensity and color planes (and may, in effect, be

rectangular).

<br>

<a name="Implementation"><h1>Implementation</h1></a>

<p><tt>newdenoise.cc</tt> gives a good top-level view of how to use the

denoiser for YUV420P video. Although the top-level class of the

denoiser is <tt>MotionSearcher</tt>, a small army of classes is

100

responsible for implementing all the necessary pieces.

101

102

<a name="ImplementationSkipList"><h2>SkipList, Set</h2></a>

103

<p><tt>SkipList</tt> is a highly optimized version of the famous

104

probabilistically-balanced logarithmic-complexity sorted list

105

structure. Skip lists are well-described in other documents. Note

106

that this skip-list uses the "fix the dice" and "search finger"

107

extensions described in the literature, and its p value is

108

<sup>1</sup>/e, which maximizes speed and causes nodes to have an

109

average of 1.71 forward pointers. (A tree node would have to have

110

2 pointers, one for left and one for right, so a skip-list is more

111

space-efficient than a tree structure also.)

112

<p>One big advantage of skip-lists over tree structures, given the way

113

the denoiser uses them, is that iterator forward/backward operations

114

are small-constant complexity; they're implemented by a single pointer

115

dereference. The typical tree-structure iterator forward/backward is

116

logarithmic. Iterator forward/backward is used constantly throughout

117

the denoiser.

118

<p><tt>Set</tt> is much like STL's <tt>set</tt> class, except that it's

119

based on <tt>SkipList</tt>.

120

121

<a name="ImplementationRegion2D"><h2>Region2D, SetRegion2D,

122

BitmapRegion2D</h2></a>

123

<p><tt>SetRegion2D</tt> was the first region class written for the

124

denoiser; later, <tt>Region2D</tt> and <tt>SetRegion2D</tt> were split

125

into two classes, and <tt>BitmapRegion2D</tt> was made a subclass of

126

<tt>Region2D</tt>. It was not a perfect separation, and <tt>Region2D</tt>

127

remains a sketch of what I'd like to see, rather than a completed

128

product. I could solve its problem using virtual methods, but that

129

would prevent a lot of function-inlining from happening, and for

130

performance reasons I don't want to do that.

131

<p><tt>SetRegion2D</tt> uses <tt>Set</tt> to implement regions as a set of

132

horizontal extents, i.e. as y/x-start/x-end triplets. Quite a bit of

133

work went into writing efficient union/subtraction methods.

134

<p><tt>BitmapRegion2D</tt> uses an array of integers, treated like a bit

135

field, to implement regions. It's faster to use them in some cases,

136

though they're a lot less memory-efficient than <tt>SetRegion2D</tt>,

137

and have to be created with a maximum size.

138

139

<a name="ImplementationReferenceFrame"><h2>Pixel, ReferencePixel,

140

ReferenceFrame</h2></a>

141

<p>The <tt>Pixel</tt> class is templated with a numeric type for storing

142

pixel values, the number of dimensions in the pixel's value, and

143

a numeric type to use when doing tolerance calculations. The rule of

144

thumb is, the tolerance type should be able to hold the value of two

145

pixel-value types multiplied together.

146

<p>For YUV420P video, a Y pixel is

147

<tt>Pixel<uint8_t,1,int32_t></tt> and a color (i.e. CbCr) pixel

148

is <tt>Pixel<uint8_t,2,int32_t></tt>.

149

<p>The <tt>Pixel</tt> class contains methods to get and set the value of

150

pixels, and to compare two pixels within a given tolerance. It also

151

contains methods to generate tolerance values from integers, in case

152

the pixel type has special rules. (For instance, the tolerance value

153

for a color pixel is the square of its integer counterpart, since CbCr

154

color is 2-dimensional.)

155

<p>The <tt>ReferencePixel</tt> is templated much like the <tt>Pixel</tt>

156

class. It holds a sum of pixel values, and the number of pixel values

157

summed so far. It also counts the number of reference-frames that

158

point to it. It's intended to represent a single pixel that's found

159

to exist over several frames, and to produce an average value for the

160

pixel, so as to smooth away errors.

161

<p>The <tt>ReferenceFrame</tt> is a rectangular array of

162

<tt>ReferencePixel</tt>s, representing each frame and the parts of the

163

image that it has in common with other frames.

164

165

<a name="ImplementationMotionSearcher"><h2>MotionSearcher,

166

SearchWindow, SearchBorder</h2></a>

167

<p>OK, so much for the easy part.

168

<p><tt>MotionSearcher</tt> maintains a circular list of

169

<tt>ReferenceFrame</tt>s. To make space for a new frame, the oldest

170

frame is returned to the client.

171

<p><tt>AddFrame()</tt> is responsible for processing new frames. It does

172

so in several stages. First, it looks for pixels that haven't moved,

173

i.e. new pixels whose corresponding reference-pixels are within the

174

error tolerance. That resolves most of the average frame.

175

<p>Next, it detects moved areas, i.e. parts of the new frame that match

176

parts of the previous frame except that they've moved.

177

<p>It could iterate through the frame in any order, but to keep the

178

implementation of <tt>SearchWindow</tt> and <tt>SearchBorder</tt> simple

179

and efficient, it iterates through the frame in a zigzag pattern,

180

i.e. starting at the upper-left corner, it moves right to the edge,

181

then down a line, then left to the edge, then down a line, and so on

182

to the end of the frame.

183

<p>The search-window consists of the reference-frame's pixels,

184

partitioned into search-window cells. Each cell contains a

185

pixel-group (i.e. a rectangular array of pixels, containing the

186

minimum pixel pattern that can be searched for). The pixel-groups

187

in each cell overlap other cells; although the motion-search is done

188

in terms of pixel-groups, it still looks at all possible

189

combinations of pixels that could form a pixel-group.

190

<p>The pixel-sorter is a tree structure that partitions pixel-groups

191

(actually, search-window cells, which contain a pixel-group).

192

The total number of dimensions of a pixel-group is the number of

193

pixels in the group, times the dimension of a pixel. For the

194

YUV420 implementation, 4x2 pixel-groups are used for intensity pixels,

195

which consist of 1 dimension, for a total of 8, and 2x2 pixel groups

196

are used for color pixels, which consist of 2 dimensions, again for a

197

total of 8. Partitioning n dimensions requires 2<sup>n</sup>

198

branches per tree node; in this example, that's 256. (So if the

199

pixel-sorter tree is well-balanced, then descending to a child branch

200

cuts out all but <sup>1</sup>/256 of the remaining pixel-groups, which

201

is supposed to make searching for matching pixel-groups very efficient.)

202

Search-window cells are inserted into the pixel-sorter tree, and

203

descend into child branches based on their value. But if any of the

204

pixel-group's pixel dimension values are within the error tolerance of

205

the split-point for that dimension in the current pixel-sorter branch

206

node, then that pixel-group won't fit neatly into any of the children

207

nodes, and thus the search-window cell has to stay at that level of

208

the tree. (Alternatively, a copy of it could be placed in multiple

209

children, but this design opts not to do that.) Each pixel-sorter

210

branch node maintains a doubly-linked list of search-window cells that

211

are attached to it. As an optimization, once a search-window cell is

212

inserted into the pixel-sorter, that result is used for the rest of

213

the frame, as the search-window cell is added to and removed from the

214

pixel-sorter, depending on whether that search-window cell is within

215

the search radius of the current new-frame pixel-group.

216

<p>To look for matches between the current pixel-group from the new

217

frame, and all pixel-groups from the previous frame within the search

218

radius, one just matches the current pixel-group to every

219

search-window cell attached to the pixel-sorter branch nodes, and

220

descends the tree according to the new pixel-group's values. (One

221

optimization is possible here: If the search-window cell was forced

222

to stop at that level of the pixel-sorter because one of its pixel

223

values was within the tolerance of the split value of that

224

pixel-sorter branch node, and none of the current pixel-group's

225

pixel values are within twice the tolerance of the split value

226

of that pixel-sorter branch node, then we can save time and avoid the

227

comparison, for no search-window cell that had to stop at that level

228

could possibly intersect the new pixel-group. This especially helps

229

in the presence of low error thresholds.)

230

<p>As matches are found, the search-border builds contiguous regions of

231

matches that all have the same motion-vector. (The "border" is the

232

border between the searched area and the not-yet-searched area.)

233

It's designed to move through the regions of matches in a zigzag

234

pattern, and constantly maintain a list of all regions that would

235

be contiguous with the current new-frame pixel-group. When a match

236

is found, all such regions with the same motion-vector are now

237

contiguous, once the current pixel-group's area is added.

238

<p>The search-border is implemented by sets of startpoints/endpoints.

239

Every horizontal extent (that could potentially intersect a

240

new-frame pixel-group) of every region under construction along the

241

border is represented in the set of startpoints/endpoints. The

242

search-border also has two arrays of set iterators, one for

243

startpoints, one for endpoints. As the search zig-zags across the

244

new frame, these two arrays of iterators keep track of all regions

245

that will be contiguous with the current new-frame pixel-group, and

246

all regions that are no longer contiguous with the current new-frame

247

pixel-group; by doing this, it's very efficient to maintain the set

248

of border regions that would be contiguous with the current new-frame

249

pixel-group.

250

<p>The general idea is to analyze the entire frame like this, then run

251

through the found regions from largest to smallest, and apply them to

252

the new frame. This can be a lot of data, too much in fact. To

253

limit the search to a reasonable complexity, two throttles exist --

254

one on the number of matches in the area of the current pixel-group,

255

and one on the size of the largest match in the area of the

256

current pixel-group. If there are too many regions in the area,

257

or if the biggest region in the area is too large, then the best

258

region found so far is chosen, all other regions in the area are

259

thrown away, and that best region is applied to the new frame right

260

then. This will eliminate pixel-groups from consideration in the

261

search-window and pixel-sorter, which will save time in the search.

262

This will also resolve new-frame pixels; only pixel-groups that

263

contain nothing but unresolved pixels can be searched for in the

264

pixel-sorter, which also saves time in the remainder of the search.

265

Only after the entire frame is analyzed are regions applied from

266

largest to smallest.

267

<p>Before a match is applied to the new frame, it's flood-filled in

268

order to resolve its entire extent. Searching is done in terms of

269

pixel-groups, so it won't be able to find any detail that's smaller

270

than a pixel-group. Also, the region may not have been completed, if

271

it was chosen because a throttle value was exceeded, so its full

272

extent is not known. Plus, parts of that match may have already

273

been resolved. The flood-fill takes care of all of these situations.

274

<p>Any pixels not found by the above searches are declared to be new

275

information, and new reference-pixels are allocated for all such

276

new-frame pixels.

277

<p>The whole point of this design is to use as many high-level-design

278

features as possible to reduce the amount of work necessary to perform

279

the job. It attempts to accomplish this with a heavy reliance on

280

data structures over more mathematical algorithms, a drive to

281

locate sub-linear/sub-quadratic algorithms for common tasks (e.g.

282

the pixel-sorter tree, which reduced quadratic to logarithmic, and

283

the iterator arrays in the search-border, which reduced logarithmic

284

to small-constant), and to use data structure design to understand

285

the problem in ways that directly lead to efficient implementations.

286

287

<a name="ImplementationMotionSearcherVersion1"><h3>Version 1</h3></a>

288

<p>The above discussion describes the intent of the first version of

289

the denoiser (which I'm calling version 0). However, the very last

290

high-level change I made to it, right before releasing it under GPL,

291

was defective! In effect, the match-count throttle was always 1, and

292

the best match was applied every pixel-group! It was intended

293

to be a performance increase, and it was, but obviously it broke the

294

code...except that this bugged change also vastly increased the

295

quality! There is every reason in the world to believe that such a

296

bug should have broken the denoiser's quality, except that it didn't.

297

What a stroke of luck!

298

<p>I decided to take the implications of this accidental discovery to

299

the next logical level. Before, I wouldn't have believed that the

300

best match could be found without amassing a large list of

301

possibilities from several pixel-group searches. Now, each match

302

found is flood-filled, and the first one to exceed the match-size

303

throttle is applied to the image right then and there, and all other

304

possibilities aren't considered. So there is no big list of regions

305

to try at the end.

306

<p>This version performed better than the bugged version, which is

307

surprising enough, but the quality was vastly improved too.

308

<p>Parallel processing was added at this time too. Color can be

309

denoised in a thread separate from intensity denoising, and

310

reading/writing frames can be moved into separate threads too.

311

312

<a name="ImplementationMotionSearcherVersion2"><h3>Version 2</h3></a>

313

<p>If match-size-throttling is in use (which it usually is), now it

314

picks the largest such match, instead of the first match that's larger

315

than the throttle size. This led to a pretty serious increase in quality!

316

<p>Parallel processing was modified so that the reader/writer threads can be

317

used independently of the denoiser threads. This may not be very useful,

318

but there was no good reason to prevent it.

319

320

<!--

321

322

<p>

323

-->

324

325

<a name="FutureExtensions"><h1>Future Extensions</h1></a>

326

<p>The motion-detector is highly parallel, and a better multi-threaded

327

version should be written. So far, color and intensity can be

328

analyzed separately. But a thread could conceivably denoise one half of

329

the remaining area of an image plane. The pixel-sorter would have to

330

become its own class for this to work, since there'd now be more than

331

one per search-window, and the search-window would have to keep

332

pixel-sorters from colliding with each other (i.e. the areas being

333

searched by each can't overlap). Also, depending on how efficient

334

the thread-synchronization methods are, the pixel-sorter could feed

335

results to the flood-filling stage. Perhaps both approaches can be

336

taken. Anything that allows the denoiser to fill up processors is

337

probably worth trying.

338

<p>The motion-detector should probably be able to find matches in

339

more than one previous frame. I'd probably want to avoid later-frame

340

matches that occur in earlier frames, for efficiency's sake.

341

<p>The search-border should allow the insertion of new regions. It

342

would need a method, implemented somewhat like <tt>AddNewMatch()</tt>,

343

to generate a startpoint/endpoint for every horizontal extent in the

344

region that intersected the border area. This could be used to make

345

a <tt>ChooseBestActiveRegion()</tt> that eliminated flood-filled areas

346

from the other regions on the border and then put those regions back

347

into the border. I don't know if this would speed things up, though.

348

<p>I think the search-border can be used to implement removal of

349

transient phenomena, e.g. film lint/scratches, LaserDisc rot,

350

analog-broadcast static, etc. After the new frame has had motion

351

detection run on it, look at the 2nd-to-oldest frame, and build

352

contiguous regions of pixels that have the same reference count.

353

(Film lint/scratches will be limited to 1 reference count; I think

354

LaserDisc rot can extend over several frames.) If a region has

355

the right shape and the expected contents for a known sort of

356

artifact, it's declared to be an instance of that artifact, and a

357

blend involving the next/previous frame is used to generate the values

358

of pixels affected by the artifact. We'll probably want to take the

359

result of motion-detection into account too.

360

<p>I think the search-window could replace the radius-search in

361

yuvmedianfilter. It could even do motion-detection for mpeg2enc.

362

363

364

<a href="mailto:ulatec@users.sourceforge.net">Steven Boswell</a>.

365

366

<br>Released to the public under the GNU General Public License v2.

367

See the file COPYING for more information.

368

</body>

369

</html>

Older »