~timo-jyrinki/ubuntu/trusty/pitivi/backport_utopic

~timo-jyrinki/ubuntu/trusty/pitivi/backport_utopic_fixes

Viewing changes to pitivi/timeline/alignalgs.py

Committer: Bazaar Package Importer
Author(s): Jeremy Bicha
Date: 2011-08-15 02:32:20 UTC
mfrom: (1.5.3 upstream)
Revision ID: james.westby@ubuntu.com-20110815023220-x2n5l0i4deiqn7dn

Tags: 0.14.2-0ubuntu1

* New upstream version.
  - New Mallard format help
* debian/control:
  - Add gnome-doc-utils to build-depends
  - Bump pygtk minimum to 2.24
* debian/patches/01_lpi.patch
  - Move LPI items below User Manual in Help menu
* debian/watch: Watch for 0.14.* tar.bz2

files added:
data/pixmaps/pitivi-align-24.svg

data/pixmaps/pitivi-align.svg

data/ui/cliptransformation.ui

data/ui/depsmanager.ui

gnome-doc-utils.make

help

help/C

help/C/about.page

help/C/crossfading.page

help/C/effects.page

help/C/effectsanimation.page

help/C/fadeinfadeout.page

help/C/figures

help/C/figures/fadestep1.png

help/C/figures/fadestep2.png

help/C/figures/fadestep3.png

help/C/figures/filechooser.png

help/C/figures/hovering.png

help/C/figures/keyframecurves.png

help/C/figures/layers.png

help/C/figures/logo.png

help/C/figures/previewsource.png

help/C/figures/ripple-after.png

help/C/figures/ripple-before.png

help/C/figures/roll-after.png

help/C/figures/roll-before.png

help/C/figures/ruler.png

help/C/figures/trimming-individual.png

help/C/gstreamer.page

help/C/importing.page

help/C/importingmpegts.page

help/C/index.page

help/C/insertintimeline.page

help/C/interface.page

help/C/keyframecurves.page

help/C/layers.page

help/C/license.page

help/C/mainwindow.page

help/C/makeselections.page

help/C/medialibrary.page

help/C/movearoundtimeline.page

help/C/othertransitions.page

help/C/projectsettings.page

help/C/rendering.page

help/C/saveproject.page

help/C/selectunusedfiles.page

help/C/splitting.page

help/C/sysreq.page

help/C/trimming.page

help/C/usingclips.page

help/C/welcomedialog.page

help/Makefile.am

help/Makefile.in

pitivi/elements/extractionsink.py

pitivi/timeline/align.py

pitivi/timeline/alignalgs.py

pitivi/timeline/extract.py

pitivi/ui/alignmentprogress.py

pitivi/ui/depsmanager.py

files modified:
.pc/01_lpi.patch/pitivi/ui/mainwindow.py

ChangeLog

Makefile.am

Makefile.in

aclocal.m4

autogen.sh

bin/Makefile.in

common/Makefile.in

common/m4/Makefile.in

configure

configure.ac

data/Makefile.in

data/icons/16x16/Makefile.in

data/icons/22x22/Makefile.in

data/icons/24x24/Makefile.in

data/icons/32x32/Makefile.in

data/icons/48x48/Makefile.in

data/icons/Makefile.in

data/icons/scalable/Makefile.in

data/pitivi.desktop.in

data/pixmaps/Makefile.am

data/pixmaps/Makefile.in

data/ui/Makefile.am

data/ui/Makefile.in

data/ui/elementsettingsdialog.ui

data/ui/mainwindow.xml

data/ui/preferences.ui

data/ui/startupwizard.ui

debian/changelog

debian/control

debian/patches/01_lpi.patch

debian/watch

pitivi.spec

pitivi.spec.in

pitivi/Makefile.in

pitivi/application.py

pitivi/check.py

pitivi/configure.py

pitivi/configure.py.in

pitivi/discoverer.py

pitivi/elements/Makefile.am

pitivi/elements/Makefile.in

pitivi/factories/Makefile.in

pitivi/formatters/Makefile.in

pitivi/formatters/base.py

pitivi/formatters/etree.py

pitivi/log/Makefile.in

pitivi/pipeline.py

pitivi/project.py

pitivi/projectmanager.py

pitivi/settings.py

pitivi/signalinterface.py

pitivi/timeline/Makefile.am

pitivi/timeline/Makefile.in

pitivi/timeline/timeline.py

pitivi/timeline/track.py

pitivi/ui/Makefile.am

pitivi/ui/Makefile.in

pitivi/ui/clipproperties.py

pitivi/ui/common.py

pitivi/ui/dynamic.py

pitivi/ui/effectlist.py

pitivi/ui/effectsconfiguration.py

pitivi/ui/encodingdialog.py

pitivi/ui/gstwidget.py

pitivi/ui/mainwindow.py

pitivi/ui/prefs.py

pitivi/ui/previewer.py

pitivi/ui/projectsettings.py

pitivi/ui/startupwizard.py

pitivi/ui/timeline.py

pitivi/ui/timelinecanvas.py

pitivi/ui/trackobject.py

pitivi/ui/viewer.py

pitivi/utils.py

po/ca.po

po/cs.po

po/de.po

po/es.po

po/fr.po

po/ru.po

po/sk.po

po/sl.po

po/sr.po

po/sr@latin.po

po/uk.po

tests/Makefile.in

tests/test_pipeline.py

tests/test_signallable.py

Show diffs side-by-side

added added

removed removed

pitivi/timeline/alignalgs.py

# PiTiVi, Non-linear video editor

# timeline/alignalgs.py

# This program is free software; you can redistribute it and/or

# modify it under the terms of the GNU Lesser General Public

# License as published by the Free Software Foundation; either

# version 2.1 of the License, or (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU

# Lesser General Public License for more details.

# You should have received a copy of the GNU Lesser General Public

# License along with this program; if not, write to the

# Free Software Foundation, Inc., 51 Franklin St, Fifth Floor,

# Boston, MA 02110-1301, USA.

"""

Algorithms for aligning (i.e. registering, synchronizing) time series

"""

try:

import numpy

except ImportError:

numpy = None

def nextpow2(x):
    """
    Return the smallest power of two that is not less than x.

    The search starts at 1, so any x that is 1 or smaller yields 1.

    @param x: lower bound for the result
    @type x: Number
    @returns: the first value in 1, 2, 4, 8, ... that is >= x
    @rtype: L{int}
    """
    power = 1
    while power < x:
        power += power  # doubling keeps the result an exact integer
    return power

def submax(left, middle, right):
    """
    Find the extremum of a quadratic function from three samples.

    Given samples from a quadratic P(x) at x=-1, 0, and 1, find the x
    that extremizes P.  This is useful for determining the subsample
    position of the extremum given three samples around the observed
    extreme.

    @param left: value at x=-1
    @type left: L{float}
    @param middle: value at x=0
    @type middle: L{float}
    @param right: value at x=1
    @type right: L{float}
    @returns: value of x that extremizes the interpolating quadratic.
        A positive result means the extremum lies on the C{right} side
        of the middle sample.  If the three samples are collinear (for
        example all equal) there is no unique extremum and 0.0 is
        returned.
    @rtype: L{float}
    """
    L = middle - left   # L and R are both positive if middle is the
    R = middle - right  # observed max of the integer samples

    # Derivation: Consider a quadratic q(x) := P(0) - P(x).  Then q(x) has
    # two roots, one at 0 and one at z, and the extreme is at (0+z)/2
    # (i.e. at z/2)
    # q(x) = b*x*(x-z)       # b may be positive or negative
    # q(1) = b*(1 - z) = R
    # q(-1) = b*(1 + z) = L
    # (1+z)/(1-z) = L/R      (from here it's just algebra to find z)
    # z + 1 = L/R - (L/R)*z
    # z*(1+L/R) = L/R - 1
    # z = (L/R - 1)/(L/R + 1) = (L-R)/(L+R)
    denominator = L + R
    if denominator == 0:
        # Zero curvature: the samples lie on a straight line, so the
        # quadratic has no extremum.  Stay on the middle sample.
        return 0.0
    return 0.5 * (L - R) / denominator

def rigidalign(reference, targets):
    """
    Estimate the relative shift between reference and targets.

    The algorithm works by subtracting the mean, and then locating
    the maximum of the cross-correlation.  For inputs of length M{N},
    the running time is M{O(C{len(targets)}*N*log(N))}.

    @param reference: the waveform to regard as fixed
    @type reference: Sequence(Number)
    @param targets: the waveforms that should be aligned to reference
    @type targets: Sequence(Sequence(Number))
    @returns: The shift necessary to bring each target into alignment
        with the reference.  The returned shift may not be an integer,
        indicating that the best alignment would be achieved by a
        non-integer shift and appropriate interpolation.  An empty
        C{targets} yields an empty list.
    @rtype: Sequence(Number)
    """
    # targets is walked twice (once for the lengths, once for the actual
    # correlation), so materialize it in case it is a one-shot iterable.
    targets = list(targets)
    if not targets:
        return []

    # L is the maximum size of a cross-correlation between the
    # reference and any of the targets.
    L = len(reference) + max(len(t) for t in targets) - 1
    # We round up L to the next power of 2 for speed in the FFT.
    L = nextpow2(L)
    reference = numpy.asarray(reference)
    reference = reference - numpy.mean(reference)
    fref = numpy.fft.rfft(reference, L).conj()
    shifts = []
    for t in targets:
        t = numpy.asarray(t)
        t = t - numpy.mean(t)
        # Compute cross-correlation.  The output length is passed
        # explicitly so that it is always L samples long.
        xcorr = numpy.fft.irfft(fref * numpy.fft.rfft(t, L), L)
        # shift maximizes dotproduct(t[shift:],reference)
        # int() to convert numpy.int32 to python int
        shift = int(numpy.argmax(xcorr))
        # The neighbours are taken modulo L because the correlation is
        # circular.
        subsample_shift = submax(xcorr[(shift - 1) % L],
                                 xcorr[shift],
                                 xcorr[(shift + 1) % L])
        shift = shift + subsample_shift
        # shift is now a float indicating the interpolated maximum
        if shift >= len(t):  # Negative shifts appear large and positive
            shift -= L       # This corrects them to be negative
        # Sign reversed to move the target instead of the reference
        shifts.append(-shift)
    return shifts

117

118

119

def _findslope(a):
    """
    Helper function for affinealign.

    The provided matrix a contains a bright line whose slope we want to
    know, against a noisy background.
    The line starts at 0,0.  If the slope is positive, it runs toward the
    center of the matrix (i.e. toward (-1,-1)).
    If the slope is negative, it wraps from 0,0 to 0,-1 and continues
    toward the center, (i.e. toward (-1,0)).
    The line segment terminates at the midline along the X direction.
    We locate the line by simply checking the sum along each possible line
    up to the Y-max edge of a.  The caller sets the limit by choosing the
    size of a.

    @param a: two-dimensional matrix to search
    @type a: numpy array
    @returns: the slope of the candidate line with the largest sum,
        assuming that the matrix has "square pixels".  Lines whose sum is
        not strictly greater than 0 are never selected, in which case the
        result is 0.0.
    @rtype: L{float}
    """
    Y, X = a.shape
    # Only half of the columns belong to each direction.  Floor division
    # keeps X an integer regardless of the interpreter's "/" semantics;
    # it is used below to build integer index arrays.
    X //= 2
    x_pos = numpy.arange(1, X)              # columns 1 .. X-1
    x_neg = numpy.arange(2 * X - 1, X, -1)  # columns 2X-1 .. X+1 (wrapped)
    best_end = 0
    max_sum = 0
    for end in range(Y):
        # Row reached at each column by a line that ends at row `end`
        # on the midline.
        y = (x_pos * end) // X
        s = numpy.sum(a[y, x_pos])
        if s > max_sum:
            max_sum = s
            best_end = end
        s = numpy.sum(a[y, x_neg])
        if s > max_sum:
            max_sum = s
            best_end = -end
    return float(best_end) / X

150

151

152

def affinealign(reference, targets, max_drift=0.02):
    """ EXPERIMENTAL FUNCTION.

    Perform an affine registration between a reference and a number of
    targets.  Designed for aligning the amplitude envelopes of recordings of
    the same event by different devices.

    NOTE: This method is currently NOT USED by PiTiVi, as it has proven both
    unnecessary and unusable.  So far every test case has been registered
    successfully by rigidalign, and until PiTiVi supports time-stretching of
    audio, the drift calculation cannot actually be used.

    The input arrays are not modified; mean removal is done on copies.

    @param reference: the reference signal to which others will be registered
    @type reference: array(number)
    @param targets: the signals to register
    @type targets: ordered iterable(array(number))
    @param max_drift: the maximum absolute clock drift rate
        (i.e. stretch factor) that will be considered during search
    @type max_drift: positive L{float}
    @return: (offsets, drifts).  offsets[i] is the point in reference at which
        targets[i] starts.  drifts[i] is the speed of targets[i] relative to
        the reference (positive is faster, meaning the target should be
        slowed down to be in sync with the reference).  Both lists are
        empty when C{targets} is empty.
    """
    # targets is walked twice (lengths, then registration), so materialize
    # it in case it is a one-shot iterable.
    targets = list(targets)
    if not targets:
        return [], []

    L = len(reference) + max(len(t) for t in targets) - 1
    L2 = nextpow2(L)
    bsize = int(20. / max_drift)  # NEEDS TUNING
    num_blocks = nextpow2(1.0 * len(reference) // bsize)  # NEEDS TUNING
    bspace = (len(reference) - bsize) // num_blocks
    # Subtract the mean out of place so the caller's array is untouched.
    reference = reference - numpy.mean(reference)

    # Number of frequency bins produced by an rfft of length L2.
    num_bins = L2 // 2 + 1

    # Construct FFT'd reference blocks
    freference_blocks = numpy.zeros((num_bins, num_blocks), dtype=complex)
    for i in range(num_blocks):
        s = i * bspace
        tmp = numpy.zeros((L2,))
        tmp[s:s + bsize] = reference[s:s + bsize]
        freference_blocks[:, i] = numpy.fft.rfft(tmp, L2).conj()
    freference_blocks[:10, :] = 0  # High-pass to ignore slow volume variations

    offsets = []
    drifts = []
    for t in targets:
        t = t - numpy.mean(t)  # out of place, see above
        ft = numpy.fft.rfft(t, L2)
        # fxcorr is the FFT'd cross-correlation with the reference blocks
        fxcorr_blocks = numpy.zeros((num_bins, num_blocks), dtype=complex)
        for i in range(num_blocks):
            fxcorr_blocks[:, i] = ft * freference_blocks[:, i]
            fxcorr_blocks[:, i] /= numpy.sqrt(numpy.sum(
                fxcorr_blocks[:, i] ** 2))
        del ft
        # At this point xcorr_blocks would show a distinct bright line, nearly
        # orthogonal to time, indicating where each of these blocks found their
        # peak.  Each point on this line represents the time in t where block i
        # found its match.  The time-intercept gives the time in t at which the
        # reference starts, and the slope gives the amount by which the
        # reference is faster relative to t.

        # The challenge now is to find this line.  Our strategy is to reduce the
        # search to one dimension by first finding the slope.
        # The Fourier Transform of a smooth real line in 2D is an orthogonal
        # line through the origin, with phase that gives its position.
        # Unfortunately this line is not clearly visible in fxcorr_blocks, so
        # we discard the phase (by taking the absolute value) and then inverse
        # transform.  This places the line at the origin, so we can find its
        # slope.

        # Construct the half-autocorrelation matrix
        # (A true autocorrelation matrix would be ifft(abs(fft(x))**2), but this
        # is just ifft(abs(fft(x))).)
        # Construction is stepwise partly in an attempt to save memory
        # The width is 2*num_blocks in order to avoid overlapping positive and
        # negative correlations
        halfautocorr = numpy.fft.fft(fxcorr_blocks, 2 * num_blocks, 1)
        halfautocorr = numpy.abs(halfautocorr)
        halfautocorr = numpy.fft.ifft(halfautocorr, None, 1)
        halfautocorr = numpy.fft.irfft(halfautocorr, None, 0)
        # Now it's actually the half-autocorrelation.
        # Chop out the bit we don't care about.  The bound is a float
        # product, so truncate it to an integer row count explicitly.
        halfautocorr = halfautocorr[:int(bspace * num_blocks * max_drift), :]
        # Remove the local-correlation peak.
        # NOTE(review): for any axis longer than 2 the slice -1:2 is empty,
        # so this assignment currently changes nothing.  It presumably was
        # meant to clear the wrapped neighbourhood of the origin; left as
        # is until the intended region is confirmed and tuned.
        halfautocorr[-1:2, -1:2] = 0  # NEEDS TUNING
        # Normalize each column (appears to be necessary)
        for i in range(2 * num_blocks):
            halfautocorr[:, i] /= numpy.sqrt(numpy.sum(
                halfautocorr[:, i] ** 2))
        #from matplotlib.pyplot import imshow,show
        #imshow(halfautocorr,interpolation='nearest',aspect='auto');show()
        drift = _findslope(halfautocorr) / bspace
        del halfautocorr

        # inverse transform and shift everything into alignment
        xcorr_blocks = numpy.fft.irfft(fxcorr_blocks, None, 0)
        del fxcorr_blocks
        #TODO: see if phase ramps are worthwhile here
        for i in range(num_blocks):
            blockcenter = i * bspace + bsize // 2
            shift = int(blockcenter * drift)
            if shift:
                # Circularly move the column by `shift` samples so that
                # element k receives the old element k + shift.
                xcorr_blocks[:, i] = numpy.roll(xcorr_blocks[:, i], -shift)

        #from matplotlib.pyplot import imshow,show
        #imshow(xcorr_blocks,interpolation='nearest',aspect='auto');show()

        # xcorr is the drift-compensated cross-correlation
        xcorr = numpy.sum(xcorr_blocks, axis=1)
        del xcorr_blocks

        # int() to convert the numpy integer to a python int
        offset = int(numpy.argmax(xcorr))
        #from matplotlib.pyplot import plot,show
        #plot(xcorr);show()
        del xcorr
        if offset >= len(t):  # Negative offsets appear large and positive
            offset -= L2

        # now offset is the point in target at which reference starts and
        # drift is the speed with which the reference drifts relative to the
        # target.  We reverse these relationships for the caller.
        slope = 1 + drift
        offsets.append(-offset / slope)
        drifts.append(1 / slope - 1)
    return offsets, drifts

283

284

if __name__ == '__main__':
    # Simple command-line test: every argument names a raw file that
    # numpy.fromfile can read as an envelope.  The last file is used as
    # the reference, all files are registered against it with
    # affinealign, and the shifted, normalized envelopes are plotted.
    import sys

    from matplotlib import pyplot

    names = sys.argv[1:]
    if not names:
        sys.exit("usage: %s ENVELOPE_FILE [ENVELOPE_FILE ...]" % sys.argv[0])
    envelopes = [numpy.fromfile(n) for n in names]
    reference = envelopes[-1]
    offsets, drifts = affinealign(reference, envelopes, 0.02)
    # Written through sys.stdout so the output is "offsets drifts" under
    # both the print statement and the print function.
    sys.stdout.write("%s %s\n" % (offsets, drifts))
    pyplot.clf()
    for offset, drift, envelope in zip(offsets, drifts, envelopes):
        # Plot the mean-free envelope explicitly instead of relying on
        # affinealign having altered the input arrays.
        envelope = envelope - numpy.mean(envelope)
        t = offset + (1 + drift) * numpy.arange(len(envelope))
        pyplot.plot(t, envelope / numpy.sqrt(numpy.sum(envelope ** 2)))
    pyplot.show()

Older »