~ubuntu-branches/debian/wheezy/bzr/wheezy

Viewing changes to .pc/07_lazy_import_scope/bzrlib/fetch.py

Committer: Bazaar Package Importer
Author(s): Jelmer Vernooij, Jelmer Vernooij, John Ferlito
Date: 2011-04-05 14:38:50 UTC
Revision ID: james.westby@ubuntu.com-20110405143850-oi7cy895yzwwpeaz

Tags: 2.3.1-2

[ Jelmer Vernooij ]
* Add python-medusa, python-lzma and python-meliae as build
dependencies (used by the test suite).

[ John Ferlito ]
* Remove John Ferlito from Uploaders.

[ Jelmer Vernooij ]
* Prefer cython as build dependency.
* Remove generated C files during clean.

files added:
.pc/07_lazy_import_scope

.pc/07_lazy_import_scope/bzrlib

.pc/07_lazy_import_scope/bzrlib/api.py

.pc/07_lazy_import_scope/bzrlib/btree_index.py

.pc/07_lazy_import_scope/bzrlib/bundle

.pc/07_lazy_import_scope/bzrlib/bundle/commands.py

.pc/07_lazy_import_scope/bzrlib/bzrdir.py

.pc/07_lazy_import_scope/bzrlib/chk_map.py

.pc/07_lazy_import_scope/bzrlib/cmd_version_info.py

.pc/07_lazy_import_scope/bzrlib/commands.py

.pc/07_lazy_import_scope/bzrlib/config.py

.pc/07_lazy_import_scope/bzrlib/diff.py

.pc/07_lazy_import_scope/bzrlib/directory_service.py

.pc/07_lazy_import_scope/bzrlib/fetch.py

.pc/07_lazy_import_scope/bzrlib/foreign.py

.pc/07_lazy_import_scope/bzrlib/generate_ids.py

.pc/07_lazy_import_scope/bzrlib/hooks.py

.pc/07_lazy_import_scope/bzrlib/index.py

.pc/07_lazy_import_scope/bzrlib/inventory.py

.pc/07_lazy_import_scope/bzrlib/knit.py

.pc/07_lazy_import_scope/bzrlib/lockable_files.py

.pc/07_lazy_import_scope/bzrlib/log.py

.pc/07_lazy_import_scope/bzrlib/merge.py

.pc/07_lazy_import_scope/bzrlib/merge_directive.py

.pc/07_lazy_import_scope/bzrlib/multiparent.py

.pc/07_lazy_import_scope/bzrlib/mutabletree.py

.pc/07_lazy_import_scope/bzrlib/patiencediff.py

.pc/07_lazy_import_scope/bzrlib/plugin.py

.pc/07_lazy_import_scope/bzrlib/plugins

.pc/07_lazy_import_scope/bzrlib/plugins/launchpad

.pc/07_lazy_import_scope/bzrlib/plugins/launchpad/__init__.py

.pc/07_lazy_import_scope/bzrlib/plugins/netrc_credential_store

.pc/07_lazy_import_scope/bzrlib/plugins/netrc_credential_store/__init__.py

.pc/07_lazy_import_scope/bzrlib/repofmt

.pc/07_lazy_import_scope/bzrlib/repofmt/pack_repo.py

.pc/07_lazy_import_scope/bzrlib/repository.py

.pc/07_lazy_import_scope/bzrlib/revision.py

.pc/07_lazy_import_scope/bzrlib/sign_my_commits.py

.pc/07_lazy_import_scope/bzrlib/smart

.pc/07_lazy_import_scope/bzrlib/smart/medium.py

.pc/07_lazy_import_scope/bzrlib/trace.py

.pc/07_lazy_import_scope/bzrlib/transform.py

.pc/07_lazy_import_scope/bzrlib/transport

.pc/07_lazy_import_scope/bzrlib/transport/local.py

.pc/07_lazy_import_scope/bzrlib/tree.py

.pc/07_lazy_import_scope/bzrlib/ui

.pc/07_lazy_import_scope/bzrlib/ui/__init__.py

.pc/07_lazy_import_scope/bzrlib/ui/text.py

.pc/07_lazy_import_scope/bzrlib/versionedfile.py

.pc/07_lazy_import_scope/bzrlib/workingtree.py

.pc/07_lazy_import_scope/bzrlib/workingtree_4.py

debian/patches/07_lazy_import_scope

files modified:
.pc/applied-patches

bzrlib/api.py

bzrlib/btree_index.py

bzrlib/bundle/commands.py

bzrlib/bzrdir.py

bzrlib/chk_map.py

bzrlib/cmd_version_info.py

bzrlib/commands.py

bzrlib/config.py

bzrlib/diff.py

bzrlib/directory_service.py

bzrlib/fetch.py

bzrlib/foreign.py

bzrlib/generate_ids.py

bzrlib/hooks.py

bzrlib/index.py

bzrlib/inventory.py

bzrlib/knit.py

bzrlib/lockable_files.py

bzrlib/log.py

bzrlib/merge.py

bzrlib/merge_directive.py

bzrlib/multiparent.py

bzrlib/mutabletree.py

bzrlib/patiencediff.py

bzrlib/plugin.py

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/netrc_credential_store/__init__.py

bzrlib/repofmt/pack_repo.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/sign_my_commits.py

bzrlib/smart/medium.py

bzrlib/trace.py

bzrlib/transform.py

bzrlib/transport/local.py

bzrlib/tree.py

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/versionedfile.py

bzrlib/workingtree.py

bzrlib/workingtree_4.py

debian/changelog

debian/control

debian/patches/series

debian/rules

Show diffs side-by-side

added added

removed removed

.pc/07_lazy_import_scope/bzrlib/fetch.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA

"""Copying of history from one branch to another.

The basic plan is that every branch knows the history of everything

that has merged into it. As the first step of a merge, pull, or

branch operation we copy history from the source into the destination

branch.

"""

import operator

from bzrlib.lazy_import import lazy_import

lazy_import(globals(), """

from bzrlib import (

tsort,

versionedfile,

)

""")

import bzrlib

from bzrlib import (

errors,

ui,

)

from bzrlib.revision import NULL_REVISION

from bzrlib.trace import mutter

class RepoFetcher(object):
    """Pull revisions and texts from one repository to another.

    This should not be used directly, it's essentially an object to
    encapsulate the logic in InterRepository.fetch().

    Note that constructing an instance performs the whole fetch: __init__
    read-locks the source repository, runs the fetch and unlocks again.
    """

    def __init__(self, to_repository, from_repository, last_revision=None,
                 find_ghosts=True, fetch_spec=None):
        """Create a repo fetcher and immediately run the fetch.

        :param to_repository: The repository to copy data into; the object
            returned by its _get_sink() receives the stream.
        :param from_repository: The repository to copy data from.  It is
            read-locked for the duration of the fetch.
        :param last_revision: If set, try to limit to the data this revision
            references.
        :param find_ghosts: If True search the entire history for ghosts.
        :param fetch_spec: If not None, used as the search describing what
            to fetch instead of computing one from last_revision.
        """
        # repository.fetch has the responsibility for short-circuiting
        # attempts to copy between a repository and itself.
        self.to_repository = to_repository
        self.from_repository = from_repository
        self.sink = to_repository._get_sink()
        # must not mutate self._last_revision as it's potentially a shared
        # instance
        self._last_revision = last_revision
        self._fetch_spec = fetch_spec
        self.find_ghosts = find_ghosts
        self.from_repository.lock_read()
        try:
            # Log inside the try block so the read lock is always released,
            # even if formatting the message raises.
            mutter("Using fetch logic to copy between %s(%s) and %s(%s)",
                   self.from_repository, self.from_repository._format,
                   self.to_repository, self.to_repository._format)
            self.__fetch()
        finally:
            self.from_repository.unlock()

    def __fetch(self):
        """Primary worker function.

        This initialises all the needed variables, and then fetches the
        requested revisions, finally clearing the progress bar.
        """
        # Roughly this is what we're aiming for fetch to become:
        #
        # missing = self.sink.insert_stream(self.source.get_stream(search))
        # if missing:
        #     missing = self.sink.insert_stream(
        #         self.source.get_items(missing))
        # assert not missing
        self.count_total = 0
        self.file_ids_names = {}
        pb = ui.ui_factory.nested_progress_bar()
        pb.show_pct = pb.show_count = False
        try:
            pb.update("Finding revisions", 0, 2)
            search = self._revids_to_fetch()
            if search is None:
                # Nothing to fetch.
                return
            pb.update("Fetching revisions", 1, 2)
            self._fetch_everything_for_search(search)
        finally:
            pb.finished()

    def _fetch_everything_for_search(self, search):
        """Fetch all data for the given set of revisions.

        :param search: The search object handed to the stream source's
            get_stream().
        :raises errors.IncompatibleRepositories: if the source format has
            rich root data and the target format does not.
        :raises AssertionError: if keys are still missing, or resume tokens
            are still outstanding, after the retry.
        """
        # The first phase is "file". We pass the progress bar for it directly
        # into item_keys_introduced_by, which has more information about how
        # that phase is progressing than we do. Progress updates for the other
        # phases are taken care of in this function.
        # XXX: there should be a clear owner of the progress reporting. Perhaps
        # item_keys_introduced_by should have a richer API than it does at the
        # moment, so that it can feed the progress information back to this
        # function?
        if (self.from_repository._format.rich_root_data and
                not self.to_repository._format.rich_root_data):
            raise errors.IncompatibleRepositories(
                self.from_repository, self.to_repository,
                "different rich-root support")
        pb = ui.ui_factory.nested_progress_bar()
        try:
            pb.update("Get stream source")
            source = self.from_repository._get_source(
                self.to_repository._format)
            stream = source.get_stream(search)
            from_format = self.from_repository._format
            pb.update("Inserting stream")
            resume_tokens, missing_keys = self.sink.insert_stream(
                stream, from_format, [])
            if missing_keys:
                # Second attempt: ask the source for exactly the keys the
                # sink reported missing and resume the insertion.
                pb.update("Missing keys")
                stream = source.get_stream_for_missing_keys(missing_keys)
                pb.update("Inserting missing keys")
                resume_tokens, missing_keys = self.sink.insert_stream(
                    stream, from_format, resume_tokens)
            # NOTE(review): these two checks are placed at the same level as
            # the retry above; the nesting was reconstructed - confirm.
            if missing_keys:
                raise AssertionError(
                    "second push failed to complete a fetch %r." % (
                        missing_keys,))
            if resume_tokens:
                raise AssertionError(
                    "second push failed to commit the fetch %r." % (
                        resume_tokens,))
            pb.update("Finishing stream")
            self.sink.finished()
        finally:
            pb.finished()

    def _revids_to_fetch(self):
        """Determines the exact revisions needed from self.from_repository to
        install self._last_revision in self.to_repository.

        If a fetch_spec was supplied to the constructor it is returned
        unchanged.  If no revisions need to be fetched, then this just
        returns None.
        """
        if self._fetch_spec is not None:
            return self._fetch_spec
        mutter('fetch up to rev {%s}', self._last_revision)
        # Compare by value rather than identity: a caller may hold an equal
        # revision id in a different object, and that must still count as
        # "no revisions needed".
        if self._last_revision == NULL_REVISION:
            # explicit limit of no revisions needed
            return None
        return self.to_repository.search_missing_revision_ids(
            self.from_repository, self._last_revision,
            find_ghosts=self.find_ghosts)

162

163

164

class Inter1and2Helper(object):
    """Support code for converting data between model 1 and model 2.

    Intended for fetchers and converters.
    """

    # Kept as a class attribute so the test suite can override it.
    known_graph_threshold = 100

    def __init__(self, source):
        """Remember the repository the data is read from.

        :param source: The repository data comes from
        """
        self.source = source

    def iter_rev_trees(self, revs):
        """Yield the RevisionTree for each requested revision, in order.

        Trees are requested from the source in batches of 100.  As a side
        effect, any inventory whose revision_id is None gets it filled in
        from the tree's own revision id.

        :param revs: An iterable of revision ids
        """
        # Materialise first: revs may be any iterable, and we need slicing.
        pending = list(revs)
        for offset in range(0, len(pending), 100):
            batch = pending[offset:offset + 100]
            for rev_tree in self.source.revision_trees(batch):
                if rev_tree.inventory.revision_id is None:
                    rev_tree.inventory.revision_id = (
                        rev_tree.get_revision_id())
                yield rev_tree

    def _find_root_ids(self, revs, parent_map, graph):
        """Map revision ids to the root id of their tree.

        Covers the trees of revs (keyed by the revision recorded on the
        inventory root) plus every parent named in parent_map that graph
        reports as present and that is not already covered.

        :param revs: revision ids whose trees are inspected first
        :param parent_map: mapping whose values are iterables of parent ids
        :param graph: object providing get_parent_map()
        :return: dict of revision id -> root id
        """
        roots_by_rev = {}
        for rev_tree in self.iter_rev_trees(revs):
            root_revision = rev_tree.inventory.root.revision
            tree_root_id = rev_tree.get_root_id()
            roots_by_rev[root_revision] = tree_root_id
        # Collect every parent whose root id is still unknown.
        unknown_parents = set()
        for parent_ids in parent_map.values():
            unknown_parents.update(parent_ids)
        unknown_parents.difference_update(roots_by_rev)
        unknown_parents.discard(NULL_REVISION)
        # Only keep the ones the graph actually has.
        present_parents = list(graph.get_parent_map(unknown_parents))
        for rev_tree in self.iter_rev_trees(present_parents):
            tree_root_id = rev_tree.get_root_id()
            roots_by_rev[rev_tree.get_revision_id()] = tree_root_id
        return roots_by_rev

    def generate_root_texts(self, revs):
        """Build the 'texts' substream holding synthesised root entries.

        :param revs: the revisions to include
        :return: a one-element list [('texts', stream)]
        """
        graph = self.source.get_graph()
        parent_map = graph.get_parent_map(revs)
        topo_order = tsort.topo_sort(parent_map)
        rev_id_to_root_id = self._find_root_ids(revs, parent_map, graph)
        # The sort is stable, so entries are grouped by root id while the
        # topological order of revisions within each root id is retained.
        # File id splits and joins would invalidate this, but they don't
        # exist yet, and are unlikely to in non-rich-root environments.
        root_id_order = sorted(
            [(rev_id_to_root_id[rev_id], rev_id) for rev_id in topo_order],
            key=operator.itemgetter(0))
        # For larger requests, switch to the known-graph ancestry object.
        if len(revs) > self.known_graph_threshold:
            graph = self.source.get_known_graph_ancestry(revs)
        roots_stream = _new_root_data_stream(
            root_id_order, rev_id_to_root_id, parent_map, self.source, graph)
        return [('texts', roots_stream)]

239

240

241

def _new_root_data_stream(

242

root_keys_to_create, rev_id_to_root_id_map, parent_map, repo, graph=None):

243

"""Generate a texts substream of synthesised root entries.

244

245

Used in fetches that do rich-root upgrades.

246

247

:param root_keys_to_create: iterable of (root_id, rev_id) pairs describing

248

the root entries to create.

249

:param rev_id_to_root_id_map: dict of known rev_id -> root_id mappings for

250

calculating the parents. If a parent rev_id is not found here then it

251

will be recalculated.

252

:param parent_map: a parent map for all the revisions in

253

root_keys_to_create.

254

:param graph: a graph to use instead of repo.get_graph().

255

"""

256

for root_key in root_keys_to_create:

257

root_id, rev_id = root_key

258

parent_keys = _parent_keys_for_root_version(

259

root_id, rev_id, rev_id_to_root_id_map, parent_map, repo, graph)

260

yield versionedfile.FulltextContentFactory(

261

root_key, parent_keys, None, '')

262

263

264

def _parent_keys_for_root_version(

265

root_id, rev_id, rev_id_to_root_id_map, parent_map, repo, graph=None):

266

"""Get the parent keys for a given root id.

267

268

A helper function for _new_root_data_stream.

269

"""

270

# Include direct parents of the revision, but only if they used the same

271

# root_id and are heads.

272

rev_parents = parent_map[rev_id]

273

parent_ids = []

274

for parent_id in rev_parents:

275

if parent_id == NULL_REVISION:

276

continue

277

if parent_id not in rev_id_to_root_id_map:

278

# We probably didn't read this revision, go spend the extra effort

279

# to actually check

280

try:

281

tree = repo.revision_tree(parent_id)

282

except errors.NoSuchRevision:

283

# Ghost, fill out rev_id_to_root_id in case we encounter this

284

# again.

285

# But set parent_root_id to None since we don't really know

286

parent_root_id = None

287

else:

288

parent_root_id = tree.get_root_id()

289

rev_id_to_root_id_map[parent_id] = None

290

# XXX: why not:

291

# rev_id_to_root_id_map[parent_id] = parent_root_id

292

# memory consumption maybe?

293

else:

294

parent_root_id = rev_id_to_root_id_map[parent_id]

295

if root_id == parent_root_id:

296

# With stacking we _might_ want to refer to a non-local revision,

297

# but this code path only applies when we have the full content

298

# available, so ghosts really are ghosts, not just the edge of

299

# local data.

300

parent_ids.append(parent_id)

301

else:

302

# root_id may be in the parent anyway.

303

try:

304

tree = repo.revision_tree(parent_id)

305

except errors.NoSuchRevision:

306

# ghost, can't refer to it.

307

pass

308

else:

309

try:

310

parent_ids.append(tree.inventory[root_id].revision)

311

except errors.NoSuchId:

312

# not in the tree

313

pass

314

# Drop non-head parents

315

if graph is None:

316

graph = repo.get_graph()

317

heads = graph.heads(parent_ids)

318

selected_ids = []

319

for parent_id in parent_ids:

320

if parent_id in heads and parent_id not in selected_ids:

321

selected_ids.append(parent_id)

322

parent_keys = [(root_id, parent_id) for parent_id in selected_ids]

323

return parent_keys

Older »