/brz/remove-bazaar : revision 3251.6.5

To get this branch, use:

bzr branch
http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar

« back to all changes in this revision

Viewing changes to bzrlib/graph.py

Committer: John Arbash Meinel
Date: 2008-06-05 16:27:16 UTC
mfrom: (3475 +trunk)
mto: This revision was merged to the branch mainline in revision 3476.
Revision ID: john@arbash-meinel.com-20080605162716-a3hn238tnctbfd8j

merge bzr.dev, resolve NEWS

files added:
bzrlib/directory_service.py

bzrlib/smart/message.py

bzrlib/tests/blackbox/test_alias.py

bzrlib/tests/blackbox/test_hooks.py

bzrlib/tests/branch_implementations/test_check.py

bzrlib/tests/branch_implementations/test_reconcile.py

bzrlib/tests/file_utils.py

bzrlib/tests/interrepository_implementations/test_fetch.py

bzrlib/tests/repository_implementations/test_get_parent_map.py

bzrlib/tests/test_directory_service.py

bzrlib/tests/test_mutabletree.py

bzrlib/tests/test_uncommit.py

bzrlib/tests/tree_implementations/test_annotate_iter.py

bzrlib/transport/nosmart.py

bzrlib/xml5.py

bzrlib/xml6.py

doc/developers/integration.txt

doc/developers/plugin-api.txt

doc/developers/releasing.txt

doc/developers/repository-stream.txt

doc/developers/tortoise-strategy.txt

doc/en/admin-guide

doc/en/admin-guide/index.txt

doc/en/user-guide/bzrtools_plugin.txt

doc/en/user-guide/svn_plugin.txt

doc/en/user-guide/web_browsing.txt

doc/es

doc/es/guia-desarrollador

doc/es/guia-usuario

doc/es/guia-usuario/index.txt

doc/es/guia-usuario/resolving_conflicts.txt

doc/es/guia-usuario/version_info.txt

doc/es/mini-tutorial

doc/es/mini-tutorial/index.txt

doc/es/notas-version

doc/es/referencia

doc/es/referencia-rapida

doc/es/referencia-rapida/Makefile

doc/es/referencia-rapida/referencia-rapida.svg

doc/index.es.txt

files removed:
bzrlib/xml6.py

files renamed:
bzrlib/plugins/launchpad/lp_indirect.py => bzrlib/plugins/launchpad/lp_directory.py

bzrlib/plugins/launchpad/test_lp_indirect.py => bzrlib/plugins/launchpad/test_lp_directory.py

bzrlib/tests/test_revisionnamespaces.py => bzrlib/tests/test_revisionspec.py

bzrlib/xml5.py => bzrlib/xml8.py

doc/en/user-guide/best_practice_intro.txt => doc/en/user-guide/part2_intro.txt

files modified:
Makefile

NEWS

README

bzrlib/__init__.py

bzrlib/_dirstate_helpers_py.py

bzrlib/_knit_load_data_c.pyx

bzrlib/_knit_load_data_py.py

bzrlib/_patiencediff_py.py

bzrlib/add.py

bzrlib/annotate.py

bzrlib/atomicfile.py

bzrlib/benchmarks/bench_bundle.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/branch.py

bzrlib/bugtracker.py

bzrlib/builtins.py

bzrlib/bundle/__init__.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/serializer/v08.py

bzrlib/bundle/serializer/v4.py

bzrlib/bzrdir.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/counted_lock.py

bzrlib/debug.py

bzrlib/delta.py

bzrlib/deprecated_graph.py

bzrlib/diff.py

bzrlib/dirstate.py

bzrlib/doc/__init__.py

bzrlib/doc/api/__init__.py

bzrlib/errors.py

bzrlib/fetch.py

bzrlib/graph.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/help_topics/__init__.py

bzrlib/help_topics/en/authentication.txt

bzrlib/help_topics/en/configuration.txt

bzrlib/help_topics/en/hooks.txt

bzrlib/hooks.py

bzrlib/index.py

bzrlib/info.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/knit.py

bzrlib/lazy_import.py

bzrlib/lazy_regex.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lru_cache.py

bzrlib/mail_client.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/merge_directive.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/multiparent.py

bzrlib/mutabletree.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/patches.py

bzrlib/plugin.py

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/progress.py

bzrlib/reconcile.py

bzrlib/reconfigure.py

bzrlib/registry.py

bzrlib/remote.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/pack_repo.py

bzrlib/repofmt/weaverepo.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/smart/branch.py

bzrlib/smart/bzrdir.py

bzrlib/smart/client.py

bzrlib/smart/medium.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/server.py

bzrlib/smart/vfs.py

bzrlib/status.py

bzrlib/store/__init__.py

bzrlib/store/revision/knit.py

bzrlib/store/revision/text.py

bzrlib/store/versioned/__init__.py

bzrlib/symbol_versioning.py

bzrlib/testament.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_reconfigure.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_send.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_switch.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_version.py

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_branch.py

bzrlib/tests/branch_implementations/test_commit.py

bzrlib/tests/branch_implementations/test_hooks.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/branch_implementations/test_push.py

bzrlib/tests/branch_implementations/test_uncommit.py

bzrlib/tests/branch_implementations/test_update.py

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/commands/__init__.py

bzrlib/tests/ftp_server.py

bzrlib/tests/http_server.py

bzrlib/tests/http_utils.py

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/intertree_implementations/__init__.py

bzrlib/tests/intertree_implementations/test_compare.py

bzrlib/tests/interversionedfile_implementations/__init__.py

bzrlib/tests/interversionedfile_implementations/test_join.py

bzrlib/tests/inventory_implementations/__init__.py

bzrlib/tests/per_lock/__init__.py

bzrlib/tests/repository_implementations/__init__.py

bzrlib/tests/repository_implementations/test_check_reconcile.py

bzrlib/tests/repository_implementations/test_fetch.py

bzrlib/tests/repository_implementations/test_has_same_location.py

bzrlib/tests/repository_implementations/test_iter_reverse_revision_history.py

bzrlib/tests/repository_implementations/test_reconcile.py

bzrlib/tests/repository_implementations/test_repository.py

bzrlib/tests/repository_implementations/test_revision.py

bzrlib/tests/revisionstore_implementations/__init__.py

bzrlib/tests/revisionstore_implementations/test_all.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_bugtracker.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_hooks.py

bzrlib/tests/test_http.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_mail_client.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_merge_directive.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_reconfigure.py

bzrlib/tests/test_registry.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_source.py

bzrlib/tests/test_status.py

bzrlib/tests/test_store.py

bzrlib/tests/test_strace.py

bzrlib/tests/test_subsume.py

bzrlib/tests/test_switch.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/test_wsgi.py

bzrlib/tests/test_xml.py

bzrlib/tests/transport_util.py

bzrlib/tests/tree_implementations/__init__.py

bzrlib/tests/tree_implementations/test_inv.py

bzrlib/tests/tree_implementations/test_test_trees.py

bzrlib/tests/treeshape.py

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_add_reference.py

bzrlib/tests/workingtree_implementations/test_basis_inventory.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_locking.py

bzrlib/tests/workingtree_implementations/test_merge_from_branch.py

bzrlib/tests/workingtree_implementations/test_parents.py

bzrlib/tests/workingtree_implementations/test_set_root_id.py

bzrlib/tests/workingtree_implementations/test_walkdirs.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/textinv.py

bzrlib/textui.py

bzrlib/timestamp.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport/__init__.py

bzrlib/transport/chroot.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/ftp.py

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/response.py

bzrlib/transport/http/wsgi.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/remote.py

bzrlib/transport/sftp.py

bzrlib/transport/ssh.py

bzrlib/tree.py

bzrlib/treebuilder.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui/__init__.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/urlutils.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/version.py

bzrlib/version_info_formats/__init__.py

bzrlib/versionedfile.py

bzrlib/weave.py

bzrlib/weavefile.py

bzrlib/workingtree.py

bzrlib/workingtree_4.py

bzrlib/xml4.py

bzrlib/xml_serializer.py

doc/default.css

doc/developers/HACKING.txt

doc/developers/authentication-ring.txt

doc/developers/index.txt

doc/developers/lca-merge.txt

doc/developers/network-protocol.txt

doc/developers/repository.txt

doc/en/mini-tutorial/index.txt

doc/en/user-guide/annotating_changes.txt

doc/en/user-guide/bazaar_workflows.txt

doc/en/user-guide/branching_a_project.txt

doc/en/user-guide/bug_trackers.txt

doc/en/user-guide/configuring_bazaar.txt

doc/en/user-guide/controlling_registration.txt

doc/en/user-guide/core_concepts.txt

doc/en/user-guide/distributed_intro.txt

doc/en/user-guide/hooks.txt

doc/en/user-guide/http_smart_server.txt

doc/en/user-guide/index.txt

doc/en/user-guide/installing_bazaar.txt

doc/en/user-guide/introducing_bazaar.txt

doc/en/user-guide/partner_intro.txt

doc/en/user-guide/releasing_a_project.txt

doc/en/user-guide/resolving_conflicts.txt

doc/en/user-guide/sending_changes.txt

doc/en/user-guide/undoing_mistakes.txt

doc/en/user-guide/version_info.txt

doc/index.txt

setup.py

Show diffs side-by-side

added added

removed removed

bzrlib/graph.py

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

import time

from bzrlib import (

debug,

errors,

revision,

symbol_versioning,

trace,

tsort,

)

from bzrlib.deprecated_graph import (node_distances, select_farthest)

STEP_UNIQUE_SEARCHER_EVERY = 5

# DIAGRAM of terminology

# A

# /\

199

205

200

206

def find_difference(self, left_revision, right_revision):

201

207

"""Determine the graph difference between two revisions"""

202

border, common, (left, right) = self._find_border_ancestors(

208

border, common, searchers = self._find_border_ancestors(

203

209

[left_revision, right_revision])

204

return (left.difference(right).difference(common),

205

right.difference(left).difference(common))

210

self._search_for_extra_common(common, searchers)

211

left = searchers[0].seen

212

right = searchers[1].seen

213

return (left.difference(right), right.difference(left))

214

215

def find_distance_to_null(self, target_revision_id, known_revision_ids):

216

"""Find the left-hand distance to the NULL_REVISION.

217

218

(This can also be considered the revno of a branch at

219

target_revision_id.)

220

221

:param target_revision_id: A revision_id which we would like to know

222

the revno for.

223

:param known_revision_ids: [(revision_id, revno)] A list of known

224

(revision_id, revno) tuples. We'll use this to seed the search.

225

"""

226

# Map from revision_ids to a known value for their revno

227

known_revnos = dict(known_revision_ids)

228

cur_tip = target_revision_id

229

num_steps = 0

230

NULL_REVISION = revision.NULL_REVISION

231

known_revnos[NULL_REVISION] = 0

232

233

searching_known_tips = list(known_revnos.keys())

234

235

unknown_searched = {}

236

237

while cur_tip not in known_revnos:

238

unknown_searched[cur_tip] = num_steps

239

num_steps += 1

240

to_search = set([cur_tip])

241

to_search.update(searching_known_tips)

242

parent_map = self.get_parent_map(to_search)

243

parents = parent_map.get(cur_tip, None)

244

if not parents: # An empty list or None is a ghost

245

raise errors.GhostRevisionsHaveNoRevno(target_revision_id,

246

cur_tip)

247

cur_tip = parents[0]

248

next_known_tips = []

249

for revision_id in searching_known_tips:

250

parents = parent_map.get(revision_id, None)

251

if not parents:

252

continue

253

next = parents[0]

254

next_revno = known_revnos[revision_id] - 1

255

if next in unknown_searched:

256

# We have enough information to return a value right now

257

return next_revno + unknown_searched[next]

258

if next in known_revnos:

259

continue

260

known_revnos[next] = next_revno

261

next_known_tips.append(next)

262

searching_known_tips = next_known_tips

263

264

# We reached a known revision, so just add in how many steps it took to

265

# get there.

266

return known_revnos[cur_tip] + num_steps

267

268

def find_unique_ancestors(self, unique_revision, common_revisions):

269

"""Find the unique ancestors for a revision versus others.

270

271

This returns the ancestry of unique_revision, excluding all revisions

272

in the ancestry of common_revisions. If unique_revision is in the

273

ancestry, then the empty set will be returned.

274

275

:param unique_revision: The revision_id whose ancestry we are

276

interested in.

277

XXX: Would this API be better if we allowed multiple revisions

278

to be searched here?

279

:param common_revisions: Revision_ids of ancestries to exclude.

280

:return: A set of revisions in the ancestry of unique_revision

281

"""

282

if unique_revision in common_revisions:

283

return set()

284

285

# Algorithm description

286

# 1) Walk backwards from the unique node and all common nodes.

287

# 2) When a node is seen by both sides, stop searching it in the unique

288

# walker, include it in the common walker.

289

# 3) Stop searching when there are no nodes left for the unique walker.

290

# At this point, you have a maximal set of unique nodes. Some of

291

# them may actually be common, and you haven't reached them yet.

292

# 4) Start new searchers for the unique nodes, seeded with the

293

# information you have so far.

294

# 5) Continue searching, stopping the common searches when the search

295

# tip is an ancestor of all unique nodes.

296

# 6) Aggregate together unique searchers when they are searching the

297

# same tips. When all unique searchers are searching the same node,

298

# stop and move it to a single 'all_unique_searcher'.

299

# 7) The 'all_unique_searcher' represents the very 'tip' of searching.

300

# Most of the time this produces very little important information.

301

# So don't step it as quickly as the other searchers.

302

# 8) Search is done when all common searchers have completed.

303

304

unique_searcher, common_searcher = self._find_initial_unique_nodes(

305

[unique_revision], common_revisions)

306

307

unique_nodes = unique_searcher.seen.difference(common_searcher.seen)

308

if not unique_nodes:

309

return unique_nodes

310

311

(all_unique_searcher,

312

unique_tip_searchers) = self._make_unique_searchers(unique_nodes,

313

unique_searcher, common_searcher)

314

315

self._refine_unique_nodes(unique_searcher, all_unique_searcher,

316

unique_tip_searchers, common_searcher)

317

true_unique_nodes = unique_nodes.difference(common_searcher.seen)

318

if 'graph' in debug.debug_flags:

319

trace.mutter('Found %d truly unique nodes out of %d',

320

len(true_unique_nodes), len(unique_nodes))

321

return true_unique_nodes

322

323

def _find_initial_unique_nodes(self, unique_revisions, common_revisions):

324

"""Steps 1-3 of find_unique_ancestors.

325

326

Find the maximal set of unique nodes. Some of these might actually

327

still be common, but we are sure that there are no other unique nodes.

328

329

:return: (unique_searcher, common_searcher)

330

"""

331

332

unique_searcher = self._make_breadth_first_searcher(unique_revisions)

333

# we know that unique_revisions aren't in common_revisions, so skip

334

# past them.

335

unique_searcher.next()

336

common_searcher = self._make_breadth_first_searcher(common_revisions)

337

338

# As long as we are still finding unique nodes, keep searching

339

while unique_searcher._next_query:

340

next_unique_nodes = set(unique_searcher.step())

341

next_common_nodes = set(common_searcher.step())

342

343

# Check if either searcher encounters new nodes seen by the other

344

# side.

345

unique_are_common_nodes = next_unique_nodes.intersection(

346

common_searcher.seen)

347

unique_are_common_nodes.update(

348

next_common_nodes.intersection(unique_searcher.seen))

349

if unique_are_common_nodes:

350

ancestors = unique_searcher.find_seen_ancestors(

351

unique_are_common_nodes)

352

# TODO: This is a bit overboard, we only really care about

353

# the ancestors of the tips because the rest we

354

# already know. This is *correct* but causes us to

355

# search too much ancestry.

356

ancestors.update(common_searcher.find_seen_ancestors(ancestors))

357

unique_searcher.stop_searching_any(ancestors)

358

common_searcher.start_searching(ancestors)

359

360

return unique_searcher, common_searcher

361

362

def _make_unique_searchers(self, unique_nodes, unique_searcher,

363

common_searcher):

364

"""Create a searcher for all the unique search tips (step 4).

365

366

As a side effect, the common_searcher will stop searching any nodes

367

that are ancestors of the unique searcher tips.

368

369

:return: (all_unique_searcher, unique_tip_searchers)

370

"""

371

unique_tips = self._remove_simple_descendants(unique_nodes,

372

self.get_parent_map(unique_nodes))

373

374

if len(unique_tips) == 1:

375

unique_tip_searchers = []

376

ancestor_all_unique = unique_searcher.find_seen_ancestors(unique_tips)

377

else:

378

unique_tip_searchers = []

379

for tip in unique_tips:

380

revs_to_search = unique_searcher.find_seen_ancestors([tip])

381

revs_to_search.update(

382

common_searcher.find_seen_ancestors(revs_to_search))

383

searcher = self._make_breadth_first_searcher(revs_to_search)

384

# We don't care about the starting nodes.

385

searcher._label = tip

386

searcher.step()

387

unique_tip_searchers.append(searcher)

388

389

ancestor_all_unique = None

390

for searcher in unique_tip_searchers:

391

if ancestor_all_unique is None:

392

ancestor_all_unique = set(searcher.seen)

393

else:

394

ancestor_all_unique = ancestor_all_unique.intersection(

395

searcher.seen)

396

# Collapse all the common nodes into a single searcher

397

all_unique_searcher = self._make_breadth_first_searcher(

398

ancestor_all_unique)

399

if ancestor_all_unique:

400

# We've seen these nodes in all the searchers, so we'll just go to

401

# the next

402

all_unique_searcher.step()

403

404

# Stop any search tips that are already known as ancestors of the

405

# unique nodes

406

stopped_common = common_searcher.stop_searching_any(

407

common_searcher.find_seen_ancestors(ancestor_all_unique))

408

409

total_stopped = 0

410

for searcher in unique_tip_searchers:

411

total_stopped += len(searcher.stop_searching_any(

412

searcher.find_seen_ancestors(ancestor_all_unique)))

413

if 'graph' in debug.debug_flags:

414

trace.mutter('For %d unique nodes, created %d + 1 unique searchers'

415

' (%d stopped search tips, %d common ancestors'

416

' (%d stopped common)',

417

len(unique_nodes), len(unique_tip_searchers),

418

total_stopped, len(ancestor_all_unique),

419

len(stopped_common))

420

return all_unique_searcher, unique_tip_searchers

421

422

def _step_unique_and_common_searchers(self, common_searcher,

423

unique_tip_searchers,

424

unique_searcher):

425

"""Step all the searchers"""

426

newly_seen_common = set(common_searcher.step())

427

newly_seen_unique = set()

428

for searcher in unique_tip_searchers:

429

next = set(searcher.step())

430

next.update(unique_searcher.find_seen_ancestors(next))

431

next.update(common_searcher.find_seen_ancestors(next))

432

for alt_searcher in unique_tip_searchers:

433

if alt_searcher is searcher:

434

continue

435

next.update(alt_searcher.find_seen_ancestors(next))

436

searcher.start_searching(next)

437

newly_seen_unique.update(next)

438

return newly_seen_common, newly_seen_unique

439

440

def _find_nodes_common_to_all_unique(self, unique_tip_searchers,

441

all_unique_searcher,

442

newly_seen_unique, step_all_unique):

443

"""Find nodes that are common to all unique_tip_searchers.

444

445

If it is time, step the all_unique_searcher, and add its nodes to the

446

result.

447

"""

448

common_to_all_unique_nodes = newly_seen_unique.copy()

449

for searcher in unique_tip_searchers:

450

common_to_all_unique_nodes.intersection_update(searcher.seen)

451

common_to_all_unique_nodes.intersection_update(

452

all_unique_searcher.seen)

453

# Step all-unique less frequently than the other searchers.

454

# In the common case, we don't need to spider out far here, so

455

# avoid doing extra work.

456

if step_all_unique:

457

tstart = time.clock()

458

nodes = all_unique_searcher.step()

459

common_to_all_unique_nodes.update(nodes)

460

if 'graph' in debug.debug_flags:

461

tdelta = time.clock() - tstart

462

trace.mutter('all_unique_searcher step() took %.3fs'

463

'for %d nodes (%d total), iteration: %s',

464

tdelta, len(nodes), len(all_unique_searcher.seen),

465

all_unique_searcher._iterations)

466

return common_to_all_unique_nodes

467

468

def _collapse_unique_searchers(self, unique_tip_searchers,

469

common_to_all_unique_nodes):

470

"""Combine searchers that are searching the same tips.

471

472

When two searchers are searching the same tips, we can stop one of the

473

searchers. We also know that the maximal set of common ancestors is the

474

intersection of the two original searchers.

475

476

:return: A list of searchers that are searching unique nodes.

477

"""

478

# Filter out searchers that don't actually search different

479

# nodes. We already have the ancestry intersection for them

480

unique_search_tips = {}

481

for searcher in unique_tip_searchers:

482

stopped = searcher.stop_searching_any(common_to_all_unique_nodes)

483

will_search_set = frozenset(searcher._next_query)

484

if not will_search_set:

485

if 'graph' in debug.debug_flags:

486

trace.mutter('Unique searcher %s was stopped.'

487

' (%s iterations) %d nodes stopped',

488

searcher._label,

489

searcher._iterations,

490

len(stopped))

491

elif will_search_set not in unique_search_tips:

492

# This searcher is searching a unique set of nodes, let it

493

unique_search_tips[will_search_set] = [searcher]

494

else:

495

unique_search_tips[will_search_set].append(searcher)

496

# TODO: it might be possible to collapse searchers faster when they

497

# only have *some* search tips in common.

498

next_unique_searchers = []

499

for searchers in unique_search_tips.itervalues():

500

if len(searchers) == 1:

501

# Searching unique tips, go for it

502

next_unique_searchers.append(searchers[0])

503

else:

504

# These searchers have started searching the same tips, we

505

# don't need them to cover the same ground. The

506

# intersection of their ancestry won't change, so create a

507

# new searcher, combining their histories.

508

next_searcher = searchers[0]

509

for searcher in searchers[1:]:

510

next_searcher.seen.intersection_update(searcher.seen)

511

if 'graph' in debug.debug_flags:

512

trace.mutter('Combining %d searchers into a single'

513

' searcher searching %d nodes with'

514

' %d ancestry',

515

len(searchers),

516

len(next_searcher._next_query),

517

len(next_searcher.seen))

518

next_unique_searchers.append(next_searcher)

519

return next_unique_searchers

520

521

def _refine_unique_nodes(self, unique_searcher, all_unique_searcher,

522

unique_tip_searchers, common_searcher):

523

"""Steps 5-8 of find_unique_ancestors.

524

525

This function returns when common_searcher has stopped searching for

526

more nodes.

527

"""

528

# We step the ancestor_all_unique searcher only every

529

# STEP_UNIQUE_SEARCHER_EVERY steps.

530

step_all_unique_counter = 0

531

# While we still have common nodes to search

532

while common_searcher._next_query:

533

(newly_seen_common,

534

newly_seen_unique) = self._step_unique_and_common_searchers(

535

common_searcher, unique_tip_searchers, unique_searcher)

536

# These nodes are common ancestors of all unique nodes

537

common_to_all_unique_nodes = self._find_nodes_common_to_all_unique(

538

unique_tip_searchers, all_unique_searcher, newly_seen_unique,

539

step_all_unique_counter==0)

540

step_all_unique_counter = ((step_all_unique_counter + 1)

541

% STEP_UNIQUE_SEARCHER_EVERY)

542

543

if newly_seen_common:

544

# If a 'common' node is an ancestor of all unique searchers, we

545

# can stop searching it.

546

common_searcher.stop_searching_any(

547

all_unique_searcher.seen.intersection(newly_seen_common))

548

if common_to_all_unique_nodes:

549

common_to_all_unique_nodes.update(

550

common_searcher.find_seen_ancestors(

551

common_to_all_unique_nodes))

552

# The all_unique searcher can start searching the common nodes

553

# but everyone else can stop.

554

# This is the sort of thing where we would like to not have it

555

# start_searching all of the nodes, but only mark all of them

556

# as seen, and have it search only the actual tips. Otherwise

557

# it is another get_parent_map() traversal for it to figure out

558

# what we already should know.

559

all_unique_searcher.start_searching(common_to_all_unique_nodes)

560

common_searcher.stop_searching_any(common_to_all_unique_nodes)

561

562

next_unique_searchers = self._collapse_unique_searchers(

563

unique_tip_searchers, common_to_all_unique_nodes)

564

if len(unique_tip_searchers) != len(next_unique_searchers):

565

if 'graph' in debug.debug_flags:

566

trace.mutter('Collapsed %d unique searchers => %d'

567

' at %s iterations',

568

len(unique_tip_searchers),

569

len(next_unique_searchers),

570

all_unique_searcher._iterations)

571

unique_tip_searchers = next_unique_searchers

206

572

207

573

@symbol_versioning.deprecated_method(symbol_versioning.one_one)

208

574

def get_parents(self, revisions):

220

586

Deprecated in bzr 1.2 - please see get_parent_map.

221

587

"""

222

588

parents = self.get_parent_map(revisions)

223

return [parent.get(r, None) for r in revisions]

589

return [parents.get(r, None) for r in revisions]

224

590

225

591

def get_parent_map(self, revisions):

226

592

"""Get a map of key:parent_list for revisions.

253

619

"""

254

620

if None in revisions:

255

621

raise errors.InvalidRevisionId(None, self)

256

common_searcher = self._make_breadth_first_searcher([])

257

622

common_ancestors = set()

258

623

searchers = [self._make_breadth_first_searcher([r])

259

624

for r in revisions]

260

625

active_searchers = searchers[:]

261

626

border_ancestors = set()

262

def update_common(searcher, revisions):

263

w_seen_ancestors = searcher.find_seen_ancestors(

264

revision)

265

stopped = searcher.stop_searching_any(w_seen_ancestors)

266

common_ancestors.update(w_seen_ancestors)

267

common_searcher.start_searching(stopped)

268

627

269

628

while True:

270

if len(active_searchers) == 0:

271

return border_ancestors, common_ancestors, [s.seen for s in

272

searchers]

273

try:

274

new_common = common_searcher.next()

275

common_ancestors.update(new_common)

276

except StopIteration:

277

pass

278

else:

279

for searcher in active_searchers:

280

for revision in new_common.intersection(searcher.seen):

281

update_common(searcher, revision)

282

283

629

newly_seen = set()

284

new_active_searchers = []

285

for searcher in active_searchers:

286

try:

287

newly_seen.update(searcher.next())

288

except StopIteration:

289

pass

290

else:

291

new_active_searchers.append(searcher)

292

active_searchers = new_active_searchers

630

for searcher in searchers:

631

new_ancestors = searcher.step()

632

if new_ancestors:

633

newly_seen.update(new_ancestors)

634

new_common = set()

293

635

for revision in newly_seen:

294

636

if revision in common_ancestors:

295

for searcher in searchers:

296

update_common(searcher, revision)

637

# Not a border ancestor because it was seen as common

638

# already

639

new_common.add(revision)

297

640

continue

298

641

for searcher in searchers:

299

642

if revision not in searcher.seen:

300

643

break

301

644

else:

645

# This is a border because it is a first common that we see

646

# after walking for a while.

302

647

border_ancestors.add(revision)

303

for searcher in searchers:

304

update_common(searcher, revision)

648

new_common.add(revision)

649

if new_common:

650

for searcher in searchers:

651

new_common.update(searcher.find_seen_ancestors(new_common))

652

for searcher in searchers:

653

searcher.start_searching(new_common)

654

common_ancestors.update(new_common)

655

656

# Figure out what the searchers will be searching next, and if

657

# there is only 1 set being searched, then we are done searching,

658

# since all searchers would have to be searching the same data,

659

# thus it *must* be in common.

660

unique_search_sets = set()

661

for searcher in searchers:

662

will_search_set = frozenset(searcher._next_query)

663

if will_search_set not in unique_search_sets:

664

# This searcher is searching a unique set of nodes, let it

665

unique_search_sets.add(will_search_set)

666

667

if len(unique_search_sets) == 1:

668

nodes = unique_search_sets.pop()

669

uncommon_nodes = nodes.difference(common_ancestors)

670

if uncommon_nodes:

671

raise AssertionError("Somehow we ended up converging"

672

" without actually marking them as"

673

" in common."

674

"\nStart_nodes: %s"

675

"\nuncommon_nodes: %s"

676

% (revisions, uncommon_nodes))

677

break

678

return border_ancestors, common_ancestors, searchers

305

679

306

680

def heads(self, keys):

307

681

"""Return the heads from amongst keys.

387

761

new_common.add(ancestor)

388

762

for searcher in searchers.itervalues():

389

763

seen_ancestors =\

390

searcher.find_seen_ancestors(ancestor)

764

searcher.find_seen_ancestors([ancestor])

391

765

searcher.stop_searching_any(seen_ancestors)

392

766

common_walker.start_searching(new_common)

393

767

return candidate_heads

424

798

raise errors.NoCommonAncestor(left_revision, right_revision)

425

799

revisions = lca

426

800

801

def iter_ancestry(self, revision_ids):
    """Walk the ancestry of the given revisions, one generation at a time.

    :param revision_ids: Nodes to start the search
    :return: A generator of (revision_id, parents) tuples covering the
        ancestry of revision_ids. Revisions known to get_parent_map()
        are yielded exactly as it reports them (so, as defined by
        get_parent_map, a node with no parents has NULL_REVISION as its
        only parent and NULL_REVISION itself appears with ()).
        Requested revisions that get_parent_map() does not return are
        ghosts and are yielded as (revision_id, None).
    """
    queued = set(revision_ids)
    visited = set()
    while queued:
        # Record the whole batch as visited before looking at parents, so
        # a parent that is part of this batch (or an earlier one) is never
        # queued a second time.
        visited.update(queued)
        found = self.get_parent_map(queued)
        upcoming = set()
        for revision_id, parent_ids in found.iteritems():
            yield (revision_id, parent_ids)
            for parent_id in parent_ids:
                if parent_id not in visited:
                    upcoming.add(parent_id)
        # Whatever we asked about but did not get back is a ghost.
        for ghost in queued.difference(found):
            yield (ghost, None)
        queued = upcoming

825

427

826

def iter_topo_order(self, revisions):

428

827

"""Iterate through the input revisions in topological order.

429

828

444

843

return set([candidate_descendant]) == self.heads(

445

844

[candidate_ancestor, candidate_descendant])

446

845

846

def _search_for_extra_common(self, common, searchers):

847

"""Make sure that unique nodes are genuinely unique.

848

849

After _find_border_ancestors, all nodes marked "common" are indeed

850

common. Some of the nodes considered unique are not, due to history

851

shortcuts stopping the searches early.

852

853

We know that we have searched enough when all common search tips are

854

descended from all unique (uncommon) nodes because we know that a node

855

cannot be an ancestor of its own ancestor.

856

857

:param common: A set of common nodes

858

:param searchers: The searchers returned from _find_border_ancestors

859

:return: None

860

"""

861

# Basic algorithm...

862

# A) The passed in searchers should all be on the same tips, thus

863

# they should be considered the "common" searchers.

864

# B) We find the difference between the searchers, these are the

865

# "unique" nodes for each side.

866

# C) We do a quick culling so that we only start searching from the

867

# more interesting unique nodes. (A unique ancestor is more

868

# interesting than any of its children.)

869

# D) We start searching for ancestors common to all unique nodes.

870

# E) We have the common searchers stop searching any ancestors of

871

# nodes found by (D)

872

# F) When there are no more common search tips, we stop

873

874

# TODO: We need a way to remove unique_searchers when they overlap with

875

# other unique searchers.

876

if len(searchers) != 2:

877

raise NotImplementedError(

878

"Algorithm not yet implemented for > 2 searchers")

879

common_searchers = searchers

880

left_searcher = searchers[0]

881

right_searcher = searchers[1]

882

unique = left_searcher.seen.symmetric_difference(right_searcher.seen)

883

if not unique: # No unique nodes, nothing to do

884

return

885

total_unique = len(unique)

886

unique = self._remove_simple_descendants(unique,

887

self.get_parent_map(unique))

888

simple_unique = len(unique)

889

890

unique_searchers = []

891

for revision_id in unique:

892

if revision_id in left_searcher.seen:

893

parent_searcher = left_searcher

894

else:

895

parent_searcher = right_searcher

896

revs_to_search = parent_searcher.find_seen_ancestors([revision_id])

897

if not revs_to_search: # XXX: This shouldn't be possible

898

revs_to_search = [revision_id]

899

searcher = self._make_breadth_first_searcher(revs_to_search)

900

# We don't care about the starting nodes.

901

searcher.step()

902

unique_searchers.append(searcher)

903

904

# possible todo: aggregate the common searchers into a single common

905

# searcher, just make sure that we include the nodes into the .seen

906

# properties of the original searchers

907

908

ancestor_all_unique = None

909

for searcher in unique_searchers:

910

if ancestor_all_unique is None:

911

ancestor_all_unique = set(searcher.seen)

912

else:

913

ancestor_all_unique = ancestor_all_unique.intersection(

914

searcher.seen)

915

916

trace.mutter('Started %s unique searchers for %s unique revisions',

917

simple_unique, total_unique)

918

919

while True: # If we have no more nodes we have nothing to do

920

newly_seen_common = set()

921

for searcher in common_searchers:

922

newly_seen_common.update(searcher.step())

923

newly_seen_unique = set()

924

for searcher in unique_searchers:

925

newly_seen_unique.update(searcher.step())

926

new_common_unique = set()

927

for revision in newly_seen_unique:

928

for searcher in unique_searchers:

929

if revision not in searcher.seen:

930

break

931

else:

932

# This is a border because it is a first common that we see

933

# after walking for a while.

934

new_common_unique.add(revision)

935

if newly_seen_common:

936

# These are nodes descended from one of the 'common' searchers.

937

# Make sure all searchers are on the same page

938

for searcher in common_searchers:

939

newly_seen_common.update(

940

searcher.find_seen_ancestors(newly_seen_common))

941

# We start searching the whole ancestry. It is a bit wasteful,

942

# though. We really just want to mark all of these nodes as

943

# 'seen' and then start just the tips. However, it requires a

944

# get_parent_map() call to figure out the tips anyway, and all

945

# redundant requests should be fairly fast.

946

for searcher in common_searchers:

947

searcher.start_searching(newly_seen_common)

948

949

# If a 'common' node is an ancestor of all unique searchers, we

950

# can stop searching it.

951

stop_searching_common = ancestor_all_unique.intersection(

952

newly_seen_common)

953

if stop_searching_common:

954

for searcher in common_searchers:

955

searcher.stop_searching_any(stop_searching_common)

956

if new_common_unique:

957

# We found some ancestors that are common

958

for searcher in unique_searchers:

959

new_common_unique.update(

960

searcher.find_seen_ancestors(new_common_unique))

961

# Since these are common, we can grab another set of ancestors

962

# that we have seen

963

for searcher in common_searchers:

964

new_common_unique.update(

965

searcher.find_seen_ancestors(new_common_unique))

966

967

# We can tell all of the unique searchers to start at these

968

# nodes, and tell all of the common searchers to *stop*

969

# searching these nodes

970

for searcher in unique_searchers:

971

searcher.start_searching(new_common_unique)

972

for searcher in common_searchers:

973

searcher.stop_searching_any(new_common_unique)

974

ancestor_all_unique.update(new_common_unique)

975

976

# Filter out searchers that don't actually search different

977

# nodes. We already have the ancestry intersection for them

978

next_unique_searchers = []

979

unique_search_sets = set()

980

for searcher in unique_searchers:

981

will_search_set = frozenset(searcher._next_query)

982

if will_search_set not in unique_search_sets:

983

# This searcher is searching a unique set of nodes, let it

984

unique_search_sets.add(will_search_set)

985

next_unique_searchers.append(searcher)

986

unique_searchers = next_unique_searchers

987

for searcher in common_searchers:

988

if searcher._next_query:

989

break

990

else:

991

# All common searcher have stopped searching

992

return

993

994

def _remove_simple_descendants(self, revisions, parent_map):

995

"""remove revisions which are children of other ones in the set

996

997

This doesn't do any graph searching, it just checks the immediate

998

parent_map to find if there are any children which can be removed.

999

1000

:param revisions: A set of revision_ids

1001

:return: A set of revision_ids with the children removed

1002

"""

1003

simple_ancestors = revisions.copy()

1004

# TODO: jam 20071214 we *could* restrict it to searching only the

1005

# parent_map of revisions already present in 'revisions', but

1006

# considering the general use case, I think this is actually

1007

# better.

1008

1009

# This is the same as the following loop. I don't know that it is any

1010

# faster.

1011

## simple_ancestors.difference_update(r for r, p_ids in parent_map.iteritems()

1012

## if p_ids is not None and revisions.intersection(p_ids))

1013

## return simple_ancestors

1014

1015

# Yet Another Way, invert the parent map (which can be cached)

1016

## descendants = {}

1017

## for revision_id, parent_ids in parent_map.iteritems():

1018

## for p_id in parent_ids:

1019

## descendants.setdefault(p_id, []).append(revision_id)

1020

## for revision in revisions.intersection(descendants):

1021

## simple_ancestors.difference_update(descendants[revision])

1022

## return simple_ancestors

1023

for revision, parent_ids in parent_map.iteritems():

1024

if parent_ids is None:

1025

continue

1026

for parent_id in parent_ids:

1027

if parent_id in revisions:

1028

# This node has a parent present in the set, so we can

1029

# remove it

1030

simple_ancestors.discard(revision)

1031

break

1032

return simple_ancestors

1033

447

1034

448

1035

class HeadsCache(object):

449

1036

"""A cache of results for graph heads calls."""

473

1060

return set(heads)

474

1061

475

1062

1063

class FrozenHeadsCache(object):
    """Memoise heads() answers as frozensets.

    Callers are assumed not to modify the returned values.
    """

    def __init__(self, graph):
        # The object whose heads() method computes uncached answers.
        self.graph = graph
        # Maps frozenset(keys) -> frozenset(heads).
        self._heads = {}

    def heads(self, keys):
        """Return the heads of keys.

        Similar to Graph.heads(). The main difference is that the return
        value is a frozen set which cannot be mutated.

        :see also: Graph.heads.
        :param keys: The keys to calculate heads for.
        :return: A frozenset containing the heads.
        """
        lookup_key = frozenset(keys)
        answer = self._heads.get(lookup_key)
        if answer is None:
            # Not cached yet: ask the graph once and remember the result.
            answer = frozenset(self.graph.heads(lookup_key))
            self._heads[lookup_key] = answer
        return answer

    def cache(self, keys, heads):
        """Store a known value."""
        frozen_keys = frozenset(keys)
        self._heads[frozen_keys] = frozenset(heads)

1091

1092

476

1093

class _BreadthFirstSearcher(object):

477

1094

"""Parallel search breadth-first the ancestry of revisions.

478

1095

527

1144

return SearchResult(self._started_keys, excludes, len(included_keys),

528

1145

included_keys)

529

1146

1147

def step(self):
    """Advance the search once without raising at the end.

    :return: Whatever self.next() returns, or an empty tuple if
        self.next() raised StopIteration.
    """
    try:
        found = self.next()
    except StopIteration:
        found = ()
    return found

1152

530

1153

def next(self):

531

1154

"""Return the next ancestors of this revision.

532

1155

597

1220

:return: A tuple: (set(found_revisions), set(ghost_revisions),

598

1221

set(parents_of_found_revisions), dict(found_revisions:parents)).

599

1222

"""

600

found_parents = set()

1223

found_revisions = set()

601

1224

parents_of_found = set()

602

1225

# revisions may contain nodes that point to other nodes in revisions:

603

1226

# we want to filter them out.

604

1227

self.seen.update(revisions)

605

1228

parent_map = self._parents_provider.get_parent_map(revisions)

1229

found_revisions.update(parent_map)

606

1230

for rev_id, parents in parent_map.iteritems():

607

found_parents.add(rev_id)

608

parents_of_found.update(p for p in parents if p not in self.seen)

609

ghost_parents = revisions - found_parents

610

return found_parents, ghost_parents, parents_of_found, parent_map

1231

new_found_parents = [p for p in parents if p not in self.seen]

1232

if new_found_parents:

1233

# Calling set.update() with an empty generator is actually

1234

# rather expensive.

1235

parents_of_found.update(new_found_parents)

1236

ghost_revisions = revisions - found_revisions

1237

return found_revisions, ghost_revisions, parents_of_found, parent_map

611

1238

612

1239

def __iter__(self):

613

1240

return self

614

1241

615

def find_seen_ancestors(self, revision):

616

"""Find ancestors of this revision that have already been seen."""

617

searcher = _BreadthFirstSearcher([revision], self._parents_provider)

618

seen_ancestors = set()

619

for ancestors in searcher:

620

for ancestor in ancestors:

621

if ancestor not in self.seen:

622

searcher.stop_searching_any([ancestor])

623

else:

624

seen_ancestors.add(ancestor)

1242

def find_seen_ancestors(self, revisions):
    """Collect the ancestors of revisions that this searcher has seen.

    The walk asks the parents provider again about nodes it has already
    been asked about, on the assumption that such repeat queries are
    reasonably cheap (eg, not a round trip to a remote host).

    :param revisions: The revision ids to start from.
    :return: A set holding those of revisions that are in self.seen,
        plus every seen ancestor reachable from them through seen nodes.
    """
    # TODO: Often we might ask one searcher for its seen ancestors, and
    #       then ask another searcher the same question. This can result
    #       in searching the same revisions repeatedly if the two
    #       searchers have a lot of overlap.
    seen = self.seen
    frontier = set(revisions).intersection(seen)
    found = set(frontier)

    # In 'next' mode self.seen records what has been returned, not what
    # has been queried, so nodes still waiting in the next query must be
    # reported but not probed for parents.
    unqueried = ()
    if self._returning == 'next':
        unqueried = self._next_query
    frontier.difference_update(unqueried)

    lookup_parents = self._parents_provider.get_parent_map
    while frontier:
        # Ghosts are simply missing from the map; that is fine, because
        # a ghost cannot have been seen.
        candidate_parents = set()
        for parent_ids in lookup_parents(frontier).itervalues():
            candidate_parents.update(parent_ids)
        frontier = seen.intersection(candidate_parents)
        frontier.difference_update(found)
        found.update(frontier)
        frontier.difference_update(unqueried)

    return found

626

1279

627

1280

def stop_searching_any(self, revisions):

631

1284

None of the specified revisions are required to be present in the

632

1285

search list. In this case, the call is a no-op.

633

1286

"""

1287

# TODO: does this help performance?

1288

# if not revisions:

1289

# return set()

634

1290

revisions = frozenset(revisions)

635

1291

if self._returning == 'next':

636

1292

stopped = self._next_query.intersection(revisions)

676

1332

revisions = frozenset(revisions)

677

1333

self._started_keys.update(revisions)

678

1334

new_revisions = revisions.difference(self.seen)

679

revs, ghosts, query, parents = self._do_query(revisions)

680

self._stopped_keys.update(ghosts)

681

1335

if self._returning == 'next':

682

1336

self._next_query.update(new_revisions)

1337

self.seen.update(new_revisions)

683

1338

else:

684

1339

# perform a query on revisions

1340

revs, ghosts, query, parents = self._do_query(revisions)

1341

self._stopped_keys.update(ghosts)

685

1342

self._current_present.update(revs)

686

1343

self._current_ghosts.update(ghosts)

687

1344

self._next_query.update(query)

Older »