/brz/remove-bazaar : revision 0.64.44

To get this branch, use:

bzr branch http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar

« back to all changes in this revision

Viewing changes to processors/generic_processor.py

Committer: Ian Clatworthy
Date: 2008-02-21 07:22:58 UTC
mto: (0.106.1 trunk) (6622.6.1 bundle) (6628.1.3 integration-fastimport) (7194.1.1 fastexport-empty-parents)
mto: This revision was merged to the branch mainline in revision 6631.
Revision ID: ian.clatworthy@internode.on.net-20080221072258-vqp99j5te5fnyeb2

smart caching of serialised inventories

files modified:
__init__.py

processors/generic_processor.py

revisionloader.py

Show diffs side-by-side

added added

removed removed

processors/generic_processor.py

# How many commits before automatically checkpointing

_DEFAULT_AUTO_CHECKPOINT = 10000

# How many inventories to cache

_DEFAULT_INV_CACHE_SIZE = 10

class GenericProcessor(processor.ImportProcessor):

"""An import processor that handles basic imports.

above any checkpoints contained in the import stream.

The default is 10000.

* count - only import this many commits then exit. If not set,

all commits are imported.

* count - only import this many commits then exit. If not set

or negative, all commits are imported.

* inv-cache - number of inventories to cache.

If not set, the default is 10.

"""

known_params = ['info', 'trees', 'checkpoint', 'count']

known_params = ['info', 'trees', 'checkpoint', 'count', 'inv-cache']

def note(self, msg, *args):

"""Output a note but timestamp it."""

106

112

def pre_process(self):

107

113

self._start_time = time.time()

108

114

self._load_info_and_params()

109

self.cache_mgr = GenericCacheManager(self.info, verbose=self.verbose)

115

self.cache_mgr = GenericCacheManager(self.info, self.verbose,

116

self.inventory_cache_size)

110

117

self.init_stats()

111

118

112

119

# mapping of tag name to revision_id

116

123

# Checkpointing closes the current one and starts a new one.

117

124

self.repo.start_write_group()

118

125

126

# Turn on caching for the inventory versioned file

127

inv_vf = self.repo.get_inventory_weave()

128

inv_vf.enable_cache()

129

119

130

def _load_info_and_params(self):

120

131

# Load the info file, if any

121

132

info_path = self.params.get('info')

134

145

self.checkpoint_every = int(self.params.get('checkpoint',

135

146

_DEFAULT_AUTO_CHECKPOINT))

136

147

148

# Decide how big to make the inventory cache

149

self.inventory_cache_size = int(self.params.get('inv-cache',

150

_DEFAULT_INV_CACHE_SIZE))

151

137

152

# Find the maximum number of commits to import (None means all)

138

153

# and prepare progress reporting. Just in case the info file

139

154

# has an outdated count of commits, we store the max counts

354

369

self.last_ids = {}

355

370

self.heads = {}

356

371

372

# Cache of recent serialised inventories

373

self.inv_parent_texts = lru_cache.LRUCache(inventory_cache_size)

374

357

375

# Work out the blobs to make sticky - None means all

358

376

#print "%r" % (info,)

359

377

self._blobs_to_keep = None

401

419

self.cache_mgr = cache_mgr

402

420

self.verbose = verbose

403

421

# smart loader that uses these caches

404

self.loader = revisionloader.RevisionLoader(repo,

405

lambda revision_ids: self._get_inventories(revision_ids))

422

self.loader = revisionloader.ImportRevisionLoader(repo,

423

lambda revision_ids: self._get_inventories(revision_ids),

424

cache_mgr.inv_parent_texts)

425

#self.loader = revisionloader.RevisionLoader(repo,

426

# lambda revision_ids: self._get_inventories(revision_ids))

406

427

407

428

def note(self, msg, *args):

408

429

"""Output a note but add context."""

Older »