/brz/remove-bazaar : revision 1257

To get this branch, use:

bzr branch
http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar

« back to all changes in this revision

Viewing changes to bzrlib/commit.py

Committer: Martin Pool
Date: 2005-09-15 06:32:04 UTC
Revision ID: mbp@sourcefrog.net-20050915063203-8d7b634786abe83b

doc

files added:
HACKING

Makefile

bzrlib/builtins.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/plugins/__init__.py

bzrlib/selftest/TestUtil.py

bzrlib/selftest/test_ancestry.py

bzrlib/selftest/test_commit.py

bzrlib/selftest/test_merge_core.py

bzrlib/selftest/test_parent.py

bzrlib/selftest/test_smart_add.py

bzrlib/selftest/test_xml.py

bzrlib/selftest/testfetch.py

bzrlib/selftest/teststore.py

bzrlib/shellcomplete.py

bzrlib/ui.py

bzrlib/util

bzrlib/util/__init__.py

bzrlib/weavestore.py

bzrlib/xml5.py

notes/inventory-v2-sample.xml

notes/inventory-v2.rnc

notes/revfile.txt

notes/schemas.xml

tools/history2revfiles.py

tools/history2weaves.py

tools/http_client.py

files removed:
plugins/changeset

plugins/changeset/__init__.py

plugins/changeset/apply_changeset.py

plugins/changeset/common.py

plugins/changeset/gen_changeset.py

plugins/changeset/read_changeset.py

plugins/checkperms

files renamed:
plugins/ => bzrlib/plugins/

tools/testweave.py => bzrlib/selftest/test_weave.py

effbot/ => bzrlib/util/effbot/

elementtree/ => bzrlib/util/elementtree/

urlgrabber/ => bzrlib/util/urlgrabber/

bzrlib/newinventory.py => contrib/newinventory.py

files modified:
.bzrignore

NEWS

TODO

bzrlib/__init__.py

bzrlib/add.py

bzrlib/branch.py

bzrlib/changeset.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/errors.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/inventory.py

bzrlib/log.py

bzrlib/mdiff.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/merge_core.py

bzrlib/osutils.py

bzrlib/patch.py

bzrlib/plugin.py

bzrlib/progress.py

bzrlib/remotebranch.py

bzrlib/revfile.py

bzrlib/revision.py

bzrlib/selftest/__init__.py

bzrlib/selftest/blackbox.py

bzrlib/selftest/plugins.py

bzrlib/selftest/testbranch.py

bzrlib/selftest/testdiff.py

bzrlib/selftest/testhashcache.py

bzrlib/selftest/testinv.py

bzrlib/selftest/testlog.py

bzrlib/selftest/testmerge3.py

bzrlib/selftest/testrevision.py

bzrlib/selftest/testrevisionnamespaces.py

bzrlib/selftest/teststatus.py

bzrlib/selftest/versioning.py

bzrlib/selftest/whitebox.py

bzrlib/status.py

bzrlib/store.py

bzrlib/trace.py

bzrlib/tree.py

bzrlib/upgrade.py

bzrlib/weave.py

bzrlib/weavefile.py

bzrlib/workingtree.py

bzrlib/xml.py

doc/index.txt

doc/todo-from-arch.txt

setup.py

testsweet.py

tools/weavebench.py

tutorial.txt

Show diffs side-by-side

added added

removed removed

bzrlib/commit.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

# FIXME: "bzr commit doc/format" commits doc/format.txt!

def commit(branch, message,

timestamp=None,

timezone=None,

committer=None,

verbose=True,

specific_files=None,

rev_id=None,

allow_pointless=True):

"""Commit working copy as a new revision.

The basic approach is to add all the file texts into the

store, then the inventory, then make a new revision pointing

to that inventory and store that.

This is not quite safe if the working copy changes during the

commit; for the moment that is simply not allowed. A better

approach is to make a temporary copy of the files before

computing their hashes, and then add those hashes in turn to

the inventory. This should mean at least that there are no

broken hash pointers. There is no way we can get a snapshot

of the whole directory at an instant. This would also have to

be robust against files disappearing, moving, etc. So the

whole thing is a bit hard.

This raises PointlessCommit if there are no changes, no new merges,

and allow_pointless is false.

timestamp -- if not None, seconds-since-epoch for a

postdated/predated commit.

specific_files

If true, commit only those files.

rev_id

If set, use this as the new revision id.

Useful for test or import commands that need to tightly

control what revisions are assigned. If you duplicate

a revision id that exists elsewhere it is your own fault.

If null (default), a time/random revision id is generated.

"""

import time, tempfile

from bzrlib.osutils import local_time_offset, username

from bzrlib.branch import gen_file_id

from bzrlib.errors import BzrError, PointlessCommit

from bzrlib.revision import Revision, RevisionReference

from bzrlib.trace import mutter, note

from bzrlib.xml import pack_xml

branch.lock_write()

try:

# First walk over the working inventory; and both update that

# and also build a new revision inventory. The revision

# inventory needs to hold the text-id, sha1 and size of the

# actual file versions committed in the revision. (These are

# not present in the working inventory.) We also need to

# detect missing/deleted files, and remove them from the

# working inventory.

work_tree = branch.working_tree()

work_inv = work_tree.inventory

basis = branch.basis_tree()

basis_inv = basis.inventory

if verbose:

note('looking for changes...')

pending_merges = branch.pending_merges()

missing_ids, new_inv, any_changes = \

_gather_commit(branch,

work_tree,

work_inv,

basis_inv,

specific_files,

verbose)

100

if not (any_changes or allow_pointless or pending_merges):

101

raise PointlessCommit()

102

103

for file_id in missing_ids:

104

# Any files that have been deleted are now removed from the

105

# working inventory. Files that were not selected for commit

106

# are left as they were in the working inventory and omitted

107

# from the revision inventory.

108

109

# have to do this later so we don't mess up the iterator.

110

# since parents may be removed before their children we

111

# have to test.

112

113

# FIXME: There's probably a better way to do this; perhaps

114

# the workingtree should know how to filter itself.

115

if work_inv.has_id(file_id):

116

del work_inv[file_id]

117

118

# XXX: Can we do any better about making interrupted commits change

# nothing? Perhaps the best approach is to integrate commit of

# AtomicFiles with releasing the lock on the Branch.

# TODO: Separate 'prepare' phase where we find a list of potentially

# committed files. We can then pause the commit to prompt for a

# commit message, knowing the summary will be the same as what's

# actually used for the commit. (But perhaps simpler to simply get

# the tree status, then use that for a selective commit?)

# The newly committed revision is going to have a shape corresponding

# to that of the working inventory. Files that are not in the

# working tree and that were in the predecessor are reported as

# removed --- this can include files that were either removed from the

# inventory or deleted in the working tree. If they were only

# deleted from disk, they are removed from the working inventory.

# We then consider the remaining entries, which will be in the new

# version. Directory entries are simply copied across. File entries

# must be checked to see if a new version of the file should be

# recorded. For each parent revision inventory, we check to see what

# version of the file was present. If the file was present in at

# least one tree, and if it was the same version in all the trees,

# then we can just refer to that version. Otherwise, a new version

# representing the merger of the file versions must be added.

# TODO: Update hashcache before and after - or does the WorkingTree

# look after that?

import os

import sys

import time

import pdb

from binascii import hexlify

from cStringIO import StringIO

from bzrlib.osutils import (local_time_offset, username,

rand_bytes, compact_date, user_email,

kind_marker, is_inside_any, quotefn,

sha_string, sha_strings, sha_file, isdir, isfile,

split_lines)

from bzrlib.branch import gen_file_id, INVENTORY_FILEID, ANCESTRY_FILEID

from bzrlib.errors import BzrError, PointlessCommit

from bzrlib.revision import Revision, RevisionReference

from bzrlib.trace import mutter, note

from bzrlib.xml5 import serializer_v5

from bzrlib.inventory import Inventory

from bzrlib.weave import Weave

from bzrlib.weavefile import read_weave, write_weave_v5

from bzrlib.atomicfile import AtomicFile

def commit(*args, **kwargs):
    """Commit a new revision to a branch (legacy functional interface).

    Builds a fresh Commit object with its default reporter and forwards
    every positional and keyword argument unchanged to its commit()
    method.  Nothing is returned.

    Kept for the convenience of old callers; new code should use the
    Commit class directly.
    """
    task = Commit()
    task.commit(*args, **kwargs)

class NullCommitReporter(object):
    """Commit progress reporter whose notifications all do nothing."""

    def added(self, path):
        """Accept an 'added' notification for path and ignore it."""

    def removed(self, path):
        """Accept a 'removed' notification for path and ignore it."""

    def renamed(self, old_path, new_path):
        """Accept a 'renamed' notification and ignore it."""

class ReportCommitToLog(NullCommitReporter):
    """Commit reporter that passes each notification to note()."""

    def added(self, path):
        """Log an 'added' line for path."""
        note('added %s', path)

    def removed(self, path):
        """Log a 'removed' line for path."""
        note('removed %s', path)

    def renamed(self, old_path, new_path):
        """Log a 'renamed' line showing the old and the new path."""
        note('renamed %s => %s', old_path, new_path)

104

105

106

class Commit(object):

107

"""Task of committing a new revision.

108

109

This is a MethodObject: it accumulates state as the commit is

110

prepared, and then it is discarded. It doesn't represent

111

historical revisions, just the act of recording a new one.

112

113

missing_ids

114

Modified to hold a list of files that have been deleted from

115

the working directory; these should be removed from the

116

working inventory.

117

"""

118

def __init__(self,
             reporter=None):
    """Set up the commit task.

    reporter -- object stored as self.reporter; when None is given a
        new NullCommitReporter is created and stored instead.
    """
    if reporter is None:
        reporter = NullCommitReporter()
    self.reporter = reporter

124

125

126

def commit(self,

127

branch, message,

128

timestamp=None,

129

timezone=None,

130

committer=None,

131

specific_files=None,

132

rev_id=None,

133

allow_pointless=True):

134

"""Commit working copy as a new revision.

135

136

timestamp -- if not None, seconds-since-epoch for a

137

postdated/predated commit.

138

139

specific_files -- If true, commit only those files.

140

141

rev_id -- If set, use this as the new revision id.

142

Useful for test or import commands that need to tightly

143

control what revisions are assigned. If you duplicate

144

a revision id that exists elsewhere it is your own fault.

145

If null (default), a time/random revision id is generated.

146

147

allow_pointless -- If true (default), commit even if nothing

148

has changed and no merges are recorded.

149

"""

150

self.any_changes = False

151

152

self.branch = branch

153

self.weave_store = branch.weave_store

154

self.rev_id = rev_id

155

self.specific_files = specific_files

156

self.allow_pointless = allow_pointless

157

158

if timestamp is None:

159

self.timestamp = time.time()

160

else:

161

self.timestamp = long(timestamp)

162

119

163

if rev_id is None:

120

rev_id = _gen_revision_id(time.time())

121

inv_id = rev_id

122

123

inv_tmp = tempfile.TemporaryFile()

124

pack_xml(new_inv, inv_tmp)

125

inv_tmp.seek(0)

126

branch.inventory_store.add(inv_tmp, inv_id)

127

mutter('new inventory_id is {%s}' % inv_id)

128

129

# We could also just sha hash the inv_tmp file

130

# however, in the case that branch.inventory_store.add()

131

# ever actually does anything special

132

inv_sha1 = branch.get_inventory_sha1(inv_id)

133

134

branch._write_inventory(work_inv)

135

136

if timestamp == None:

137

timestamp = time.time()

138

139

if committer == None:

140

committer = username()

141

142

if timezone == None:

143

timezone = local_time_offset()

144

145

mutter("building commit log message")

146

rev = Revision(timestamp=timestamp,

147

timezone=timezone,

148

committer=committer,

149

message = message,

150

inventory_id=inv_id,

151

inventory_sha1=inv_sha1,

152

revision_id=rev_id)

153

154

rev.parents = []

155

precursor_id = branch.last_patch()

164

self.rev_id = _gen_revision_id(self.branch, self.timestamp)

165

else:

166

self.rev_id = rev_id

167

168

if committer is None:

169

self.committer = username(self.branch)

170

else:

171

assert isinstance(committer, basestring), type(committer)

172

self.committer = committer

173

174

if timezone is None:

175

self.timezone = local_time_offset()

176

else:

177

self.timezone = int(timezone)

178

179

assert isinstance(message, basestring), type(message)

180

self.message = message

181

182

self.branch.lock_write()

183

try:

184

self.work_tree = self.branch.working_tree()

185

self.work_inv = self.work_tree.inventory

186

self.basis_tree = self.branch.basis_tree()

187

self.basis_inv = self.basis_tree.inventory

188

189

self._gather_parents()

190

191

self._remove_deleted()

192

self.new_inv = Inventory()

193

self._store_files()

194

self._report_deletes()

195

196

if not (self.allow_pointless

197

or len(self.parents) != 1

198

or self.new_inv != self.basis_inv):

199

raise PointlessCommit()

200

201

self._record_inventory()

202

self._record_ancestry()

203

self._make_revision()

204

note('committed r%d {%s}', (self.branch.revno() + 1),

205

self.rev_id)

206

self.branch.append_revision(self.rev_id)

207

self.branch.set_pending_merges([])

208

finally:

209

self.branch.unlock()

210

211

212

213

def _record_inventory(self):
    """Serialise new_inv and store it as this revision's inventory text.

    The v5 serialiser output is hashed into self.inv_sha1, split into
    lines and added to the weave store under INVENTORY_FILEID with this
    revision id and self.parents as parents.
    """
    serialized = serializer_v5.write_inventory_to_string(self.new_inv)
    self.inv_sha1 = sha_string(serialized)
    inv_lines = split_lines(serialized)
    self.weave_store.add_text(INVENTORY_FILEID, self.rev_id,
                              inv_lines, self.parents)

219

220

221

def _record_ancestry(self):
    """Add this revision's ancestry text to the ancestry weave.

    The new text is whatever the weave holds for the first parent (or
    nothing when there are no parents) followed by one line naming this
    revision.  It is added with every entry of self.parents as a weave
    parent, and the weave is then written back to the store.
    """
    ancestry_weave = self.weave_store.get_weave_or_empty(ANCESTRY_FILEID)
    ancestry = []
    if self.parents:
        first_parent_idx = ancestry_weave.lookup(self.parents[0])
        ancestry = ancestry_weave.get(first_parent_idx)
    ancestry.append(self.rev_id + '\n')
    parent_idxs = [ancestry_weave.lookup(parent) for parent in self.parents]
    ancestry_weave.add(self.rev_id, parent_idxs, ancestry)
    self.weave_store.put_weave(ANCESTRY_FILEID, ancestry_weave)

232

233

234

def _gather_parents(self):

235

pending_merges = self.branch.pending_merges()

236

self.parents = []

237

precursor_id = self.branch.last_revision()

156

238

if precursor_id:

157

precursor_sha1 = branch.get_revision_sha1(precursor_id)

158

rev.parents.append(RevisionReference(precursor_id, precursor_sha1))

159

for merge_rev in pending_merges:

160

rev.parents.append(RevisionReference(merge_rev))

161

162

rev_tmp = tempfile.TemporaryFile()

163

pack_xml(rev, rev_tmp)

239

self.parents.append(precursor_id)

240

self.parents += pending_merges

241

self.parent_trees = map(self.branch.revision_tree, self.parents)

242

243

244

def _make_revision(self):

245

"""Record a new revision object for this commit."""

246

self.rev = Revision(timestamp=self.timestamp,

247

timezone=self.timezone,

248

committer=self.committer,

249

message=self.message,

250

inventory_sha1=self.inv_sha1,

251

revision_id=self.rev_id)

252

self.rev.parents = map(RevisionReference, self.parents)

253

rev_tmp = StringIO()

254

serializer_v5.write_revision(self.rev, rev_tmp)

164

255

rev_tmp.seek(0)

165

branch.revision_store.add(rev_tmp, rev_id)

166

mutter("new revision_id is {%s}" % rev_id)

167

168

## XXX: Everything up to here can simply be orphaned if we abort

169

## the commit; it will leave junk files behind but that doesn't

170

## matter.

171

172

## TODO: Read back the just-generated changeset, and make sure it

173

## applies and recreates the right state.

174

175

## TODO: Also calculate and store the inventory SHA1

176

mutter("committing patch r%d" % (branch.revno() + 1))

177

178

branch.append_revision(rev_id)

179

180

branch.set_pending_merges([])

181

182

if verbose:

183

note("commited r%d" % branch.revno())

184

finally:

185

branch.unlock()

186

187

188

189

def _gen_revision_id(when):

256

self.branch.revision_store.add(rev_tmp, self.rev_id)

257

mutter('new revision_id is {%s}', self.rev_id)

258

259

260

def _remove_deleted(self):
    """Remove deleted files from the working inventory.

    This is done prior to taking the working inventory as the
    basis for the new committed inventory.  When specific_files is
    set, only entries inside those paths are examined.  An entry
    counts as deleted when the working tree has no file of that
    name; each one is logged, dropped from the working inventory,
    and the inventory is written back if anything was dropped.

    Returns True if any files *that existed in the basis inventory*
    were deleted, False otherwise.  Files that were added and deleted
    in the working copy don't matter.
    """
    specific = self.specific_files
    deleted_ids = []
    for path, ie in self.work_inv.iter_entries():
        if specific and not is_inside_any(specific, path):
            continue
        if not self.work_tree.has_filename(path):
            note('missing %s', path)
            deleted_ids.append(ie.file_id)
    if not deleted_ids:
        return False

    basis_changed = False
    for file_id in deleted_ids:
        if self.basis_inv.has_id(file_id):
            basis_changed = True
        # A parent may be removed before its children, which can take
        # the children with it, so test before deleting.
        if self.work_inv.has_id(file_id):
            del self.work_inv[file_id]
    self.branch._write_inventory(self.work_inv)
    return basis_changed

283

284

285

def _find_file_parents(self, file_id):
    """Collect the text versions of file_id found in the parent trees.

    Returns a dict mapping text version to text sha1, with one entry
    per distinct version seen in self.parent_trees.  Trees whose
    inventory lacks the file are skipped, so the dict is empty for a
    new file.

    Asserts that every entry found is a file with the requested id,
    and that a version seen more than once always has the same sha1.
    """
    versions = {}
    for parent_tree in self.parent_trees:
        parent_inv = parent_tree.inventory
        if file_id not in parent_inv:
            continue
        entry = parent_inv[file_id]
        assert entry.kind == 'file'
        assert entry.file_id == file_id
        # setdefault records a first sighting and hands back the
        # earlier sha1 on a repeat, so one check covers both cases.
        known_sha1 = versions.setdefault(entry.text_version, entry.text_sha1)
        assert known_sha1 == entry.text_sha1
    return versions

304

305

306

def _store_files(self):
    """Fill new_inv from the working inventory, storing new file texts.

    Every working-inventory entry is handled in one of four ways:

    * outside specific_files (when that is set): handed to
      _carry_file, which keeps the basis version if there is one;
    * not a file: handed to _commit_nonfile;
    * a file with exactly one parent version whose sha1 equals the
      working copy's sha1: not changed or merged, so handed to
      _carry_file;
    * anything else: logged as merged, added or modified according to
      the number of parent versions, then handed to _commit_file.
    """
    for path, new_ie in self.work_inv.iter_entries():
        file_id = new_ie.file_id
        mutter('check %s {%s}', path, new_ie.file_id)

        selected = (not self.specific_files
                    or is_inside_any(self.specific_files, path))
        if not selected:
            mutter('%s not selected for commit', path)
            self._carry_file(file_id)
            continue

        if new_ie.kind != 'file':
            self._commit_nonfile(file_id)
            continue

        file_parents = self._find_file_parents(file_id)
        wc_sha1 = self.work_tree.get_file_sha1(file_id)
        parent_count = len(file_parents)
        if parent_count == 1 and list(file_parents.values())[0] == wc_sha1:
            # not changed or merged
            self._carry_file(file_id)
            continue

        mutter('parents of %s are %r', path, file_parents)

        # file is either new, modified, or a file merge; a new version
        # has to be recorded
        if parent_count > 1:
            note('merged %s', path)
        elif parent_count == 0:
            note('added %s', path)
        else:
            note('modified %s', path)
        self._commit_file(new_ie, file_id, file_parents)

343

344

345

def _commit_nonfile(self, file_id):
    """Add a copy of the working-inventory entry for file_id to new_inv."""
    working_entry = self.work_inv[file_id]
    self.new_inv.add(working_entry.copy())

347

348

349

def _carry_file(self, file_id):
    """Keep a file in the same state as in the basis.

    A copy of the basis-inventory entry is added to new_inv.  When the
    basis inventory has no such id, nothing is added.
    """
    if not self.basis_inv.has_id(file_id):
        return
    basis_entry = self.basis_inv[file_id]
    self.new_inv.add(basis_entry.copy())

353

354

355

def _report_deletes(self):
    """Log a 'deleted' line for each basis file id missing from new_inv.

    The path reported is the one the id had in the basis inventory.
    """
    for file_id in self.basis_inv:
        if file_id in self.new_inv:
            continue
        old_path = self.basis_inv.id2path(file_id)
        note('deleted %s', old_path)

359

360

361

def _commit_file(self, new_ie, file_id, file_parents):
    """Store the working text of a file and add its entry to new_inv.

    The lines read from the working tree are added to the weave store
    under this revision id with file_parents as parents.  new_ie is
    then updated in place (text_version, text_sha1, text_size) and
    that same object is added to new_inv.
    """
    mutter('store new text for {%s} in revision {%s}',
           file_id, self.rev_id)
    text_lines = self.work_tree.get_file(file_id).readlines()
    self._add_text_to_weave(file_id, text_lines, file_parents)
    new_ie.text_version = self.rev_id
    new_ie.text_sha1 = sha_strings(text_lines)
    new_ie.text_size = sum([len(line) for line in text_lines])
    self.new_inv.add(new_ie)

370

371

372

def _add_text_to_weave(self, file_id, new_lines, parents):
    """Add new_lines to the weave store as this revision's text of file_id.

    Raises ValueError when file_id starts with '__'.
    NOTE(review): that prefix is presumably reserved for internal
    weaves such as the inventory and ancestry -- confirm.
    """
    reserved = file_id.startswith('__')
    if reserved:
        raise ValueError('illegal file-id %r for text file' % file_id)
    store = self.weave_store
    store.add_text(file_id, self.rev_id, new_lines, parents)

376

377

378

def _gen_revision_id(branch, when):

190

379

"""Return new revision-id."""

191

from binascii import hexlify

192

from osutils import rand_bytes, compact_date, user_email

193

194

s = '%s-%s-' % (user_email(), compact_date(when))

380

s = '%s-%s-' % (user_email(branch), compact_date(when))

195

381

s += hexlify(rand_bytes(8))

196

382

return s

197

383

198

384

199

def _gather_commit(branch, work_tree, work_inv, basis_inv, specific_files,

200

verbose):

201

"""Build inventory preparatory to commit.

202

203

Returns missing_ids, new_inv, any_changes.

204

205

This adds any changed files into the text store, and sets their

206

text-id, sha and size in the returned inventory appropriately.

207

208

missing_ids

209

Modified to hold a list of files that have been deleted from

210

the working directory; these should be removed from the

211

working inventory.

212

"""

213

from bzrlib.inventory import Inventory

214

from bzrlib.osutils import isdir, isfile, sha_string, quotefn, \

215

local_time_offset, username, kind_marker, is_inside_any

216

217

from bzrlib.branch import gen_file_id

218

from bzrlib.errors import BzrError

219

from bzrlib.revision import Revision

220

from bzrlib.trace import mutter, note

221

222

any_changes = False

223

inv = Inventory(work_inv.root.file_id)

224

missing_ids = []

225

226

for path, entry in work_inv.iter_entries():

227

## TODO: Check that the file kind has not changed from the previous

228

## revision of this file (if any).

229

230

p = branch.abspath(path)

231

file_id = entry.file_id

232

mutter('commit prep file %s, id %r ' % (p, file_id))

233

234

if specific_files and not is_inside_any(specific_files, path):

235

mutter(' skipping file excluded from commit')

236

if basis_inv.has_id(file_id):

237

# carry over with previous state

238

inv.add(basis_inv[file_id].copy())

239

else:

240

# omit this from committed inventory

241

pass

242

continue

243

244

if not work_tree.has_id(file_id):

245

if verbose:

246

print('deleted %s%s' % (path, kind_marker(entry.kind)))

247

any_changes = True

248

mutter(" file is missing, removing from inventory")

249

missing_ids.append(file_id)

250

continue

251

252

# this is present in the new inventory; may be new, modified or

253

# unchanged.

254

old_ie = basis_inv.has_id(file_id) and basis_inv[file_id]

255

256

entry = entry.copy()

257

inv.add(entry)

258

259

if old_ie:

260

old_kind = old_ie.kind

261

if old_kind != entry.kind:

262

raise BzrError("entry %r changed kind from %r to %r"

263

% (file_id, old_kind, entry.kind))

264

265

if entry.kind == 'directory':

266

if not isdir(p):

267

raise BzrError("%s is entered as directory but not a directory"

268

% quotefn(p))

269

elif entry.kind == 'file':

270

if not isfile(p):

271

raise BzrError("%s is entered as file but is not a file" % quotefn(p))

272

273

new_sha1 = work_tree.get_file_sha1(file_id)

274

275

if (old_ie

276

and old_ie.text_sha1 == new_sha1):

277

## assert content == basis.get_file(file_id).read()

278

entry.text_id = old_ie.text_id

279

entry.text_sha1 = new_sha1

280

entry.text_size = old_ie.text_size

281

mutter(' unchanged from previous text_id {%s}' %

282

entry.text_id)

283

else:

284

content = file(p, 'rb').read()

285

286

# calculate the sha again, just in case the file contents

287

# changed since we updated the cache

288

entry.text_sha1 = sha_string(content)

289

entry.text_size = len(content)

290

291

entry.text_id = gen_file_id(entry.name)

292

branch.text_store.add(content, entry.text_id)

293

mutter(' stored with text_id {%s}' % entry.text_id)

294

295

if verbose:

296

marked = path + kind_marker(entry.kind)

297

if not old_ie:

298

print 'added', marked

299

any_changes = True

300

elif old_ie == entry:

301

pass # unchanged

302

elif (old_ie.name == entry.name

303

and old_ie.parent_id == entry.parent_id):

304

print 'modified', marked

305

any_changes = True

306

else:

307

print 'renamed', marked

308

any_changes = True

309

310

return missing_ids, inv, any_changes

311

312

385

386

Older »