bzr branch
http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar
| 70
by mbp at sourcefrog Prepare for smart recursive add. | 1 | # Copyright (C) 2005 Canonical Ltd
 | 
| 1
by mbp at sourcefrog import from baz patch-364 | 2 | |
| 3 | # This program is free software; you can redistribute it and/or modify
 | |
| 4 | # it under the terms of the GNU General Public License as published by
 | |
| 5 | # the Free Software Foundation; either version 2 of the License, or
 | |
| 6 | # (at your option) any later version.
 | |
| 7 | ||
| 8 | # This program is distributed in the hope that it will be useful,
 | |
| 9 | # but WITHOUT ANY WARRANTY; without even the implied warranty of
 | |
| 10 | # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 | |
| 11 | # GNU General Public License for more details.
 | |
| 12 | ||
| 13 | # You should have received a copy of the GNU General Public License
 | |
| 14 | # along with this program; if not, write to the Free Software
 | |
| 15 | # Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
 | |
| 16 | ||
| 17 | """Tree classes, representing directory at point in time.
 | |
| 18 | """
 | |
| 19 | ||
| 849
by Martin Pool - Put files inside an exported tarball into a top-level directory rather than | 20 | import os | 
| 800
by Martin Pool Merge John's import-speedup branch: | 21 | |
| 1018
by Martin Pool - remove root_id from EmptyTree | 22 | import bzrlib | 
| 694
by Martin Pool - weed out all remaining calls to bailout() and remove the function | 23 | from bzrlib.trace import mutter, note | 
| 24 | from bzrlib.errors import BzrError | |
| 1018
by Martin Pool - remove root_id from EmptyTree | 25 | from bzrlib.inventory import Inventory | 
| 26 | from bzrlib.osutils import pumpfile, appendpath, fingerprint_file | |
| 1
by mbp at sourcefrog import from baz patch-364 | 27 | |
| 28 | ||
# Registry of export back-ends, keyed by format name (for example 'dir').
# Tree.export() looks the format up here and calls the stored callable
# as exporter(tree, dest, root).
exporters = {}
| 30 | ||
class Tree(object):
    """Abstract file tree.

    There are several subclasses:

    * `WorkingTree` exists as files on disk editable by the user.

    * `RevisionTree` is a tree as recorded at some point in the past.

    * `EmptyTree`

    Trees contain an `Inventory` object, and also know how to retrieve
    file texts mentioned in the inventory, either from a working
    directory or from a store.

    It is possible for trees to contain files that are not described
    in their inventory or vice versa; for this use `filenames()`.

    Trees can be compared, etc, regardless of whether they are working
    trees or versioned trees.

    The methods below rely on the subclass setting `self._inventory`
    and providing `get_file(file_id)`.
    """

    def has_filename(self, filename):
        """True if the tree has given filename."""
        raise NotImplementedError()

    def has_id(self, file_id):
        """Return whether the inventory reports `file_id` as present."""
        return self.inventory.has_id(file_id)

    # Enables the spelling `file_id in tree`.
    __contains__ = has_id

    def __iter__(self):
        """Iterate over whatever iterating the inventory yields."""
        return iter(self.inventory)

    def id2path(self, file_id):
        """Return the inventory's path for `file_id`."""
        return self.inventory.id2path(file_id)

    def _get_inventory(self):
        return self._inventory

    def get_file_by_path(self, path):
        """Return `get_file()` of the file id the inventory maps `path` to."""
        return self.get_file(self.inventory.path2id(path))

    inventory = property(_get_inventory,
                         doc="Inventory of this Tree")

    def _check_retrieved(self, ie, f):
        """Check file object `f` against inventory entry `ie`.

        The fingerprint of `f` is compared with the size (when the
        entry records one) and the SHA-1 stored in `ie`.  `f` is
        rewound to its start before returning.

        Raises BzrError when either value does not match.
        """
        fp = fingerprint_file(f)
        f.seek(0)

        # Only used to make the error messages more helpful.  Not every
        # tree has a store, and a missing attribute must not hide the
        # real corruption error behind an AttributeError.
        store = getattr(self, '_store', None)

        if ie.text_size is not None:
            if ie.text_size != fp['size']:
                raise BzrError("mismatched size for file %r in %r" % (ie.file_id, store),
                        ["inventory expects %d bytes" % ie.text_size,
                         "file is actually %d bytes" % fp['size'],
                         "store is probably damaged/corrupt"])

        if ie.text_sha1 != fp['sha1']:
            raise BzrError("wrong SHA-1 for file %r in %r" % (ie.file_id, store),
                    ["inventory expects %s" % ie.text_sha1,
                     "file is actually %s" % fp['sha1'],
                     "store is probably damaged/corrupt"])

    def print_file(self, fileid):
        """Print file with id `fileid` to stdout."""
        import sys
        pumpfile(self.get_file(fileid), sys.stdout)

    def export(self, dest, format='dir', root=None):
        """Export this tree.

        `format` selects an entry of the module-level `exporters`
        registry; the exporter is called as exporter(self, dest, root).

        Raises BzrCommandError when `format` is not registered.
        """
        try:
            exporter = exporters[format]
        except KeyError:
            from bzrlib.errors import BzrCommandError
            raise BzrCommandError("export format %r not supported" % format)
        exporter(self, dest, root)
| 1
by mbp at sourcefrog import from baz patch-364 | 109 | |
| 110 | ||
| 111 | ||
class RevisionTree(Tree):
    """Tree as it was recorded for an earlier revision.

    File texts are looked up in the text store given to the
    constructor.

    TODO: Some kind of `__repr__` method, but a good one
           probably means knowing the branch and revision number,
           or at least passing a description to the constructor.
    """

    def __init__(self, store, inv):
        self._inventory = inv
        self._store = store

    def get_file(self, file_id):
        """Return the stored text for `file_id` after checking it.

        The text is checked with `_check_retrieved` against the
        inventory entry before it is handed back.
        """
        entry = self._inventory[file_id]
        text = self._store[entry.text_id]
        mutter(" get fileid{%s} from %r" % (file_id, self))
        self._check_retrieved(entry, text)
        return text

    def get_file_size(self, file_id):
        """Return the `text_size` recorded in the inventory entry."""
        entry = self._inventory[file_id]
        return entry.text_size

    def get_file_sha1(self, file_id):
        """Return the `text_sha1` recorded in the inventory entry."""
        return self._inventory[file_id].text_sha1

    def has_filename(self, filename):
        """True when the inventory maps `filename` to a (truthy) file id."""
        if self.inventory.path2id(filename):
            return True
        return False

    def list_files(self):
        """Yield (path, 'V', kind, file_id) for every inventory entry."""
        # The only files returned by this are those from the version
        for item in self.inventory.iter_entries():
            path, entry = item
            yield path, 'V', entry.kind, entry.file_id
| 147 | ||
| 148 | ||
class EmptyTree(Tree):
    """Tree backed by a freshly created `Inventory`; it lists no files."""

    def __init__(self):
        self._inventory = Inventory()

    def has_filename(self, filename):
        """Always False, whatever `filename` is."""
        return False

    def list_files(self):
        """Generator that never yields anything."""
        # Looping over an empty tuple keeps this a generator function
        # without ever producing a value.
        for nothing in ():
            yield nothing
| 159 | ||
| 160 | ||
| 161 | ||
| 162 | ######################################################################
 | |
| 163 | # diff
 | |
| 164 | ||
| 165 | # TODO: Merge these two functions into a single one that can operate
 | |
| 166 | # on either a whole tree or a set of files.
 | |
| 167 | ||
| 168 | # TODO: Return the diff in order by filename, not by category or in
 | |
| 169 | # random order.  Can probably be done by lock-stepping through the
 | |
| 170 | # filenames from both trees.
 | |
| 171 | ||
| 172 | ||
def file_status(filename, old_tree, new_tree):
    """Return single-letter status, old and new names for a file.

    The complexity here is in deciding how to represent renames;
    many complex cases are possible.

    NOTE(review): the unversioned ('I', '?') and vanished-name
    ('X', 'D') cases return a 3-tuple of (status, old_name, new_name),
    but the remaining cases return a bare string ('A', 'D' or 'wtf?').
    Callers have to cope with both shapes; this is left as found.
    """
    before = old_tree.inventory
    after = new_tree.inventory
    id_now = after.path2id(filename)
    id_then = before.path2id(filename)

    if not (id_now or id_then):
        # easy: doesn't exist in either; not versioned at all
        if new_tree.is_ignored(filename):
            return 'I', None, None
        return '?', None, None

    if not id_now:
        # There is no longer a file of this name, but we can describe
        # what happened to the file that used to have
        # this name.  There are two possibilities: either it was
        # deleted entirely, or renamed.
        assert id_then
        if after.has_id(id_then):
            return 'X', before.id2path(id_then), after.id2path(id_then)
        return 'D', before.id2path(id_then), None

    # From here on there is a file of this name in the new tree.

    # if the file_id is new in this revision, it is added
    if not before.has_id(id_now):
        return 'A'

    # if there used to be a file of this name, but that ID has now
    # disappeared, it is deleted
    if id_then and not after.has_id(id_then):
        return 'D'

    return 'wtf?'
| 214 | ||
| 215 | ||
| 216 | ||
def find_renames(old_inv, new_inv):
    """Yield (old_path, new_path) for ids whose path differs.

    Only file ids found in both inventories are considered; ids that
    are missing from `new_inv` are skipped.
    """
    for file_id in old_inv:
        if file_id in new_inv:
            path_before = old_inv.id2path(file_id)
            path_after = new_inv.id2path(file_id)
            if path_before != path_after:
                yield (path_before, path_after)
| 225 | ||
| 678
by Martin Pool - export to tarballs | 226 | |
| 227 | ||
| 228 | ######################################################################
 | |
| 229 | # export
 | |
| 230 | ||
def dir_exporter(tree, dest, root):
    """Export this tree to a new directory.

    `dest` should not exist, and will be created holding the
    contents of this tree.

    `root` is accepted because every exporter is called with the same
    arguments; it is not used here.

    Raises BzrError for an inventory entry that is neither a file nor
    a directory.

    TODO: To handle subdirectories we need to create the
           directories first.  (Directory entries are created as they
           are met, so this presumably relies on the inventory
           yielding a directory before its contents -- confirm.)

    :note: If the export fails, the destination directory will be
           left in a half-assed state.
    """
    import os
    os.mkdir(dest)
    mutter('export version %r' % tree)
    inv = tree.inventory
    for dp, ie in inv.iter_entries():
        kind = ie.kind
        fullpath = appendpath(dest, dp)
        if kind == 'directory':
            os.mkdir(fullpath)
        elif kind == 'file':
            # Fetch the source first so a failed lookup does not leave
            # an empty output file behind, then make sure the output
            # is closed (and therefore flushed) even if copying fails.
            source = tree.get_file(ie.file_id)
            target = open(fullpath, 'wb')
            try:
                pumpfile(source, target)
            finally:
                target.close()
        else:
            raise BzrError("don't know how to export {%s} of kind %r" % (ie.file_id, kind))
        mutter(" export {%s} kind %s to %s" % (ie.file_id, kind, fullpath))
exporters['dir'] = dir_exporter
| 258 | ||
| 259 | try: | |
| 260 | import tarfile | |
| 261 | except ImportError: | |
| 262 |     pass
 | |
| 263 | else: | |
def get_root_name(dest):
    """Get just the root name for a tarball.

    The directory part of `dest` is dropped, then a recognised
    tarball ending is stripped.  A name without a recognised ending
    is returned unchanged (apart from the directory part), so the
    result is always a string.

    >>> get_root_name('mytar.tar')
    'mytar'
    >>> get_root_name('mytar.tar.bz2')
    'mytar'
    >>> get_root_name('tar.tar.tar.tgz')
    'tar.tar.tar'
    >>> get_root_name('bzr-0.0.5.tar.gz')
    'bzr-0.0.5'
    >>> get_root_name('a/long/path/mytar.tgz')
    'mytar'
    >>> get_root_name('../parent/../dir/other.tbz2')
    'other'
    >>> get_root_name('some/dir/plain-name')
    'plain-name'
    """
    endings = ('.tar', '.tar.gz', '.tgz', '.tar.bz2', '.tbz2')
    dest = os.path.basename(dest)
    for end in endings:
        if dest.endswith(end):
            return dest[:-len(end)]
    # No known ending: use the bare file name rather than falling off
    # the end and handing None to the caller, which joins paths onto it.
    return dest
| 285 | ||
def tar_exporter(tree, dest, root, compression=None):
    """Export this tree to a new tar file.

    `dest` will be created holding the contents of this tree; if it
    already exists, it will be clobbered, like with "tar -c".

    `root` is the directory name that every member is placed under
    inside the archive; when it is None the name is derived from
    `dest` with get_root_name().

    `compression` is appended to the tarfile mode 'w:'; None or ''
    leaves the mode as plain 'w:'.

    Raises BzrError when tarfile reports a CompressionError, or for an
    inventory entry that is neither a file nor a directory.
    """
    from time import time
    now = time()
    compression = str(compression or '')
    if root is None:
        root = get_root_name(dest)
    try:
        ball = tarfile.open(dest, 'w:' + compression)
    except tarfile.CompressionError as e:
        raise BzrError(str(e))
    # Close the archive whatever happens, so a failure part-way
    # through does not leave the file handle open.
    try:
        mutter('export version %r' % tree)
        inv = tree.inventory
        for dp, ie in inv.iter_entries():
            mutter(" export {%s} kind %s to %s" % (ie.file_id, ie.kind, dest))
            item = tarfile.TarInfo(os.path.join(root, dp))
            # TODO: would be cool to actually set it to the timestamp of the
            # revision it was last changed
            item.mtime = now
            if ie.kind == 'directory':
                item.type = tarfile.DIRTYPE
                fileobj = None
                item.name += '/'
                item.size = 0
                item.mode = 0o755
            elif ie.kind == 'file':
                item.type = tarfile.REGTYPE
                fileobj = tree.get_file(ie.file_id)
                item.size = _find_file_size(fileobj)
                item.mode = 0o644
            else:
                raise BzrError("don't know how to export {%s} of kind %r" %
                               (ie.file_id, ie.kind))

            ball.addfile(item, fileobj)
    finally:
        ball.close()
exporters['tar'] = tar_exporter
| 327 | ||
def tgz_exporter(tree, dest, root):
    """Export `tree` through tar_exporter with 'gz' compression."""
    gzip_suffix = 'gz'
    tar_exporter(tree, dest, root, compression=gzip_suffix)
exporters['tgz'] = tgz_exporter
| 331 | ||
def tbz_exporter(tree, dest, root):
    """Export `tree` through tar_exporter with 'bz2' compression."""
    bzip2_suffix = 'bz2'
    tar_exporter(tree, dest, root, compression=bzip2_suffix)
exporters['tbz2'] = tbz_exporter
| 335 | ||
| 336 | ||
| 337 | def _find_file_size(fileobj): | |
| 338 | offset = fileobj.tell() | |
| 339 | try: | |
| 340 | fileobj.seek(0, 2) | |
| 341 | size = fileobj.tell() | |
| 342 | except TypeError: | |
| 343 |         # gzip doesn't accept second argument to seek()
 | |
| 344 | fileobj.seek(0) | |
| 345 | size = 0 | |
| 346 | while True: | |
| 347 | nread = len(fileobj.read()) | |
| 348 | if nread == 0: | |
| 349 |                 break
 | |
| 350 | size += nread | |
| 351 | fileobj.seek(offset) | |
| 352 | return size |