17
17
"""Read in a bundle stream, and process it into a BundleReader object."""
19
from __future__ import absolute_import
20
from cStringIO import StringIO
29
from bzrlib.bundle import apply_bundle
30
from bzrlib.errors import (TestamentMismatch, BzrError,
31
MalformedHeader, MalformedPatches, NotABundle)
32
from bzrlib.inventory import (Inventory, InventoryEntry,
33
InventoryDirectory, InventoryFile,
35
from bzrlib.osutils import sha_file, sha_string, pathjoin
36
from bzrlib.revision import Revision, NULL_REVISION
37
from bzrlib.testament import StrictTestament
38
from bzrlib.trace import mutter, warning
39
import bzrlib.transport
40
from bzrlib.tree import Tree
41
import bzrlib.urlutils
42
from bzrlib.xml5 import serializer_v5
30
from . import apply_bundle
31
from ..errors import (
35
from ..bzr.inventory import (
41
from ..osutils import sha_string, pathjoin
42
from ..revision import Revision, NULL_REVISION
43
from ..sixish import (
47
from ..testament import StrictTestament
48
from ..trace import mutter, warning
49
from ..tree import Tree
50
from ..bzr.xml5 import serializer_v5
45
53
class RevisionInfo(object):
278
286
if rev.revision_id != revision_id:
279
287
raise AssertionError()
280
288
if sha1 != rev.inventory_sha1:
281
open(',,bogus-inv', 'wb').write(s)
289
with open(',,bogus-inv', 'wb') as f:
282
291
warning('Inventory sha hash mismatch for revision %s. %s'
283
292
' != %s' % (revision_id, sha1, rev.inventory_sha1))
285
def _validate_revision(self, inventory, revision_id):
294
def _validate_revision(self, tree, revision_id):
286
295
"""Make sure all revision entries match their checksum."""
288
# This is a mapping from each revision id to it's sha hash
297
# This is a mapping from each revision id to its sha hash
291
300
rev = self.get_revision(revision_id)
460
468
class BundleTree(Tree):
461
470
def __init__(self, base_tree, revision_id):
462
471
self.base_tree = base_tree
463
472
self._renamed = {} # Mapping from old_path => new_path
464
473
self._renamed_r = {} # new_path => old_path
465
474
self._new_id = {} # new_path => new_id
466
475
self._new_id_r = {} # new_id => new_path
467
self._kinds = {} # new_id => kind
476
self._kinds = {} # new_path => kind
468
477
self._last_changed = {} # new_path => revision_id (looked up by path)
469
478
self._executable = {} # new_path => executable value (looked up by path)
470
479
self.patches = {} # new_path => patch for that file
614
623
in the text-store, so that the file contents would
627
file_id = self.path2id(path)
617
628
base_id = self.old_contents_id(file_id)
618
629
if (base_id is not None and
619
base_id != self.base_tree.inventory.root.file_id):
620
patch_original = self.base_tree.get_file(base_id)
630
base_id != self.base_tree.get_root_id()):
631
patch_original = self.base_tree.get_file(
632
self.base_tree.id2path(base_id), base_id)
622
634
patch_original = None
623
file_patch = self.patches.get(self.id2path(file_id))
635
file_patch = self.patches.get(path)
624
636
if file_patch is None:
625
637
if (patch_original is None and
626
self.get_kind(file_id) == 'directory'):
638
self.kind(path, file_id) == 'directory'):
628
640
if patch_original is None:
629
641
raise AssertionError("None: %s" % file_id)
630
642
return patch_original
634
646
'Malformed patch for %s, %r' % (file_id, file_patch))
635
647
return patched_file(file_patch, patch_original)
637
def get_symlink_target(self, file_id):
638
new_path = self.id2path(file_id)
640
return self._targets[new_path]
642
return self.base_tree.get_symlink_target(file_id)
644
def get_kind(self, file_id):
645
if file_id in self._kinds:
646
return self._kinds[file_id]
647
return self.base_tree.inventory[file_id].kind
649
def is_executable(self, file_id):
650
path = self.id2path(file_id)
649
def get_symlink_target(self, path, file_id=None):
651
return self._targets[path]
653
return self.base_tree.get_symlink_target(path, file_id)
655
def kind(self, path, file_id=None):
657
return self._kinds[path]
659
return self.base_tree.kind(path, file_id)
661
def get_file_revision(self, path, file_id=None):
    """Return the revision in which the file at ``path`` last changed.

    A revision recorded for ``path`` in ``self._last_changed`` takes
    precedence; otherwise the question is passed on to the base tree.

    :param path: Path of the file in this tree.
    :param file_id: Optional file id, forwarded unchanged to the base tree.
    :return: ``self._last_changed[path]`` when present, else the result of
        ``self.base_tree.get_file_revision(path, file_id)``.
    """
    if path in self._last_changed:
        return self._last_changed[path]
    return self.base_tree.get_file_revision(path, file_id)
667
def is_executable(self, path, file_id=None):
    """Return the executable flag for the file at ``path``.

    A value recorded for ``path`` in ``self._executable`` takes precedence;
    otherwise the base tree is asked.  The base tree is queried through its
    path-based ``is_executable`` rather than by indexing its inventory with
    ``file_id``, because ``file_id`` may be None.

    :param path: Path of the file in this tree.
    :param file_id: Optional file id, forwarded unchanged to the base tree.
    :return: ``self._executable[path]`` when present, else the result of
        ``self.base_tree.is_executable(path, file_id)``.
    """
    if path in self._executable:
        return self._executable[path]
    return self.base_tree.is_executable(path, file_id)
656
def get_last_changed(self, path, file_id=None):
    """Return the revision id that last changed the file at ``path``.

    A revision recorded for ``path`` in ``self._last_changed`` takes
    precedence; otherwise the base tree's ``get_file_revision`` is used.
    The lookup is by path, so no id-to-path translation is performed and
    the base tree's inventory is not indexed directly.

    :param path: Path of the file in this tree.
    :param file_id: Optional file id, forwarded unchanged to the base tree.
    :return: ``self._last_changed[path]`` when present, else the result of
        ``self.base_tree.get_file_revision(path, file_id)``.
    """
    if path in self._last_changed:
        return self._last_changed[path]
    return self.base_tree.get_file_revision(path, file_id)
662
def get_size_and_sha1(self, new_path, file_id=None):
    """Return the size and sha1 hash of the file at ``new_path``.

    If the bundle carries no patch for the file, its contents are the same
    as in the base tree, so both values are taken from ``self.base_tree``
    rather than by re-reading the file.  Otherwise the patched text is read
    in full and measured directly.

    :param new_path: Path of the file in this tree, or None.
    :param file_id: File id; used to locate the file in the base tree and
        forwarded to ``self.get_file``.
    :return: A ``(size, sha1)`` tuple; ``(None, None)`` when ``new_path``
        is None.
    """
    if new_path is None:
        return None, None
    if new_path not in self.patches:
        # If the entry does not have a patch, then the
        # contents must be the same as in the base_tree
        # NOTE(review): file_id defaults to None but is handed straight to
        # base_tree.id2path here -- confirm every caller supplies it.
        base_path = self.base_tree.id2path(file_id)
        text_size = self.base_tree.get_file_size(base_path, file_id)
        text_sha1 = self.base_tree.get_file_sha1(base_path, file_id)
        return text_size, text_sha1
    # A patch exists: materialise the patched text and hash it.
    fileobj = self.get_file(new_path, file_id)
    content = fileobj.read()
    return len(content), sha_string(content)
684
699
This needs to be called before ever accessing self.inventory
686
701
from os.path import dirname, basename
687
base_inv = self.base_tree.inventory
688
702
inv = Inventory(None, self.revision_id)
690
def add_entry(file_id):
691
path = self.id2path(file_id)
704
def add_entry(path, file_id):
697
708
parent_path = dirname(path)
698
709
parent_id = self.path2id(parent_path)
700
kind = self.get_kind(file_id)
701
revision_id = self.get_last_changed(file_id)
711
kind = self.kind(path, file_id)
712
revision_id = self.get_last_changed(path, file_id)
703
714
name = basename(path)
704
715
if kind == 'directory':
705
716
ie = InventoryDirectory(file_id, name, parent_id)
706
717
elif kind == 'file':
707
718
ie = InventoryFile(file_id, name, parent_id)
708
ie.executable = self.is_executable(file_id)
719
ie.executable = self.is_executable(path, file_id)
709
720
elif kind == 'symlink':
710
721
ie = InventoryLink(file_id, name, parent_id)
711
ie.symlink_target = self.get_symlink_target(file_id)
722
ie.symlink_target = self.get_symlink_target(path, file_id)
712
723
ie.revision = revision_id
714
if kind in ('directory', 'symlink'):
715
ie.text_size, ie.text_sha1 = None, None
717
ie.text_size, ie.text_sha1 = self.get_size_and_sha1(file_id)
718
if (ie.text_size is None) and (kind == 'file'):
719
raise BzrError('Got a text_size of None for file_id %r' % file_id)
726
ie.text_size, ie.text_sha1 = self.get_size_and_sha1(
728
if ie.text_size is None:
730
'Got a text_size of None for file_id %r' % file_id)
722
733
sorted_entries = self.sorted_path_id()
723
734
for path, file_id in sorted_entries:
735
add_entry(path, file_id)
732
743
# at that instant
733
744
inventory = property(_get_inventory)
736
for path, entry in self.inventory.iter_entries():
746
root_inventory = property(_get_inventory)
748
def all_file_ids(self):
    """Return the set of file ids of every entry in ``self.inventory``."""
    return {entry.file_id for path, entry in self.inventory.iter_entries()}
751
def all_versioned_paths(self):
    """Return the set of paths of every entry in ``self.inventory``."""
    return {path for path, entry in self.inventory.iter_entries()}
754
def list_files(self, include_root=False, from_dir=None, recursive=True):
755
# The only files returned by this are those from the version
760
from_dir_id = inv.path2id(from_dir)
761
if from_dir_id is None:
762
# Directory not versioned
764
entries = inv.iter_entries(from_dir=from_dir_id, recursive=recursive)
765
if inv.root is not None and not include_root and from_dir is None:
766
# skip the root for compatibility with the current APIs.
768
for path, entry in entries:
769
yield path, 'V', entry.kind, entry.file_id, entry
739
771
def sorted_path_id(self):
741
for result in self._new_id.iteritems():
773
for result in viewitems(self._new_id):
742
774
paths.append(result)
743
for id in self.base_tree:
775
for id in self.base_tree.all_file_ids():
744
776
path = self.id2path(id)
752
784
def patched_file(file_patch, original):
    """Produce a file-like object with the patched version of a text.

    :param file_patch: The patch text for one file.  It is wrapped in
        ``BytesIO`` so that it can be split into lines.
    :param original: The unpatched text, handed to ``iter_patched`` as-is
        (callers in this module pass the base tree's file object, or None).
    :return: An ``IterableFile`` yielding the patched content; an empty
        ``IterableFile`` when the patch is empty.
    """
    from breezy.patches import iter_patched
    from breezy.iterablefile import IterableFile
    # Test for emptiness by truth value rather than ``== ""``: a byte-string
    # patch never compares equal to a text literal on Python 3, which would
    # leave this shortcut unreachable.  None is deliberately not treated as
    # empty so that it is still passed through as before.
    if file_patch is not None and not file_patch:
        return IterableFile(())
    # string.splitlines(True) also splits on '\r', but the iter_patched code
    # only expects to iterate over '\n' style lines
    patch_lines = BytesIO(file_patch).readlines()
    return IterableFile(iter_patched(original, patch_lines))