/brz/remove-bazaar

To get this branch, use:
bzr branch http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar
0.78.3 by Ian Clatworthy
move GenericCacheManager into its own module
1
# Copyright (C) 2009 Canonical Ltd
2
#
3
# This program is free software; you can redistribute it and/or modify
4
# it under the terms of the GNU General Public License as published by
5
# the Free Software Foundation; either version 2 of the License, or
6
# (at your option) any later version.
7
#
8
# This program is distributed in the hope that it will be useful,
9
# but WITHOUT ANY WARRANTY; without even the implied warranty of
10
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
11
# GNU General Public License for more details.
12
#
13
# You should have received a copy of the GNU General Public License
14
# along with this program; if not, write to the Free Software
15
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
16
17
"""A manager of caches."""
18
19
0.64.153 by Ian Clatworthy
clear caches before packing; show cache stats in verbose mode
20
from bzrlib import lru_cache, trace
21
from bzrlib.plugins.fastimport import helpers
0.64.118 by Ian Clatworthy
fix lru_cache import
22
0.78.3 by Ian Clatworthy
move GenericCacheManager into its own module
23
class CacheManager(object):
    """A manager of the in-memory caches used while importing a stream.

    The manager holds blob data, an LRU cache of inventories, the lookup
    tables for revision-ids and file-ids, and the head-tracking state
    (last ref seen, last commit id per ref, and the current heads).
    """

    def __init__(self, info=None, verbose=False, inventory_cache_size=10):
        """Create a manager of caches.

        :param info: a ConfigObj holding the output from
            the --info processor, or None if no hints are available
        :param verbose: flag stored as ``self.verbose``; this class does
            not otherwise consult it
        :param inventory_cache_size: value handed to
            ``lru_cache.LRUCache`` when creating the inventory cache
            (presumably the maximum number of inventories kept - confirm
            against bzrlib.lru_cache)
        """
        self.verbose = verbose

        # dataref -> data. dataref is either :mark or the sha-1.
        # Sticky blobs aren't removed after being referenced.
        self._blobs = {}
        self._sticky_blobs = {}

        # revision-id -> Inventory cache
        # these are large and we probably don't need too many as
        # most parents are recent in history
        self.inventories = lru_cache.LRUCache(inventory_cache_size)

        # import commit-ids -> revision-id lookup table
        # we need to keep all of these but they are small
        self.revision_ids = {}

        # path -> file-ids - as generated
        self.file_ids = {}

        # Head tracking: last ref, last id per ref & map of commit ids to ref*s*
        self.last_ref = None
        self.last_ids = {}
        self.heads = {}

        # Work out the blobs to make sticky - None means all
        self._blobs_to_keep = None
        if info is not None:
            try:
                self._blobs_to_keep = info['Blob usage tracking']['multi']
            except KeyError:
                # info not in file - possible when no blobs used
                pass

    def dump_stats(self, note=trace.note):
        """Dump some statistics about what we cached.

        :param note: callable invoked with each line of output
        """
        # TODO: add in inventory statistics
        note("Cache statistics:")
        self._show_stats_for(self._sticky_blobs, "sticky blobs", note=note)
        self._show_stats_for(self.revision_ids, "revision-ids", note=note)
        self._show_stats_for(self.file_ids, "file-ids", note=note)
        # These aren't interesting so omit from the output, at least for now
        #self._show_stats_for(self._blobs, "other blobs", note=note)
        #self._show_stats_for(self.last_ids, "last-ids", note=note)
        #self._show_stats_for(self.heads, "heads", note=note)

    def _show_stats_for(self, dict, label, note=trace.note):
        """Dump statistics about a given dictionary.

        Both the keys and the values need to support len().

        :param dict: the dictionary to report on (the name shadows the
            builtin but is kept so existing callers keep working)
        :param label: short name printed in front of the figures
        :param note: callable invoked with the formatted line
        """
        count = len(dict)
        # The reported size is the summed len() of every key and value,
        # not the real memory footprint of the dictionary.
        size = sum(len(key) + len(value) for key, value in dict.items())
        kbytes = size / 1024.0
        note("    %-12s: %8.1f kB (%d %s)" % (label, kbytes, count,
            helpers.single_plural(count, "item", "items")))

    def clear_all(self):
        """Free up any memory used by the caches."""
        self._blobs.clear()
        self._sticky_blobs.clear()
        self.revision_ids.clear()
        self.file_ids.clear()
        self.last_ids.clear()
        self.heads.clear()
        self.inventories.clear()

    def store_blob(self, id, data):
        """Store a blob of data.

        The blob is made sticky when no hints are available, when the
        data is the empty string, or when the id is among the blobs to
        keep; otherwise it is stored as a one-shot blob.

        :param id: the dataref the blob is stored under
        :param data: the blob content
        """
        if (self._blobs_to_keep is None or data == '' or
            id in self._blobs_to_keep):
            self._sticky_blobs[id] = data
        else:
            self._blobs[id] = data

    def fetch_blob(self, id):
        """Fetch a blob of data.

        Sticky blobs stay cached; any other blob is removed from the
        cache as it is returned.

        :param id: the dataref the blob was stored under
        :return: the blob content
        :raises KeyError: if no blob is cached under that id
        """
        try:
            return self._sticky_blobs[id]
        except KeyError:
            return self._blobs.pop(id)

    def delete_path(self, path):
        """Remove a path from caches."""
        # we actually want to remember what file-id we gave a path,
        # even when that file is deleted, so doing nothing is correct
        pass

    def rename_path(self, old_path, new_path):
        """Rename a path in the caches.

        :param old_path: the path currently holding the file-id
        :param new_path: the path that takes over the file-id
        :raises KeyError: if old_path has no file-id recorded
        """
        # In this case, we need to forget the file-id we gave a path,
        # otherwise, we'll get duplicate file-ids in the repository.
        # Popping before assigning keeps the entry intact when old_path
        # and new_path are the same.
        self.file_ids[new_path] = self.file_ids.pop(old_path)

    def track_heads(self, cmd):
        """Track the repository heads given a CommitCommand.

        The first parent is cmd.from_ when given, otherwise the last
        commit id seen on cmd.ref (if any); cmd.merges are appended.

        :param cmd: the CommitCommand
        :return: the list of parents in terms of commit-ids
        """
        # Get the true set of parents
        if cmd.from_ is not None:
            parents = [cmd.from_]
        else:
            last_id = self.last_ids.get(cmd.ref)
            if last_id is not None:
                parents = [last_id]
            else:
                parents = []
        parents.extend(cmd.merges)

        # Track the heads
        self.track_heads_for_ref(cmd.ref, cmd.id, parents)
        return parents

    def track_heads_for_ref(self, cmd_ref, cmd_id, parents=None):
        """Record cmd_id as a head of cmd_ref.

        :param cmd_ref: the ref the commit was made on
        :param cmd_id: the commit id that becomes a head
        :param parents: commit ids that stop being heads because cmd_id
            descends from them, or None to leave existing heads alone
        """
        if parents is not None:
            for parent in parents:
                # A parent that is not currently a head is simply ignored.
                self.heads.pop(parent, None)
        self.heads.setdefault(cmd_id, set()).add(cmd_ref)
        self.last_ids[cmd_ref] = cmd_id
        self.last_ref = cmd_ref