/brz/remove-bazaar

To get this branch, use:
bzr branch http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar
#! /usr/bin/python
#
# Copyright (C) 2005 Canonical Ltd
#
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation; either version 2 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program; if not, write to the Free Software
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA

"""Experiment in converting existing bzr branches to weaves."""

# To make this properly useful
#
# 1. assign text version ids, and put those text versions into
#    the inventory as they're converted.
#
# 2. keep track of the previous version of each file, rather than
#    just using the last one imported
#
# 3. assign entry versions when files are added, renamed or moved.
#
# 4. when merged-in versions are observed, walk down through them
#    to discover everything, then commit bottom-up
#
# 5. track ancestry as things are merged in, and commit that in each
#    revision
#
# Perhaps it's best to first walk the whole graph and make a plan for
# what should be imported in what order?  Need a kind of topological
# sort of all revisions.  (Or do we, can we just before doing a revision
# see that all its parents have either been converted or abandoned?)
41
1300 by Martin Pool
- refactor weave upgrade into a MethodObject
42
# Optional psyco start-up.  The constant-false guard means this never runs;
# flip it to True to try psyco.full() when the psyco module is importable.
if False:
    try:
        import psyco
        psyco.full()
    except ImportError:
        # psyco is optional: carry on without it.
        pass
1083 by Martin Pool
- add space to store revision-id in weave files
48
1080 by Martin Pool
- test tool for converting history to weave files
49
1267 by Martin Pool
- notes on conversion of existing history to weaves
50
import tempfile
51
import hotshot, hotshot.stats
52
import sys
1132 by Martin Pool
- fix up logging for history2weaves tool
53
import logging
1300 by Martin Pool
- refactor weave upgrade into a MethodObject
54
import time
1132 by Martin Pool
- fix up logging for history2weaves tool
55
1290 by Martin Pool
- clean up imports
56
from bzrlib.branch import Branch, find_branch
1080 by Martin Pool
- test tool for converting history to weave files
57
from bzrlib.revfile import Revfile
58
from bzrlib.weave import Weave
59
from bzrlib.weavefile import read_weave, write_weave
60
from bzrlib.progress import ProgressBar
61
from bzrlib.atomicfile import AtomicFile
1300 by Martin Pool
- refactor weave upgrade into a MethodObject
62
from bzrlib.xml4 import serializer_v4
63
from bzrlib.xml5 import serializer_v5
1132 by Martin Pool
- fix up logging for history2weaves tool
64
import bzrlib.trace
1267 by Martin Pool
- notes on conversion of existing history to weaves
65
66
1080 by Martin Pool
- test tool for converting history to weave files
67
1300 by Martin Pool
- refactor weave upgrade into a MethodObject
68
class Convert(object):
    """Method object that converts a branch's history to weaves.

    Constructing an instance runs the whole conversion: __init__ resets
    the counters and immediately calls convert().  All working state is
    kept on the instance so the per-revision helpers can share it.
    """

    def __init__(self):
        self.total_revs = 0
        self.converted_revs = 0
        self.text_count = 0
        self.convert()

    def convert(self):
        """Walk the revision history of the branch at '.' and convert it.

        Sets up logging, the progress bar and the in-memory weaves, feeds
        every revision id from the branch's revision history to
        _convert_one_rev() in history order, prints a summary and finally
        calls _write_all_weaves().
        """
        bzrlib.trace.enable_default_logging()
        self.pb = ProgressBar()
        self.inv_weave = Weave('__inventory')
        self.anc_weave = Weave('__ancestry')

        # Last text sha1 seen for each file id; read and updated by
        # _convert_one_rev, hence an attribute rather than a local.
        self.last_text_sha = {}

        # holds in-memory weaves for all files
        self.text_weaves = {}

        b = self.branch = Branch('.', relax_version_check=True)

        self.revno = 1
        rev_history = b.revision_history()
        # Weave index of the previously added inventory (empty at start).
        self.inv_parents = []

        # todo is a stack holding the revisions we still need to process;
        # appending to it adds new highest-priority revisions
        todo = rev_history[:]
        todo.reverse()
        self.total_revs = len(todo)

        while todo:
            self._convert_one_rev(todo.pop())

        self.pb.clear()
        # Single-argument parenthesised form prints identically under
        # Python 2's print statement and Python 3's print function.
        print('upgraded to weaves:')
        print('  %6d revisions and inventories' % self.converted_revs)
        print('  %6d texts' % self.text_count)

        self._write_all_weaves()

    def _write_all_weaves(self):
        """Write the inventory, ancestry and text weaves to disk.

        Currently a no-op: the marked early return below short-circuits
        the method, so nothing is written and None is returned.
        """
        i = 0
        # Everything after this return is unreachable until it is removed.
        return ############################################
        # TODO: commit them all atomically at the end, not one by one
        write_atomic_weave(self.inv_weave, 'weaves/inventory.weave')
        write_atomic_weave(self.anc_weave, 'weaves/ancestry.weave')
        for file_id, file_weave in self.text_weaves.items():
            self.pb.update('writing weave', i, len(self.text_weaves))
            write_atomic_weave(file_weave, 'weaves/%s.weave' % file_id)
            i += 1

        self.pb.clear()

    def _convert_one_rev(self, rev_id):
        """Process the single revision `rev_id`.

        Bumps the progress bar, reads the stored revision and inventory
        XML for `rev_id` from the branch and parses both with the v4
        serializer.  The marked early return then stops the method; the
        weave-building code after it is not executed yet.
        """
        self._bump_progress()
        b = self.branch
        rev_xml = b.revision_store[rev_id].read()
        inv_xml = b.inventory_store[rev_id].read()

        rev = serializer_v4.read_revision_from_string(rev_xml)
        inv = serializer_v4.read_inventory_from_string(inv_xml)

        # Everything after this return is unreachable until it is removed.
        return ##########################################

        new_idx = self.inv_weave.add(rev_id, self.inv_parents, inv_xml)
        self.inv_parents = [new_idx]

        tree = b.revision_tree(rev_id)
        inv = tree.inventory

        # for each file in the inventory, put it into its own revfile
        for file_id in inv:
            ie = inv[file_id]
            if ie.kind != 'file':
                continue
            if self.last_text_sha.get(file_id) == ie.text_sha1:
                # same as last time
                continue
            self.last_text_sha[file_id] = ie.text_sha1

            # new text (though possibly already stored); need to store it
            text_lines = tree.get_file(file_id).readlines()

            # if the file's created for the first time in this
            # revision then make a new weave; else find the old one
            if file_id not in self.text_weaves:
                self.text_weaves[file_id] = Weave()

            w = self.text_weaves[file_id]

            # base the new text version off whatever was last
            # (actually it'd be better to track this, to allow for
            # files that are deleted and then reappear)
            last = len(w)
            if last == 0:
                parents = []
            else:
                parents = [last-1]

            w.add(rev_id, parents, text_lines)
            self.text_count += 1

        self.revno += 1

    def _bump_progress(self):
        """Count one more processed revision and refresh the progress bar."""
        self.converted_revs += 1
        self.pb.update('converting revisions',
                       self.converted_revs,
                       self.total_revs)
1087 by Martin Pool
- add a tool script to convert past history into weaves
182
183
184
def write_atomic_weave(weave, filename):
    """Write `weave` to `filename` through an AtomicFile.

    The weave is serialised with write_weave() and the file is then
    committed.  The file object is closed in all cases, whether or not
    the write and commit succeeded.
    """
    out_file = AtomicFile(filename)
    try:
        write_weave(weave, out_file)
        out_file.commit()
    finally:
        # NOTE(review): presumably closing an uncommitted AtomicFile
        # abandons the partial write -- confirm against bzrlib.atomicfile.
        out_file.close()
191
1087 by Martin Pool
- add a tool script to convert past history into weaves
192
    
1080 by Martin Pool
- test tool for converting history to weave files
193
194
195
def profile_convert():
    """Run the conversion under the hotshot profiler and print the stats.

    Profile data is collected into a named temporary file, loaded back,
    sorted by time and the top 20 entries are printed.  The profiler and
    the temporary file are closed even if the conversion raises.
    """
    prof_f = tempfile.NamedTemporaryFile()
    try:
        prof = hotshot.Profile(prof_f.name)
        try:
            prof.runcall(Convert)
        finally:
            # Close the profiler before the data file is read back.
            prof.close()

        stats = hotshot.stats.load(prof_f.name)
        ##stats.strip_dirs()
        stats.sort_stats('time')
        # XXX: Might like to write to stderr or the trace file instead but
        # print_stats seems hardcoded to stdout
        stats.print_stats(20)
    finally:
        prof_f.close()
209
            
210
211
# Script entry point: a -p argument anywhere on the command line runs the
# conversion under the profiler; otherwise it is run directly.
if '-p' in sys.argv[1:]:
    profile_convert()
else:
    Convert()
1080 by Martin Pool
- test tool for converting history to weave files
215