~bzr-pqm/bzr/bzr.dev

1080 by Martin Pool
- test tool for converting history to weave files
1
#! /usr/bin/python
1267 by Martin Pool
- notes on conversion of existing history to weaves
2
#
1080 by Martin Pool
- test tool for converting history to weave files
3
# Copyright (C) 2005 Canonical Ltd
1267 by Martin Pool
- notes on conversion of existing history to weaves
4
#
1080 by Martin Pool
- test tool for converting history to weave files
5
# This program is free software; you can redistribute it and/or modify
6
# it under the terms of the GNU General Public License as published by
7
# the Free Software Foundation; either version 2 of the License, or
8
# (at your option) any later version.
1267 by Martin Pool
- notes on conversion of existing history to weaves
9
#
1080 by Martin Pool
- test tool for converting history to weave files
10
# This program is distributed in the hope that it will be useful,
11
# but WITHOUT ANY WARRANTY; without even the implied warranty of
12
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
13
# GNU General Public License for more details.
1267 by Martin Pool
- notes on conversion of existing history to weaves
14
#
1080 by Martin Pool
- test tool for converting history to weave files
15
# You should have received a copy of the GNU General Public License
16
# along with this program; if not, write to the Free Software
17
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
18
19
"""Experiment in converting existing bzr branches to weaves."""
20
1267 by Martin Pool
- notes on conversion of existing history to weaves
21
# To make this properly useful
22
#
23
# 1. assign text version ids, and put those text versions into
24
#    the inventory as they're converted.
25
#
26
# 2. keep track of the previous version of each file, rather than
27
#    just using the last one imported
28
#
29
# 3. assign entry versions when files are added, renamed or moved.
30
#
31
# 4. when merged-in versions are observed, walk down through them
32
#    to discover everything, then commit bottom-up
33
#
34
# 5. track ancestry as things are merged in, and commit that in each
35
#    revision
36
#
37
# Perhaps it's best to first walk the whole graph and make a plan for
38
# what should be imported in what order?  Need a kind of topological
39
# sort of all revisions.  (Or do we, can we just before doing a revision
40
# see that all its parents have either been converted or abandoned?)
41
1083 by Martin Pool
- add space to store revision-id in weave files
42
try:
43
    import psyco
44
    psyco.full()
45
except ImportError:
46
    pass
47
1080 by Martin Pool
- test tool for converting history to weave files
48
1267 by Martin Pool
- notes on conversion of existing history to weaves
49
import tempfile
50
import hotshot, hotshot.stats
51
import sys
1132 by Martin Pool
- fix up logging for history2weaves tool
52
import logging
53
1290 by Martin Pool
- clean up imports
54
from bzrlib.branch import Branch, find_branch
1080 by Martin Pool
- test tool for converting history to weave files
55
from bzrlib.revfile import Revfile
56
from bzrlib.weave import Weave
57
from bzrlib.weavefile import read_weave, write_weave
58
from bzrlib.progress import ProgressBar
59
from bzrlib.atomicfile import AtomicFile
1132 by Martin Pool
- fix up logging for history2weaves tool
60
import bzrlib.trace
1267 by Martin Pool
- notes on conversion of existing history to weaves
61
62
1080 by Martin Pool
- test tool for converting history to weave files
63
64
def convert():
    """Convert the history of the branch in the current directory to weaves.

    Every revision in the branch's revision history is visited in order.
    The inventory XML of each revision is added to one in-memory inventory
    weave, and every file text whose sha1 differs from the previously
    stored one for that file is added to a per-file in-memory weave.

    When all revisions have been processed, a summary is printed and the
    weaves are written to 'weaves/inventory.weave' and
    'weaves/<file_id>.weave'.
    """
    bzrlib.trace.enable_default_logging()

    pb = ProgressBar()

    inv_weave = Weave()

    # file_id -> text_sha1 of the version most recently added to its weave
    last_text_sha = {}

    # holds in-memory weaves for all files, keyed by file_id
    text_weaves = {}

    b = Branch('.', relax_version_check=True)

    rev_history = b.revision_history()
    rev_count = len(rev_history)
    inv_parents = []
    text_count = 0

    for rev_idx, rev_id in enumerate(rev_history):
        # progress is reported with 1-based revision numbers
        pb.update('converting revision', rev_idx + 1, rev_count)

        inv_xml = b.get_inventory_xml(rev_id).readlines()

        # each inventory version has the previous one as its only parent
        new_idx = inv_weave.add(rev_id, inv_parents, inv_xml)
        inv_parents = [new_idx]

        tree = b.revision_tree(rev_id)
        inv = tree.inventory

        # for each file in the inventory, put it into its own weave
        for file_id in inv:
            ie = inv[file_id]
            if ie.kind != 'file':
                continue
            if last_text_sha.get(file_id) == ie.text_sha1:
                # same as last time
                continue
            last_text_sha[file_id] = ie.text_sha1

            # new text (though possibly already stored); need to store it
            text_lines = tree.get_file(file_id).readlines()

            # if the file's created for the first time in this
            # revision then make a new weave; else find the old one
            if file_id not in text_weaves:
                text_weaves[file_id] = Weave()

            w = text_weaves[file_id]

            # base the new text version off whatever was last
            # (actually it'd be better to track this, to allow for
            # files that are deleted and then reappear)
            last = len(w)
            if last == 0:
                parents = []
            else:
                parents = [last - 1]

            w.add(rev_id, parents, text_lines)
            text_count += 1

    pb.clear()
    # Report the number of revisions actually converted.  (A running
    # 1-based counter would be one too high once the loop has finished.)
    print('%6d revisions and inventories' % rev_count)
    print('%6d texts' % text_count)

    # TODO: commit them all atomically at the end, not one by one
    write_atomic_weave(inv_weave, 'weaves/inventory.weave')
    for i, (file_id, file_weave) in enumerate(text_weaves.items()):
        pb.update('writing weave', i, len(text_weaves))
        write_atomic_weave(file_weave, 'weaves/%s.weave' % file_id)

    pb.clear()
142
143
144
def write_atomic_weave(weave, filename):
    """Write `weave` to `filename` by way of an AtomicFile.

    The file is committed only when write_weave() returns without raising;
    close() is called on the AtomicFile in every case.
    """
    out_file = AtomicFile(filename)
    try:
        write_weave(weave, out_file)
        out_file.commit()
    finally:
        out_file.close()
151
1087 by Martin Pool
- add a tool script to convert past history into weaves
152
    
1080 by Martin Pool
- test tool for converting history to weave files
153
154
155
def profile_convert():
    """Run convert() under the hotshot profiler and print the top 20 entries.

    Profile data is recorded in a named temporary file, loaded back, sorted
    by 'time' and printed.
    """
    profile_file = tempfile.NamedTemporaryFile()
    profile_path = profile_file.name

    profiler = hotshot.Profile(profile_path)
    profiler.runcall(convert)
    profiler.close()

    # XXX: Might like to write to stderr or the trace file instead but
    # print_stats seems hardcoded to stdout
    hotshot.stats.load(profile_path).sort_stats('time').print_stats(20)
169
            
170
171
# Run the conversion; a '-p' argument runs it under the profiler instead.
if '-p' not in sys.argv[1:]:
    convert()
else:
    profile_convert()
175