~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to tools/history2weaves.py

Committer: Martin Pool
Date: 2005-09-13 01:37:23 UTC
Revision ID: mbp@sourcefrog.net-20050913013723-7e0026b48cbf08ff

- BROKEN: start refactoring fetch code to work well with weaves

files removed:
bzrlib/selftest/test_ancestry.py

bzrlib/selftest/test_commit.py

bzrlib/xml4.py

files renamed:
bzrlib/selftest/test_weave.py => tools/testweave.py

files modified:
.bzrignore

NEWS

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/check.py

bzrlib/commit.py

bzrlib/errors.py

bzrlib/fetch.py

bzrlib/hashcache.py

bzrlib/info.py

bzrlib/inventory.py

bzrlib/merge.py

bzrlib/osutils.py

bzrlib/revision.py

bzrlib/selftest/__init__.py

bzrlib/selftest/blackbox.py

bzrlib/selftest/test_xml.py

bzrlib/selftest/testbranch.py

bzrlib/selftest/testfetch.py

bzrlib/selftest/testhashcache.py

bzrlib/selftest/testrevision.py

bzrlib/selftest/versioning.py

bzrlib/selftest/whitebox.py

bzrlib/store.py

bzrlib/trace.py

bzrlib/upgrade.py

bzrlib/weave.py

bzrlib/weavestore.py

bzrlib/workingtree.py

bzrlib/xml.py

tools/history2weaves.py

Show diffs side-by-side

added added

removed removed

tools/history2weaves.py

#! /usr/bin/python

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

"""Experiment in converting existing bzr branches to weaves."""

# To make this properly useful

# 1. assign text version ids, and put those text versions into

# the inventory as they're converted.

# 2. keep track of the previous version of each file, rather than

# just using the last one imported

# 3. assign entry versions when files are added, renamed or moved.

# 4. when merged-in versions are observed, walk down through them

# to discover everything, then commit bottom-up

# 5. track ancestry as things are merged in, and commit that in each

# revision

# Perhaps it's best to first walk the whole graph and make a plan for

# what should be imported in what order? Need a kind of topological

# sort of all revisions. (Or do we? Can we just check, before doing a

# revision, that all its parents have either been converted or abandoned?)

if False:

try:

import psyco

psyco.full()

except ImportError:

pass

import tempfile

import hotshot, hotshot.stats

import sys

try:

import psyco

psyco.full()

except ImportError:

pass

import logging

import time

from bzrlib.branch import Branch, find_branch

import bzrlib.branch

from bzrlib.revfile import Revfile

from bzrlib.weave import Weave

from bzrlib.weavefile import read_weave, write_weave

from bzrlib.progress import ProgressBar

from bzrlib.atomicfile import AtomicFile

from bzrlib.xml4 import serializer_v4

from bzrlib.xml5 import serializer_v5

import bzrlib.trace

class Convert(object):

def __init__(self):

self.total_revs = 0

self.converted_revs = 0

self.text_count = 0

self.convert()

def convert(self):

bzrlib.trace.enable_default_logging()

self.pb = ProgressBar()

self.inv_weave = Weave('__inventory')

self.anc_weave = Weave('__ancestry')

last_text_sha = {}

# holds in-memory weaves for all files

text_weaves = {}

b = self.branch = Branch('.', relax_version_check=True)

revno = 1

rev_history = b.revision_history()

last_idx = None

inv_parents = []

# todo is a stack holding the revisions we still need to process;

# appending to it adds new highest-priority revisions

todo = rev_history[:]

todo.reverse()

self.total_revs = len(todo)

100

101

while todo:

102

self._convert_one_rev(todo.pop())

103

104

self.pb.clear()

105

print 'upgraded to weaves:'

106

print ' %6d revisions and inventories' % self.converted_revs

107

print ' %6d texts' % self.text_count

108

109

self._write_all_weaves()

110

111

112

def _write_all_weaves(self):

113

i = 0

114

return ############################################

115

# TODO: commit them all atomically at the end, not one by one

116

write_atomic_weave(self.inv_weave, 'weaves/inventory.weave')

117

write_atomic_weave(self.anc_weave, 'weaves/ancestry.weave')

118

for file_id, file_weave in text_weaves.items():

119

self.pb.update('writing weave', i, len(text_weaves))

120

write_atomic_weave(file_weave, 'weaves/%s.weave' % file_id)

121

i += 1

122

123

self.pb.clear()

124

125

126

def _convert_one_rev(self, rev_id):

127

self._bump_progress()

128

b = self.branch

129

rev_xml = b.revision_store[rev_id].read()

130

inv_xml = b.inventory_store[rev_id].read()

131

132

rev = serializer_v4.read_revision_from_string(rev_xml)

133

inv = serializer_v4.read_inventory_from_string(inv_xml)

134

135

return ##########################################

136

137

new_idx = self.inv_weave.add(rev_id, inv_parents, inv_xml)

import tempfile

import hotshot, hotshot.stats

import sys

def convert():

bzrlib.trace.enable_default_logging()

pb = ProgressBar()

inv_weave = Weave()

last_text_sha = {}

# holds in-memory weaves for all files

text_weaves = {}

b = bzrlib.branch.find_branch('.')

revno = 1

rev_history = b.revision_history()

last_idx = None

inv_parents = []

text_count = 0

for rev_id in rev_history:

pb.update('converting revision', revno, len(rev_history))

inv_xml = b.get_inventory_xml(rev_id).readlines()

new_idx = inv_weave.add(rev_id, inv_parents, inv_xml)

138

inv_parents = [new_idx]

139

140

tree = b.revision_tree(rev_id)

157

# revision then make a new weave; else find the old one

158

if file_id not in text_weaves:

159

text_weaves[file_id] = Weave()

160

161

w = text_weaves[file_id]

162

163

# base the new text version off whatever was last

173

102

text_count += 1

174

103

175

104

revno += 1

176

177

def _bump_progress(self):

178

self.converted_revs += 1

179

self.pb.update('converting revisions',

180

self.converted_revs,

181

self.total_revs)

105

106

pb.clear()

107

print '%6d revisions and inventories' % revno

108

print '%6d texts' % text_count

109

110

i = 0

111

# TODO: commit them all atomically at the end, not one by one

112

write_atomic_weave(inv_weave, 'weaves/inventory.weave')

113

for file_id, file_weave in text_weaves.items():

114

pb.update('writing weave', i, len(text_weaves))

115

write_atomic_weave(file_weave, 'weaves/%s.weave' % file_id)

116

i += 1

117

118

pb.clear()

182

119

183

120

184

121

def write_atomic_weave(weave, filename):

197

134

198

135

prof = hotshot.Profile(prof_f.name)

199

136

200

prof.runcall(Convert)

137

prof.runcall(convert)

201

138

prof.close()

202

139

203

140

stats = hotshot.stats.load(prof_f.name)

204

##stats.strip_dirs()

141

#stats.strip_dirs()

205

142

stats.sort_stats('time')

206

# XXX: Might like to write to stderr or the trace file instead but

207

# print_stats seems hardcoded to stdout

143

## XXX: Might like to write to stderr or the trace file instead but

144

## print_stats seems hardcoded to stdout

208

145

stats.print_stats(20)

209

146

210

147

211

148

if '-p' in sys.argv[1:]:

212

149

profile_convert()

213

150

else:

214

Convert()

151

convert()

215

152

Older »