~bzr-pqm/bzr/bzr.dev

485 by Martin Pool
- move commit code into its own module
1
# Copyright (C) 2005 Canonical Ltd
2
3
# This program is free software; you can redistribute it and/or modify
4
# it under the terms of the GNU General Public License as published by
5
# the Free Software Foundation; either version 2 of the License, or
6
# (at your option) any later version.
7
8
# This program is distributed in the hope that it will be useful,
9
# but WITHOUT ANY WARRANTY; without even the implied warranty of
10
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
11
# GNU General Public License for more details.
12
13
# You should have received a copy of the GNU General Public License
14
# along with this program; if not, write to the Free Software
15
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
16
17
1194 by Martin Pool
- [BROKEN] more progress of commit into weaves
18
## XXX: Can we do any better about making interrupted commits change
19
## nothing?
20
21
## XXX: If we merged two versions of a file then we still need to
22
## create a new version representing that merge, even if it didn't
23
## change from the parent.
1189 by Martin Pool
- BROKEN: partial support for commit into weave
24
25
## TODO: Read back the just-generated changeset, and make sure it
26
## applies and recreates the right state.
27
28
1194 by Martin Pool
- [BROKEN] more progress of commit into weaves
29
30
1189 by Martin Pool
- BROKEN: partial support for commit into weave
31
import os
32
import sys
1188 by Martin Pool
- clean up imports in commit code
33
import time
34
import tempfile
1194 by Martin Pool
- [BROKEN] more progress of commit into weaves
35
import sha
36
1188 by Martin Pool
- clean up imports in commit code
37
from binascii import hexlify
1194 by Martin Pool
- [BROKEN] more progress of commit into weaves
38
from cStringIO import StringIO
1188 by Martin Pool
- clean up imports in commit code
39
40
from bzrlib.osutils import (local_time_offset, username,
41
                            rand_bytes, compact_date, user_email,
42
                            kind_marker, is_inside_any, quotefn,
1189 by Martin Pool
- BROKEN: partial support for commit into weave
43
                            sha_string, sha_file, isdir, isfile)
1188 by Martin Pool
- clean up imports in commit code
44
from bzrlib.branch import gen_file_id
45
from bzrlib.errors import BzrError, PointlessCommit
46
from bzrlib.revision import Revision, RevisionReference
47
from bzrlib.trace import mutter, note
1189 by Martin Pool
- BROKEN: partial support for commit into weave
48
from bzrlib.xml5 import serializer_v5
1188 by Martin Pool
- clean up imports in commit code
49
from bzrlib.inventory import Inventory
1189 by Martin Pool
- BROKEN: partial support for commit into weave
50
from bzrlib.delta import compare_trees
51
from bzrlib.weave import Weave
52
from bzrlib.weavefile import read_weave, write_weave_v5
53
from bzrlib.atomicfile import AtomicFile
54
55
1205 by Martin Pool
- add bzrlib.commit.commit compatability interface
56
def commit(*args, **kwargs):
    """Commit a new revision to a branch.

    Function-style interface for convenience of old callers.  All
    positional and keyword arguments are passed unchanged to
    Commit().commit(); nothing is returned.

    New code should use the Commit class instead.
    """
    Commit().commit(*args, **kwargs)
64
65
1189 by Martin Pool
- BROKEN: partial support for commit into weave
66
class NullCommitReporter(object):
    """I report on progress of a commit.

    Every hook in this class does nothing and returns None.
    """

    def added(self, path):
        """Hook for an added path; does nothing here."""
        pass

    def removed(self, path):
        """Hook for a removed path; does nothing here."""
        pass

    def renamed(self, old_path, new_path):
        """Hook for a rename from old_path to new_path; does nothing here."""
        pass
76
77
78
class ReportCommitToLog(NullCommitReporter):
    """Commit reporter that passes each event to note()."""

    def added(self, path):
        """Log that path was added."""
        note('added %s', path)

    def removed(self, path):
        """Log that path was removed."""
        note('removed %s', path)

    def renamed(self, old_path, new_path):
        """Log that old_path was renamed to new_path."""
        note('renamed %s => %s', old_path, new_path)
87
88
89
class Commit(object):
    """Task of committing a new revision.

    This is a MethodObject: it accumulates state as the commit is
    prepared, and then it is discarded.  It doesn't represent
    historical revisions, just the act of recording a new one.

    commit() stores its arguments and intermediate results on the
    instance; the private helper methods read that state and are only
    meaningful when called from commit().
    """

    def __init__(self,
                 reporter=None):
        """Create a commit task.

        reporter
            Stored as self.reporter.  If None (default), a
            NullCommitReporter is created instead.  Nothing else in
            this class calls the reporter yet.
        """
        if reporter is not None:
            self.reporter = reporter
        else:
            self.reporter = NullCommitReporter()

    def commit(self,
               branch, message,
               timestamp=None,
               timezone=None,
               committer=None,
               specific_files=None,
               rev_id=None,
               allow_pointless=True):
        """Commit working copy as a new revision.

        The basic approach is to add all the file texts into the
        store, then the inventory, then make a new revision pointing
        to that inventory and store that.

        This is not quite safe if the working copy changes during the
        commit; for the moment that is simply not allowed.  A better
        approach is to make a temporary copy of the files before
        computing their hashes, and then add those hashes in turn to
        the inventory.  This should mean at least that there are no
        broken hash pointers.  There is no way we can get a snapshot
        of the whole directory at an instant.  This would also have to
        be robust against files disappearing, moving, etc.  So the
        whole thing is a bit hard.

        This raises PointlessCommit if there are no changes, no new
        merges, and allow_pointless is false.  It raises
        NotImplementedError if the branch has pending merges.

        The branch is write-locked for the duration of the call and
        is always unlocked again, whether or not the commit succeeds.

        message
            Commit message; must be a string.

        timestamp -- if not None, seconds-since-epoch for a
             postdated/predated commit.  If None, the current time is
             used.

        timezone
            Converted with int().  If None, local_time_offset() is
            used.

        committer
            Must be a string.  If None, username(branch) is used.

        specific_files
            If true, commit only those files.

        rev_id
            If set, use this as the new revision id.
            Useful for test or import commands that need to tightly
            control what revisions are assigned.  If you duplicate
            a revision id that exists elsewhere it is your own fault.
            If null (default), a time/random revision id is generated.
        """

        self.branch = branch
        self.branch.lock_write()
        try:
            # Everything after taking the lock runs inside this try,
            # so the lock is released even when argument checking
            # fails.
            self.rev_id = rev_id
            self.specific_files = specific_files
            self.allow_pointless = allow_pointless

            if timestamp is None:
                self.timestamp = time.time()
            else:
                self.timestamp = long(timestamp)

            if committer is None:
                self.committer = username(self.branch)
            else:
                assert isinstance(committer, basestring), type(committer)
                self.committer = committer

            if timezone is None:
                self.timezone = local_time_offset()
            else:
                self.timezone = int(timezone)

            assert isinstance(message, basestring), type(message)
            self.message = message

            # First walk over the working inventory; and both update that
            # and also build a new revision inventory.  The revision
            # inventory needs to hold the text-id, sha1 and size of the
            # actual file versions committed in the revision.  (These are
            # not present in the working inventory.)  We also need to
            # detect missing/deleted files, and remove them from the
            # working inventory.

            self.work_tree = self.branch.working_tree()
            self.work_inv = self.work_tree.inventory
            self.basis_tree = self.branch.basis_tree()
            self.basis_inv = self.basis_tree.inventory

            self.pending_merges = self.branch.pending_merges()
            if self.pending_merges:
                raise NotImplementedError("sorry, can't commit merges to the weave format yet")

            if self.rev_id is None:
                # The generated id uses the current time, not
                # self.timestamp.
                self.rev_id = _gen_revision_id(self.branch, time.time())

            # todo: update hashcache
            self.delta = compare_trees(self.basis_tree, self.work_tree,
                                       specific_files=self.specific_files)

            if not (self.delta.has_changed()
                    or self.allow_pointless
                    or self.pending_merges):
                raise PointlessCommit()

            # Start from the basis inventory; the helpers below remove
            # deleted entries and add/update the changed ones.
            self.new_inv = self.basis_inv.copy()

            # NOTE(review): this prints the delta straight to stdout
            # rather than going through self.reporter -- confirm that
            # is intended.
            self.delta.show(sys.stdout)

            self._remove_deleted()
            self._store_files()

            self.branch._write_inventory(self.work_inv)
            self._record_inventory()

            self._make_revision()
            note('committed r%d {%s}', (self.branch.revno() + 1),
                 self.rev_id)
            self.branch.append_revision(self.rev_id)
            self.branch.set_pending_merges([])
        finally:
            self.branch.unlock()

    def _record_inventory(self):
        """Serialize the new inventory, record its sha1 and store it.

        Sets self.inv_sha1 and adds the serialized inventory to the
        branch's inventory store under self.rev_id.
        """
        inv_tmp = StringIO()
        serializer_v5.write_inventory(self.new_inv, inv_tmp)
        self.inv_sha1 = sha_string(inv_tmp.getvalue())
        # Rewind so the store reads the text from the beginning.
        inv_tmp.seek(0)
        self.branch.inventory_store.add(inv_tmp, self.rev_id)

    def _make_revision(self):
        """Record a new revision object for this commit.

        The revision's parents are the branch's last revision (if
        there is one) followed by each pending merge.  The serialized
        revision is added to the branch's revision store under
        self.rev_id.
        """
        self.rev = Revision(timestamp=self.timestamp,
                            timezone=self.timezone,
                            committer=self.committer,
                            message=self.message,
                            inventory_sha1=self.inv_sha1,
                            revision_id=self.rev_id)

        self.rev.parents = []
        precursor_id = self.branch.last_patch()
        if precursor_id:
            self.rev.parents.append(RevisionReference(precursor_id))
        for merge_rev in self.pending_merges:
            self.rev.parents.append(RevisionReference(merge_rev))

        rev_tmp = tempfile.TemporaryFile()
        serializer_v5.write_revision(self.rev, rev_tmp)
        # Rewind so the store reads the text from the beginning.
        rev_tmp.seek(0)
        self.branch.revision_store.add(rev_tmp, self.rev_id)
        mutter('new revision_id is {%s}', self.rev_id)

    def _remove_deleted(self):
        """Remove deleted files from the working and stored inventories."""
        for path, file_id, kind in self.delta.removed:
            if self.work_inv.has_id(file_id):
                del self.work_inv[file_id]
            if self.new_inv.has_id(file_id):
                del self.new_inv[file_id]

    def _store_files(self):
        """Store new texts of modified/added files."""
        # We must make sure that directories are added before anything
        # inside them is added.  the files within the delta report are
        # sorted by path so we know the directory will come before its
        # contents.
        for path, file_id, kind in self.delta.added:
            if kind != 'file':
                # Non-file entries have no text; just copy the entry.
                ie = self.work_inv[file_id].copy()
                self.new_inv.add(ie)
            else:
                self._store_file_text(file_id)

        for path, file_id, kind in self.delta.modified:
            if kind != 'file':
                continue
            self._store_file_text(file_id)

        for old_path, new_path, file_id, kind, text_modified in self.delta.renamed:
            if kind != 'file':
                continue
            if not text_modified:
                continue
            self._store_file_text(file_id)

    def _store_file_text(self, file_id):
        """Store updated text for one modified or added file.

        Reads the file's lines from the working tree, adds them to the
        file's weave, and updates the entry in self.new_inv with the
        new sha1, size and version.  A file not yet in self.new_inv
        gets a copy of its working inventory entry added first.
        """
        note('store new text for {%s} in revision {%s}',
             file_id, self.rev_id)
        new_lines = self.work_tree.get_file(file_id).readlines()
        if file_id in self.new_inv:     # was in basis inventory
            ie = self.new_inv[file_id]
            assert ie.file_id == file_id
            assert file_id in self.basis_inv
            assert self.basis_inv[file_id].kind == 'file'
            old_version = self.basis_inv[file_id].text_version
            file_parents = [old_version]
        else:                           # new in this revision
            ie = self.work_inv[file_id].copy()
            self.new_inv.add(ie)
            assert file_id not in self.basis_inv
            file_parents = []
        assert ie.kind == 'file'
        self._add_text_to_weave(file_id, new_lines, file_parents)
        # make a new inventory entry for this file, using whatever
        # it had in the working copy, plus details on the new text
        ie.text_sha1 = _sha_strings(new_lines)
        ie.text_size = sum(map(len, new_lines))
        ie.text_version = self.rev_id
        ie.entry_version = self.rev_id

    def _add_text_to_weave(self, file_id, new_lines, parents):
        """Add new_lines to the weave for file_id as version self.rev_id.

        The weave file is read if it already exists, otherwise an
        empty Weave is started.  parents is a list of version names;
        each is looked up in the weave before the new text is added.
        The updated weave is written back through an AtomicFile.
        """
        weave_fn = self.branch.controlfilename(['weaves', file_id+'.weave'])
        if os.path.exists(weave_fn):
            weave_file = open(weave_fn, 'rb')
            try:
                w = read_weave(weave_file)
            finally:
                # Close explicitly instead of leaving it to the
                # garbage collector.
                weave_file.close()
        else:
            w = Weave()
        # XXX: Should set the appropriate parents by looking for this file_id
        # in all revision parents
        parent_idxs = [w.lookup(parent) for parent in parents]
        w.add(self.rev_id, parent_idxs, new_lines)
        af = AtomicFile(weave_fn)
        try:
            write_weave_v5(w, af)
            af.commit()
        finally:
            af.close()
334
335
336
def _gen_revision_id(branch, when):
    """Return new revision-id.

    The id is user_email(branch), compact_date(when) and the hex form
    of 8 bytes from rand_bytes(), joined as 'email-date-hex'.
    """
    prefix = '%s-%s-' % (user_email(branch), compact_date(when))
    return prefix + hexlify(rand_bytes(8))
633 by Martin Pool
- Show added/renamed/modified messages from commit for non-file
341
342
1194 by Martin Pool
- [BROKEN] more progress of commit into weaves
343
def _sha_strings(strings):
344
    """Return the sha-1 of concatenation of strings"""
345
    s = sha.new()
346
    map(s.update, strings)
347
    return s.hexdigest()