~bzr-pqm/bzr/bzr.dev

485 by Martin Pool
- move commit code into its own module
# Copyright (C) 2005 Canonical Ltd

# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation; either version 2 of the License, or
# (at your option) any later version.

# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License
# along with this program; if not, write to the Free Software
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA


517 by Martin Pool
- cleanup
19
def commit(branch, message,
           timestamp=None,
           timezone=None,
           committer=None,
           verbose=True,
           specific_files=None,
           rev_id=None):
    """Commit working copy as a new revision.

    The basic approach is to add all the file texts into the
    store, then the inventory, then make a new revision pointing
    to that inventory and store that.

    This is not quite safe if the working copy changes during the
    commit; for the moment that is simply not allowed.  A better
    approach is to make a temporary copy of the files before
    computing their hashes, and then add those hashes in turn to
    the inventory.  This should mean at least that there are no
    broken hash pointers.  There is no way we can get a snapshot
    of the whole directory at an instant.  This would also have to
    be robust against files disappearing, moving, etc.  So the
    whole thing is a bit hard.

    The branch is write-locked for the duration of the commit and
    always unlocked again, even if the commit fails part way.

    branch
        The branch to commit to.

    message
        Log message recorded in the new revision.

    timestamp
        If not None, seconds-since-epoch for a postdated/predated
        commit.  If None (default), the current time is used.  Note
        that a generated rev_id is always based on the current time,
        not on this value.

    timezone
        Timezone recorded in the revision.  If None (default), the
        result of local_time_offset() is used.

    committer
        Committer recorded in the revision.  If None (default), the
        result of username() is used.

    verbose
        If true, report progress through note() and list the
        added/modified/renamed/deleted entries.

    specific_files
        If true, commit only those files.

    rev_id
        If set, use this as the new revision id.
        Useful for test or import commands that need to tightly
        control what revisions are assigned.  If you duplicate
        a revision id that exists elsewhere it is your own fault.
        If null (default), a time/random revision id is generated.
    """
    import time

    from bzrlib.osutils import local_time_offset, username
    from bzrlib.revision import Revision, RevisionReference
    from bzrlib.trace import mutter, note

    branch.lock_write()

    try:
        # First walk over the working inventory; and both update that
        # and also build a new revision inventory.  The revision
        # inventory needs to hold the text-id, sha1 and size of the
        # actual file versions committed in the revision.  (These are
        # not present in the working inventory.)  We also need to
        # detect missing/deleted files, and remove them from the
        # working inventory.

        work_tree = branch.working_tree()
        work_inv = work_tree.inventory
        basis = branch.basis_tree()
        basis_inv = basis.inventory

        if verbose:
            note('looking for changes...')

        missing_ids, new_inv = _gather_commit(branch,
                                              work_tree,
                                              work_inv,
                                              basis_inv,
                                              specific_files,
                                              verbose)

        for file_id in missing_ids:
            # Any files that have been deleted are now removed from the
            # working inventory.  Files that were not selected for commit
            # are left as they were in the working inventory and omitted
            # from the revision inventory.

            # have to do this later so we don't mess up the iterator.
            # since parents may be removed before their children we
            # have to test.

            # FIXME: There's probably a better way to do this; perhaps
            # the workingtree should know how to filter itself.
            if work_inv.has_id(file_id):
                del work_inv[file_id]

        if rev_id is None:
            rev_id = _gen_revision_id(time.time())
        # The inventory is stored under the same id as the revision.
        inv_id = rev_id

        _add_xml_to_store(new_inv, branch.inventory_store, inv_id)
        mutter('new inventory_id is {%s}' % inv_id)

        # We could also just sha hash the temporary inventory file;
        # however, in the case that branch.inventory_store.add()
        # ever actually does anything special, ask the branch for the
        # hash of what was really stored.
        inv_sha1 = branch.get_inventory_sha1(inv_id)

        branch._write_inventory(work_inv)

        if timestamp is None:
            timestamp = time.time()

        if committer is None:
            committer = username()

        if timezone is None:
            timezone = local_time_offset()

        mutter("building commit log message")
        rev = Revision(timestamp=timestamp,
                       timezone=timezone,
                       committer=committer,
                       message=message,
                       inventory_id=inv_id,
                       inventory_sha1=inv_sha1,
                       revision_id=rev_id)

        # The very first commit on a branch has no precursor, in which
        # case the parent list is left as Revision() initialised it.
        precursor_id = branch.last_patch()
        if precursor_id:
            precursor_sha1 = branch.get_revision_sha1(precursor_id)
            rev.parents = [RevisionReference(precursor_id, precursor_sha1)]

        _add_xml_to_store(rev, branch.revision_store, rev_id)
        mutter("new revision_id is {%s}" % rev_id)

        ## XXX: Everything up to here can simply be orphaned if we abort
        ## the commit; it will leave junk files behind but that doesn't
        ## matter.

        ## TODO: Read back the just-generated changeset, and make sure it
        ## applies and recreates the right state.

        mutter("committing patch r%d" % (branch.revno() + 1))

        branch.append_revision(rev_id)

        if verbose:
            note("commited r%d" % branch.revno())
    finally:
        branch.unlock()


def _add_xml_to_store(obj, store, obj_id):
    """Serialise obj with write_xml() and add the result to store as obj_id.

    The XML is staged in a temporary file which is always closed
    afterwards, whether or not the store accepted it.

    NOTE(review): this assumes store.add() has finished reading the
    file by the time it returns -- confirm against the store code.
    """
    import tempfile

    tmp = tempfile.TemporaryFile()
    try:
        obj.write_xml(tmp)
        # rewind so the store reads from the start of what was written
        tmp.seek(0)
        store.add(tmp, obj_id)
    finally:
        tmp.close()
485 by Martin Pool
- move commit code into its own module
168
169
170
171
def _gen_revision_id(when):
    """Return new revision-id.

    The id has the form ``<user email>-<compact date>-<random hex>``,
    where the date part is compact_date(when) and the random part is
    the hex encoding of 8 bytes from rand_bytes().

    when
        Time value handed to compact_date(); commit() passes the
        current time.time().
    """
    from binascii import hexlify
    from bzrlib.osutils import rand_bytes, compact_date, user_email

    return '%s-%s-%s' % (user_email(),
                         compact_date(when),
                         hexlify(rand_bytes(8)))
179
180
632 by Martin Pool
- refactor commit code
181
def _gather_commit(branch, work_tree, work_inv, basis_inv, specific_files,
                   verbose):
    """Build inventory preparatory to commit.

    This adds any changed files into the text store, and sets their
    text-id, sha and size in the returned inventory appropriately.

    Every entry of work_inv is visited once:

    * entries excluded by specific_files are carried over unchanged
      from basis_inv if present there, and otherwise left out;
    * entries the working tree no longer has are recorded as missing;
    * everything else is copied into the new inventory, and for files
      the text is stored if its sha1 differs from the basis version.

    verbose
        If true, print a 'deleted'/'added'/'modified'/'renamed' line
        for each affected entry.

    Returns a pair (missing_ids, inv):

    missing_ids
        List of ids of files that have been deleted from the working
        directory; these should be removed from the working inventory
        by the caller.

    inv
        The new revision inventory.

    Raises BzrError if an entry changed kind since the basis revision,
    or if what is on disk does not match the entry's kind.
    """
    from bzrlib.inventory import Inventory
    from bzrlib.osutils import isdir, isfile, sha_string, quotefn, \
         kind_marker, is_inside_any
    from bzrlib.branch import gen_file_id
    from bzrlib.errors import BzrError
    from bzrlib.trace import mutter

    inv = Inventory()
    missing_ids = []

    for path, entry in work_inv.iter_entries():
        ## TODO: Check that the file kind has not changed from the previous
        ## revision of this file (if any).

        p = branch.abspath(path)
        file_id = entry.file_id
        mutter('commit prep file %s, id %r ' % (p, file_id))

        if specific_files and not is_inside_any(specific_files, path):
            # Not selected for this commit: carry over the previous
            # state if there was one, otherwise omit the entry from the
            # committed inventory altogether.
            if basis_inv.has_id(file_id):
                inv.add(basis_inv[file_id].copy())
            continue

        if not work_tree.has_id(file_id):
            if verbose:
                print('deleted %s%s' % (path, kind_marker(entry.kind)))
            mutter("    file is missing, removing from inventory")
            missing_ids.append(file_id)
            continue

        # this is present in the new inventory; may be new, modified or
        # unchanged.
        old_ie = None
        if basis_inv.has_id(file_id):
            old_ie = basis_inv[file_id]

        # work on a copy so the working inventory entry is not modified
        entry = entry.copy()
        inv.add(entry)

        if old_ie is not None:
            old_kind = old_ie.kind
            if old_kind != entry.kind:
                raise BzrError("entry %r changed kind from %r to %r"
                        % (file_id, old_kind, entry.kind))

        if entry.kind == 'directory':
            if not isdir(p):
                raise BzrError("%s is entered as directory but not a directory"
                               % quotefn(p))
        elif entry.kind == 'file':
            if not isfile(p):
                raise BzrError("%s is entered as file but is not a file" % quotefn(p))

            new_sha1 = work_tree.get_file_sha1(file_id)

            if old_ie is not None and old_ie.text_sha1 == new_sha1:
                ## assert content == basis.get_file(file_id).read()
                entry.text_id = old_ie.text_id
                entry.text_sha1 = new_sha1
                entry.text_size = old_ie.text_size
                mutter('    unchanged from previous text_id {%s}' %
                       entry.text_id)
            else:
                # read the whole text, closing the file promptly rather
                # than leaving it to the garbage collector
                f = open(p, 'rb')
                try:
                    content = f.read()
                finally:
                    f.close()

                # calculate the sha again, just in case the file contents
                # changed since we updated the cache
                entry.text_sha1 = sha_string(content)
                entry.text_size = len(content)

                entry.text_id = gen_file_id(entry.name)
                branch.text_store.add(content, entry.text_id)
                mutter('    stored with text_id {%s}' % entry.text_id)

        if verbose:
            marked = path + kind_marker(entry.kind)
            if old_ie is None:
                print('added %s' % marked)
            elif old_ie == entry:
                pass                    # unchanged
            elif (old_ie.name == entry.name
                  and old_ie.parent_id == entry.parent_id):
                print('modified %s' % marked)
            else:
                print('renamed %s' % marked)

    return missing_ids, inv
633 by Martin Pool
- Show added/renamed/modified messages from commit for non-file
285
286