~abentley/bzrtools/bzrtools.dev

« back to all changes in this revision

Viewing changes to upstream_import.py

  • Committer: Aaron Bentley
  • Date: 2006-03-24 19:01:30 UTC
  • Revision ID: abentley@panoramicfeedback.com-20060324190130-2208c693486a8b33
Added apache index scraping to the branches command

Show diffs side-by-side

added added

removed removed

Lines of Context:
1
 
"""Import upstream source into a branch"""
2
 
 
3
 
from bz2 import BZ2File
4
 
import errno
5
 
import os
6
 
from StringIO import StringIO
7
 
import stat
8
 
import tarfile
9
 
import zipfile
10
 
 
11
 
from bzrlib import generate_ids
12
 
from bzrlib.bzrdir import BzrDir
13
 
from bzrlib.errors import NoSuchFile, BzrCommandError, NotBranchError
14
 
from bzrlib.osutils import (pathjoin, isdir, file_iterator, basename,
15
 
                            file_kind)
16
 
from bzrlib.trace import warning
17
 
from bzrlib.transform import TreeTransform, resolve_conflicts, cook_conflicts
18
 
from bzrlib.workingtree import WorkingTree
19
 
 
20
 
class ZipFileWrapper(object):
    """Adapter exposing a zip archive through the tarfile-like calls used here.

    Provides getmembers(), extractfile(), add() and close() on top of a
    zipfile.ZipFile.
    """

    def __init__(self, fileobj, mode):
        """Open the zip archive held in fileobj with the given zipfile mode."""
        self.zipfile = zipfile.ZipFile(fileobj, mode)

    def getmembers(self):
        """Yield a ZipInfoWrapper for every entry in the archive."""
        archive = self.zipfile
        for entry in archive.infolist():
            yield ZipInfoWrapper(archive, entry)

    def extractfile(self, infowrapper):
        """Return a file-like object holding the full contents of a member."""
        contents = self.zipfile.read(infowrapper.name)
        return StringIO(contents)

    def add(self, filename):
        """Add a path to the archive.

        Directories are stored as an empty entry whose name ends in '/';
        anything else is written as a regular file.
        """
        if not isdir(filename):
            self.zipfile.write(filename)
            return
        self.zipfile.writestr(filename+'/', '')

    def close(self):
        """Close the underlying zip archive."""
        self.zipfile.close()
40
 
 
41
 
 
42
 
class ZipInfoWrapper(object):
    """Give a zip entry the member attributes and methods import_archive uses.

    Exposes name, type, mode, isdir() and isreg().
    """

    def __init__(self, zipfile, info):
        """Wrap the entry ``info`` belonging to the archive ``zipfile``."""
        self.zipfile = zipfile
        self.info = info
        self.name = info.filename
        # Never "g", so entries are not skipped as tar global headers.
        self.type = None
        # rw-rw-rw- (octal 666): no execute bits are ever reported.
        self.mode = (stat.S_IRUSR | stat.S_IWUSR |
                     stat.S_IRGRP | stat.S_IWGRP |
                     stat.S_IROTH | stat.S_IWOTH)

    def isdir(self):
        """Return True if the entry name ends with '/'."""
        # Really? Eeeew!
        return self.name[-1:] == '/'

    def isreg(self):
        """Return True for every entry that is not a directory."""
        # Really? Eeeew!
        if self.isdir():
            return False
        return True
58
 
 
59
 
 
60
 
class DirWrapper(object):
    """Present a directory tree through the archive calls import_archive uses.

    Members are FileInfo objects whose names are relative to the parent of
    the wrapped directory.
    """

    def __init__(self, fileobj, mode='r'):
        """Wrap the directory whose path is the content of fileobj.

        :param fileobj: file-like object; read() must return the directory
            path.
        :param mode: must be 'r'; only reading is supported.
        """
        assert mode == 'r', mode
        self.root = os.path.realpath(fileobj.read())

    def __repr__(self):
        return 'DirWrapper(%r)' % self.root

    def getmembers(self, subdir=None):
        """Yield a FileInfo for each entry below the root, depth first.

        :param subdir: path relative to the root to list; None lists the
            root itself.  Each directory is yielded before its children.
        """
        if subdir is not None:
            mydir = pathjoin(self.root, subdir)
        else:
            mydir = self.root
        for child in os.listdir(mydir):
            if subdir is not None:
                child = pathjoin(subdir, child)
            fi = FileInfo(self.root, child)
            yield fi
            if fi.isdir():
                for v in self.getmembers(child):
                    yield v

    def extractfile(self, member):
        """Return an open file for reading the member's contents.

        The file is opened in binary mode so that contents are read verbatim
        on every platform, matching how tar and zip inputs are opened.
        """
        return open(member.fullpath, 'rb')
84
 
 
85
 
 
86
 
class FileInfo(object):
    """Describe one filesystem entry with the member interface import_archive uses.

    Attributes:
      fullpath -- root joined with filepath
      root     -- the directory being imported
      name     -- basename of root joined with filepath; directories get a
                  trailing '/'
      type     -- always None (never the "g" header type)
      mode     -- st_mode from lstat(), so symlinks are not followed
      linkname -- symlink target, or '' if the entry is not a symlink
    """

    def __init__(self, root, filepath):
        """Stat the entry at ``filepath`` below ``root``.

        :param root: path of the directory being imported.
        :param filepath: path relative to root; '' describes root itself.
        """
        self.fullpath = pathjoin(root, filepath)
        self.root = root
        if filepath != '':
            self.name = pathjoin(basename(root), filepath)
        else:
            self.name = basename(root)
        self.type = None
        # Named st, not stat, so the stat module is not shadowed here.
        st = os.lstat(self.fullpath)
        self.mode = st.st_mode
        # import_archive reads member.linkname for symlinks.
        if self.issym():
            self.linkname = os.readlink(self.fullpath)
        else:
            self.linkname = ''
        if self.isdir():
            self.name += '/'

    def __repr__(self):
        return 'FileInfo(%r)' % self.name

    def isreg(self):
        """Return True if the entry is a regular file."""
        return stat.S_ISREG(self.mode)

    def isdir(self):
        """Return True if the entry is a directory."""
        return stat.S_ISDIR(self.mode)

    def issym(self):
        """Return True if the entry is a symbolic link."""
        return stat.S_ISLNK(self.mode)
110
 
 
111
 
        
112
 
def top_directory(path):
    """Return the top directory given in a path.

    The result is '' when the path has no directory part, and the
    filesystem root when the path is absolute.
    """
    current = os.path.dirname(path)
    parent = os.path.dirname(current)
    # Climb until there is nothing left to strip or dirname stops changing.
    while parent != '' and parent != current:
        current = parent
        parent = os.path.dirname(current)
    return current
121
 
 
122
 
 
123
 
def common_directory(names):
    """Determine a single directory prefix from a list of names

    Returns the top directory shared by every name, or None if any name has
    no top directory, the names disagree, or there are no names.
    """
    shared = None
    for candidate in (top_directory(name) for name in names):
        if candidate == '':
            return None
        if shared is not None and candidate != shared:
            return None
        shared = candidate
    return shared
136
 
 
137
 
 
138
 
def do_directory(tt, trans_id, tree, relative_path, path):
    """Make trans_id a directory in the transform.

    If ``path`` is already a directory on disk and ``relative_path`` is
    versioned in ``tree``, its pending deletion is cancelled; otherwise a
    new directory is created.
    """
    keep_existing = isdir(path) and tree.path2id(relative_path) is not None
    if not keep_existing:
        tt.create_directory(trans_id)
        return
    tt.cancel_deletion(trans_id)
143
 
 
144
 
 
145
 
def add_implied_parents(implied_parents, path):
    """Update the set of implied parents from a path

    Every ancestor directory of ``path`` is added to ``implied_parents``,
    stopping at the first ancestor that is already present.
    """
    ancestor = os.path.dirname(path)
    while ancestor not in implied_parents:
        implied_parents.add(ancestor)
        ancestor = os.path.dirname(ancestor)
152
 
 
153
 
 
154
 
def names_of_files(tar_file):
    """Yield the name of every archive member except type "g" headers."""
    for entry in tar_file.getmembers():
        if entry.type == "g":
            continue
        yield entry.name
158
 
 
159
 
 
160
 
def import_tar(tree, tar_input):
    """Replace the contents of a working directory with tarfile contents.

    The tarfile may be a gzipped stream.  File ids will be updated.

    :param tree: the working tree to overwrite.
    :param tar_input: file-like object holding the tarball data.  It is not
        closed here; that is left to the caller.
    """
    # The name is only a placeholder; the data is read from tar_input.
    tar_file = tarfile.open('lala', 'r', tar_input)
    try:
        import_archive(tree, tar_file)
    finally:
        # Release the TarFile even if the import fails.
        tar_file.close()
166
 
 
167
 
def import_zip(tree, zip_input):
    """Replace the contents of a working directory with zip file contents.

    :param tree: the working tree to overwrite.
    :param zip_input: file-like object holding the zip archive data.
    """
    zip_file = ZipFileWrapper(zip_input, 'r')
    try:
        import_archive(tree, zip_file)
    finally:
        # Release the archive even if the import fails.
        zip_file.close()
170
 
 
171
 
def import_dir(tree, dir_input):
    """Replace the contents of a working directory with a directory's contents.

    ``dir_input`` is a file-like object whose content is the path of the
    source directory; it is handed to DirWrapper.
    """
    import_archive(tree, DirWrapper(dir_input))
174
 
 
175
 
def import_archive(tree, archive_file):
176
 
    prefix = common_directory(names_of_files(archive_file))
177
 
    tt = TreeTransform(tree)
178
 
 
179
 
    removed = set()
180
 
    for path, entry in tree.inventory.iter_entries():
181
 
        if entry.parent_id is None:
182
 
            continue
183
 
        trans_id = tt.trans_id_tree_path(path)
184
 
        tt.delete_contents(trans_id)
185
 
        removed.add(path)
186
 
 
187
 
    added = set() 
188
 
    implied_parents = set()
189
 
    seen = set()
190
 
    for member in archive_file.getmembers():
191
 
        if member.type == 'g':
192
 
            # type 'g' is a header
193
 
            continue
194
 
        relative_path = member.name 
195
 
        if prefix is not None:
196
 
            relative_path = relative_path[len(prefix)+1:]
197
 
        if relative_path == '':
198
 
            continue
199
 
        add_implied_parents(implied_parents, relative_path)
200
 
        trans_id = tt.trans_id_tree_path(relative_path)
201
 
        added.add(relative_path.rstrip('/'))
202
 
        path = tree.abspath(relative_path)
203
 
        if member.name in seen:
204
 
            if tt.final_kind(trans_id) == 'file':
205
 
                tt.set_executability(None, trans_id)
206
 
            tt.cancel_creation(trans_id)
207
 
        seen.add(member.name)
208
 
        if member.isreg():
209
 
            tt.create_file(file_iterator(archive_file.extractfile(member)), 
210
 
                           trans_id)
211
 
            executable = (member.mode & 0111) != 0
212
 
            tt.set_executability(executable, trans_id)
213
 
        elif member.isdir():
214
 
            do_directory(tt, trans_id, tree, relative_path, path)
215
 
        elif member.issym():
216
 
            tt.create_symlink(member.linkname, trans_id)
217
 
        else:
218
 
            continue
219
 
        if tt.tree_file_id(trans_id) is None:
220
 
            name = basename(member.name.rstrip('/'))
221
 
            file_id = generate_ids.gen_file_id(name)
222
 
            tt.version_file(file_id, trans_id)
223
 
 
224
 
    for relative_path in implied_parents.difference(added):
225
 
        if relative_path == "":
226
 
            continue
227
 
        trans_id = tt.trans_id_tree_path(relative_path)
228
 
        path = tree.abspath(relative_path)
229
 
        do_directory(tt, trans_id, tree, relative_path, path)
230
 
        if tt.tree_file_id(trans_id) is None:
231
 
            tt.version_file(trans_id, trans_id)
232
 
        added.add(relative_path)
233
 
 
234
 
    for path in removed.difference(added):
235
 
        tt.unversion_file(tt.trans_id_tree_path(path))
236
 
 
237
 
    for conflict in cook_conflicts(resolve_conflicts(tt), tt):
238
 
        warning(conflict)
239
 
    tt.apply()
240
 
 
241
 
 
242
 
def do_import(source, tree_directory=None):
243
 
    """Implementation of import command.  Intended for UI only"""
244
 
    if tree_directory is not None:
245
 
        try:
246
 
            tree = WorkingTree.open(tree_directory)
247
 
        except NotBranchError:
248
 
            if not os.path.exists(tree_directory):
249
 
                os.mkdir(tree_directory)
250
 
            branch = BzrDir.create_branch_convenience(tree_directory)
251
 
            tree = branch.bzrdir.open_workingtree()
252
 
    else:
253
 
        tree = WorkingTree.open_containing('.')[0]
254
 
    tree.lock_write()
255
 
    try:
256
 
        if tree.changes_from(tree.basis_tree()).has_changed():
257
 
            raise BzrCommandError("Working tree has uncommitted changes.")
258
 
 
259
 
        if (source.endswith('.tar') or source.endswith('.tar.gz') or 
260
 
            source.endswith('.tar.bz2')) or source.endswith('.tgz'):
261
 
            try:
262
 
                if source.endswith('.bz2'):
263
 
                    tar_input = BZ2File(source, 'r')
264
 
                    tar_input = StringIO(tar_input.read())
265
 
                else:
266
 
                    tar_input = file(source, 'rb')
267
 
            except IOError, e:
268
 
                if e.errno == errno.ENOENT:
269
 
                    raise NoSuchFile(source)
270
 
            try:
271
 
                import_tar(tree, tar_input)
272
 
            finally:
273
 
                tar_input.close()
274
 
        elif source.endswith('.zip'):
275
 
            import_zip(tree, open(source, 'rb'))
276
 
        elif file_kind(source) == 'directory':
277
 
            s = StringIO(source)
278
 
            s.seek(0)
279
 
            import_dir(tree, s)
280
 
        else:
281
 
            raise BzrCommandError('Unhandled import source')
282
 
    finally:
283
 
        tree.unlock()