~bzr-pqm/bzr/bzr.dev : contents of bzrlib/workingtree.py at revision 1105

~bzr-pqm/bzr/bzr.dev : (revision 1105)

# Copyright (C) 2005 Canonical Ltd

# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation; either version 2 of the License, or
# (at your option) any later version.

# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License
# along with this program; if not, write to the Free Software
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA

# TODO: Don't allow WorkingTrees to be constructed for remote branches.

# FIXME: I don't know if writing out the cache from the destructor is really a
# good idea, because destructors are considered poor taste in Python, and
# it's not predictable when it will be written out.

import os
    
import bzrlib.tree
from errors import BzrCheckError
from trace import mutter

class WorkingTree(bzrlib.tree.Tree):
    """Working copy tree.

    The inventory is held in the `Branch` working-inventory, and the
    files are in a directory on disk.

    It is possible for a `WorkingTree` to have a filename which is
    not listed in the Inventory and vice versa.
    """
    def __init__(self, basedir, inv):
        """Create a working tree rooted at basedir and described by inv.

        basedir -- directory on disk that holds the working files.
        inv -- inventory object for the tree; its path2id method is
            re-exported directly as self.path2id.

        The hash cache for basedir is read and rescanned here, and is
        written back straight away if the scan left it dirty.
        """
        from bzrlib.hashcache import HashCache
        from bzrlib.trace import mutter

        self._inventory = inv
        self.basedir = basedir
        self.path2id = inv.path2id

        # update the whole cache up front and write to disk if anything changed;
        # in the future we might want to do this more selectively
        hc = self._hashcache = HashCache(basedir)
        hc.read()
        hc.scan()

        if hc.needs_write:
            mutter("write hc")
            hc.write()


    def __del__(self):
        """Write the hash cache out if it has pending changes."""
        # __init__ may have raised before the cache was attached; in that
        # case there is nothing to flush and we must not raise from here.
        hc = getattr(self, '_hashcache', None)
        if hc is not None and hc.needs_write:
            hc.write()


    def __iter__(self):
        """Iterate through file_ids for this tree.

        file_ids are in a WorkingTree if they are in the working inventory
        and the working file exists.
        """
        inv = self._inventory
        for path, ie in inv.iter_entries():
            if os.path.exists(self.abspath(path)):
                yield ie.file_id


    def __repr__(self):
        # getattr: stay usable even if __init__ never got as far as
        # setting basedir.
        return "<%s of %s>" % (self.__class__.__name__,
                               getattr(self, 'basedir', None))



    def abspath(self, filename):
        """Return filename joined onto this tree's base directory."""
        return os.path.join(self.basedir, filename)

    def has_filename(self, filename):
        """Return true if filename (relative to the tree) exists on disk."""
        return os.path.exists(self.abspath(filename))

    def get_file(self, file_id):
        """Return the working file for file_id, opened for binary reading."""
        # id2path is not defined in this class; presumably it is inherited
        # from bzrlib.tree.Tree.
        return self.get_file_byname(self.id2path(file_id))

    def get_file_byname(self, filename):
        """Open filename (relative to the tree) for binary reading.

        The caller is responsible for closing the returned file object.
        """
        # open() rather than the file() builtin: same result, but the
        # documented way to open files.
        return open(self.abspath(filename), 'rb')

    def _get_store_filename(self, file_id):
        """Return the absolute on-disk path of the working file for file_id."""
        ## XXX: badly named; this isn't in the store at all
        return self.abspath(self.id2path(file_id))


    def has_id(self, file_id):
        """Return true if file_id is in the inventory and exists on disk."""
        # files that have been deleted are excluded
        inv = self._inventory
        if not inv.has_id(file_id):
            return False
        path = inv.id2path(file_id)
        return os.path.exists(self.abspath(path))


    __contains__ = has_id


    def get_file_size(self, file_id):
        """Not implemented for working trees; always raises NotImplementedError."""
        # is this still called?
        raise NotImplementedError()


    def get_file_sha1(self, file_id):
        """Return what the hash cache's get_sha1 reports for file_id's path."""
        path = self._inventory.id2path(file_id)
        return self._hashcache.get_sha1(path)


    def file_class(self, filename):
        """Classify filename as a one-character code.

        Returns 'V' if path2id gives a true value for it (versioned), 'I'
        if it matches an ignore pattern, and '?' otherwise.
        """
        if self.path2id(filename):
            return 'V'
        elif self.is_ignored(filename):
            return 'I'
        else:
            return '?'


    def list_files(self):
        """Recursively list all files as (path, class, kind, id).

        Lists, but does not descend into unversioned directories.

        This does not include files that have been deleted in this
        tree.

        Skips the control directory.

        class is 'V', 'I' or '?' as for file_class; id is the inventory
        file_id for versioned entries and a false value otherwise.

        Raises BzrCheckError if a versioned entry's kind on disk differs
        from the kind recorded in the inventory.
        """
        from osutils import appendpath, file_kind

        inv = self._inventory

        def descend(from_dir_relpath, from_dir_id, dp):
            # from_dir_relpath: directory path within the tree
            # from_dir_id: inventory id of that directory
            # dp: path of that directory on disk
            ls = os.listdir(dp)
            ls.sort()
            for f in ls:
                ## TODO: If we find a subdirectory with its own .bzr
                ## directory, then that is a separate tree and we
                ## should exclude it.
                if bzrlib.BZRDIR == f:
                    continue

                # path within tree
                fp = appendpath(from_dir_relpath, f)

                # absolute path
                fap = appendpath(dp, f)

                f_ie = inv.get_child(from_dir_id, f)
                if f_ie:
                    c = 'V'
                elif self.is_ignored(fp):
                    c = 'I'
                else:
                    c = '?'

                fk = file_kind(fap)

                if f_ie:
                    if f_ie.kind != fk:
                        raise BzrCheckError("file %r entered as kind %r id %r, "
                                            "now of kind %r"
                                            % (fap, f_ie.kind, f_ie.file_id, fk))

                yield fp, c, fk, (f_ie and f_ie.file_id)

                if fk != 'directory':
                    continue

                if c != 'V':
                    # don't descend unversioned directories
                    continue

                for ff in descend(fp, f_ie.file_id, fap):
                    yield ff

        for f in descend('', inv.root.file_id, self.basedir):
            yield f



    def unknowns(self):
        """Yield the paths from extras() that match no ignore pattern."""
        for subp in self.extras():
            if not self.is_ignored(subp):
                yield subp


    def extras(self):
        """Yield all files on disk that are not in the inventory.

        Ignored files are included here; unknowns() and ignored_files()
        split the result by ignore status.

        If there are any unknown directories then only the directory is
        returned, not all its children.  But if there are unknown files
        under a versioned subdirectory, they are returned.

        Currently returned depth-first, sorted by name within directories.
        """
        ## TODO: Work from given directory downwards
        from osutils import isdir, appendpath

        # Use the same inventory attribute and control-directory constant
        # as the rest of the class.
        for path, dir_entry in self._inventory.directories():
            mutter("search for unknowns in %r" % path)
            dirabs = self.abspath(path)
            if not isdir(dirabs):
                # e.g. directory deleted
                continue

            fl = []
            for subf in os.listdir(dirabs):
                if (subf != bzrlib.BZRDIR
                    and (subf not in dir_entry.children)):
                    fl.append(subf)

            fl.sort()
            for subf in fl:
                subp = appendpath(path, subf)
                yield subp


    def ignored_files(self):
        """Yield (PATH, IGNORE_PATTERN) for each extras() path that is ignored."""
        for subp in self.extras():
            pat = self.is_ignored(subp)
            if pat is not None:
                yield subp, pat


    def get_ignore_list(self):
        """Return list of ignore patterns.

        The list is a copy of bzrlib.DEFAULT_IGNORE followed by one
        pattern per line of the tree's ignore file, if that file exists.

        Cached in the Tree object after the first call.
        """
        if hasattr(self, '_ignorelist'):
            return self._ignorelist

        patterns = bzrlib.DEFAULT_IGNORE[:]
        if self.has_filename(bzrlib.IGNORE_FILENAME):
            f = self.get_file_byname(bzrlib.IGNORE_FILENAME)
            # Close the handle explicitly rather than leaving it to the
            # garbage collector.
            try:
                patterns.extend([line.rstrip("\n\r") for line in f.readlines()])
            finally:
                f.close()
        self._ignorelist = patterns
        return patterns


    def is_ignored(self, filename):
        r"""Check whether the filename matches an ignore pattern.

        Patterns containing '/' or '\' need to match the whole path;
        others match against only the last component.

        If the file is ignored, returns the pattern which caused it to
        be ignored, otherwise None.  So this can simply be used as a
        boolean if desired."""

        # TODO: Use '**' to match directories, and other extended
        # globbing stuff from cvs/rsync.

        # XXX: fnmatch is actually not quite what we want: it's only
        # approximately the same as real Unix fnmatch, and doesn't
        # treat dotfiles correctly and allows * to match /.
        # Eventually it should be replaced with something more
        # accurate.

        import fnmatch
        from osutils import splitpath

        # Last path component, split out lazily the first time a
        # component-only pattern is met and then reused.
        basename = None

        for pat in self.get_ignore_list():
            if '/' in pat or '\\' in pat:

                # as a special case, you can put ./ at the start of a
                # pattern; this is good to match in the top-level
                # only;

                if (pat[:2] == './') or (pat[:2] == '.\\'):
                    newpat = pat[2:]
                else:
                    newpat = pat
                if fnmatch.fnmatchcase(filename, newpat):
                    return pat
            else:
                if basename is None:
                    basename = splitpath(filename)[-1]
                if fnmatch.fnmatchcase(basename, pat):
                    return pat

        # No pattern matched.
        return None
        

453 by Martin Pool - Split WorkingTree into its own file	1	# Copyright (C) 2005 Canonical Ltd
	2
	3	# This program is free software; you can redistribute it and/or modify
	4	# it under the terms of the GNU General Public License as published by
	5	# the Free Software Foundation; either version 2 of the License, or
	6	# (at your option) any later version.
	7
	8	# This program is distributed in the hope that it will be useful,
	9	# but WITHOUT ANY WARRANTY; without even the implied warranty of
	10	# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
	11	# GNU General Public License for more details.
	12
	13	# You should have received a copy of the GNU General Public License
	14	# along with this program; if not, write to the Free Software
	15	# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
	16
866 by Martin Pool - use new path-based hashcache for WorkingTree- squash mtime/ctime to whole seconds- update and if necessary write out hashcache when WorkingTree object is created.	17	# TODO: Don't allow WorkingTrees to be constructed for remote branches.
453 by Martin Pool - Split WorkingTree into its own file	18
956 by Martin Pool doc	19	# FIXME: I don't know if writing out the cache from the destructor is really a
	20	# good idea, because destructors are considered poor taste in Python, and
	21	# it's not predictable when it will be written out.
	22
453 by Martin Pool - Split WorkingTree into its own file	23	import os
	24
	25	import bzrlib.tree
	26	from errors import BzrCheckError
	27	from trace import mutter
	28
	29	class WorkingTree(bzrlib.tree.Tree):
	30	"""Working copy tree.
	31
	32	The inventory is held in the `Branch` working-inventory, and the
	33	files are in a directory on disk.
	34
	35	It is possible for a `WorkingTree` to have a filename which is
	36	not listed in the Inventory and vice versa.
	37	"""
	38	def __init__(self, basedir, inv):
866 by Martin Pool - use new path-based hashcache for WorkingTree- squash mtime/ctime to whole seconds- update and if necessary write out hashcache when WorkingTree object is created.	39	from bzrlib.hashcache import HashCache
	40	from bzrlib.trace import note, mutter
	41
453 by Martin Pool - Split WorkingTree into its own file	42	self._inventory = inv
	43	self.basedir = basedir
	44	self.path2id = inv.path2id
866 by Martin Pool - use new path-based hashcache for WorkingTree- squash mtime/ctime to whole seconds- update and if necessary write out hashcache when WorkingTree object is created.	45
	46	# update the whole cache up front and write to disk if anything changed;
	47	# in the future we might want to do this more selectively
	48	hc = self._hashcache = HashCache(basedir)
	49	hc.read()
954 by Martin Pool - separate out code that just scans the hash cache to find files that are possibly	50	hc.scan()
866 by Martin Pool - use new path-based hashcache for WorkingTree- squash mtime/ctime to whole seconds- update and if necessary write out hashcache when WorkingTree object is created.	51
	52	if hc.needs_write:
	53	mutter("write hc")
	54	hc.write()
954 by Martin Pool - separate out code that just scans the hash cache to find files that are possibly	55
	56
	57	def __del__(self):
	58	if self._hashcache.needs_write:
	59	self._hashcache.write()
866 by Martin Pool - use new path-based hashcache for WorkingTree- squash mtime/ctime to whole seconds- update and if necessary write out hashcache when WorkingTree object is created.	60
453 by Martin Pool - Split WorkingTree into its own file	61
462 by Martin Pool - New form 'file_id in tree' to check if the file is present	62	def __iter__(self):
	63	"""Iterate through file_ids for this tree.
	64
	65	file_ids are in a WorkingTree if they are in the working inventory
	66	and the working file exists.
	67	"""
	68	inv = self._inventory
866 by Martin Pool - use new path-based hashcache for WorkingTree- squash mtime/ctime to whole seconds- update and if necessary write out hashcache when WorkingTree object is created.	69	for path, ie in inv.iter_entries():
	70	if os.path.exists(self.abspath(path)):
	71	yield ie.file_id
462 by Martin Pool - New form 'file_id in tree' to check if the file is present	72
	73
453 by Martin Pool - Split WorkingTree into its own file	74	def __repr__(self):
453 by Martin Pool - Split WorkingTree into its own file	75	return "<%s of %s>" % (self.__class__.__name__,
954 by Martin Pool - separate out code that just scans the hash cache to find files that are possibly	76	getattr(self, 'basedir', None))
453 by Martin Pool - Split WorkingTree into its own file	77
866 by Martin Pool - use new path-based hashcache for WorkingTree- squash mtime/ctime to whole seconds- update and if necessary write out hashcache when WorkingTree object is created.	78
	79
453 by Martin Pool - Split WorkingTree into its own file	80	def abspath(self, filename):
	81	return os.path.join(self.basedir, filename)
	82
	83	def has_filename(self, filename):
	84	return os.path.exists(self.abspath(filename))
	85
	86	def get_file(self, file_id):
	87	return self.get_file_byname(self.id2path(file_id))
	88
	89	def get_file_byname(self, filename):
	90	return file(self.abspath(filename), 'rb')
	91
	92	def _get_store_filename(self, file_id):
	93	## XXX: badly named; this isn't in the store at all
	94	return self.abspath(self.id2path(file_id))
	95
462 by Martin Pool - New form 'file_id in tree' to check if the file is present	96
453 by Martin Pool - Split WorkingTree into its own file	97	def has_id(self, file_id):
453 by Martin Pool - Split WorkingTree into its own file	98	# files that have been deleted are excluded
866 by Martin Pool - use new path-based hashcache for WorkingTree- squash mtime/ctime to whole seconds- update and if necessary write out hashcache when WorkingTree object is created.	99	inv = self._inventory
	100	if not inv.has_id(file_id):
453 by Martin Pool - Split WorkingTree into its own file	101	return False
866 by Martin Pool - use new path-based hashcache for WorkingTree- squash mtime/ctime to whole seconds- update and if necessary write out hashcache when WorkingTree object is created.	102	path = inv.id2path(file_id)
	103	return os.path.exists(self.abspath(path))
462 by Martin Pool - New form 'file_id in tree' to check if the file is present	104
	105
	106	__contains__ = has_id
	107
	108
453 by Martin Pool - Split WorkingTree into its own file	109	def get_file_size(self, file_id):
866 by Martin Pool - use new path-based hashcache for WorkingTree- squash mtime/ctime to whole seconds- update and if necessary write out hashcache when WorkingTree object is created.	110	# is this still called?
	111	raise NotImplementedError()
453 by Martin Pool - Split WorkingTree into its own file	112
	113
	114	def get_file_sha1(self, file_id):
866 by Martin Pool - use new path-based hashcache for WorkingTree- squash mtime/ctime to whole seconds- update and if necessary write out hashcache when WorkingTree object is created.	115	path = self._inventory.id2path(file_id)
	116	return self._hashcache.get_sha1(path)
453 by Martin Pool - Split WorkingTree into its own file	117
	118
	119	def file_class(self, filename):
	120	if self.path2id(filename):
	121	return 'V'
	122	elif self.is_ignored(filename):
	123	return 'I'
	124	else:
	125	return '?'
	126
	127
	128	def list_files(self):
	129	"""Recursively list all files as (path, class, kind, id).
	130
	131	Lists, but does not descend into unversioned directories.
	132
	133	This does not include files that have been deleted in this
	134	tree.
	135
	136	Skips the control directory.
	137	"""
	138	from osutils import appendpath, file_kind
	139	import os
	140
866 by Martin Pool - use new path-based hashcache for WorkingTree- squash mtime/ctime to whole seconds- update and if necessary write out hashcache when WorkingTree object is created.	141	inv = self._inventory
453 by Martin Pool - Split WorkingTree into its own file	142
	143	def descend(from_dir_relpath, from_dir_id, dp):
	144	ls = os.listdir(dp)
	145	ls.sort()
	146	for f in ls:
	147	## TODO: If we find a subdirectory with its own .bzr
	148	## directory, then that is a separate tree and we
	149	## should exclude it.
	150	if bzrlib.BZRDIR == f:
	151	continue
	152
	153	# path within tree
	154	fp = appendpath(from_dir_relpath, f)
	155
	156	# absolute path
	157	fap = appendpath(dp, f)
	158
	159	f_ie = inv.get_child(from_dir_id, f)
	160	if f_ie:
	161	c = 'V'
	162	elif self.is_ignored(fp):
	163	c = 'I'
	164	else:
	165	c = '?'
	166
	167	fk = file_kind(fap)
	168
	169	if f_ie:
	170	if f_ie.kind != fk:
	171	raise BzrCheckError("file %r entered as kind %r id %r, "
	172	"now of kind %r"
	173	% (fap, f_ie.kind, f_ie.file_id, fk))
	174
	175	yield fp, c, fk, (f_ie and f_ie.file_id)
	176
	177	if fk != 'directory':
	178	continue
	179
	180	if c != 'V':
	181	# don't descend unversioned directories
	182	continue
	183
	184	for ff in descend(fp, f_ie.file_id, fap):
	185	yield ff
	186
	187	for f in descend('', inv.root.file_id, self.basedir):
	188	yield f
	189
	190
	191
	192	def unknowns(self):
	193	for subp in self.extras():
	194	if not self.is_ignored(subp):
	195	yield subp
	196
	197
	198	def extras(self):
	199	"""Yield all unknown files in this WorkingTree.
	200
	201	If there are any unknown directories then only the directory is
	202	returned, not all its children. But if there are unknown files
	203	under a versioned subdirectory, they are returned.
	204
	205	Currently returned depth-first, sorted by name within directories.
206	"""
207	## TODO: Work from given directory downwards
208	from osutils import isdir, appendpath
209
210	for path, dir_entry in self.inventory.directories():
211	mutter("search for unknowns in %r" % path)
212	dirabs = self.abspath(path)
213	if not isdir(dirabs):
214	# e.g. directory deleted
215	continue
216
217	fl = []
218	for subf in os.listdir(dirabs):
219	if (subf != '.bzr'
220	and (subf not in dir_entry.children)):
221	fl.append(subf)
222
223	fl.sort()
224	for subf in fl:
225	subp = appendpath(path, subf)
226	yield subp
227
228
229	def ignored_files(self):
230	"""Yield list of PATH, IGNORE_PATTERN"""
231	for subp in self.extras():
232	pat = self.is_ignored(subp)
233	if pat != None:
234	yield subp, pat
235
236
237	def get_ignore_list(self):
238	"""Return list of ignore patterns.
239
240	Cached in the Tree object after the first call.
241	"""
242	if hasattr(self, '_ignorelist'):
243	return self._ignorelist
244
245	l = bzrlib.DEFAULT_IGNORE[:]
246	if self.has_filename(bzrlib.IGNORE_FILENAME):
247	f = self.get_file_byname(bzrlib.IGNORE_FILENAME)
248	l.extend([line.rstrip("\n\r") for line in f.readlines()])
249	self._ignorelist = l
250	return l
251
252
253	def is_ignored(self, filename):
254	r"""Check whether the filename matches an ignore pattern.
255
256	Patterns containing '/' or '\' need to match the whole path;
257	others match against only the last component.
258
259	If the file is ignored, returns the pattern which caused it to
260	be ignored, otherwise None. So this can simply be used as a
261	boolean if desired."""
262
263	# TODO: Use '**' to match directories, and other extended
264	# globbing stuff from cvs/rsync.
265
266	# XXX: fnmatch is actually not quite what we want: it's only
267	# approximately the same as real Unix fnmatch, and doesn't
268	# treat dotfiles correctly and allows * to match /.
269	# Eventually it should be replaced with something more
270	# accurate.
271
272	import fnmatch
273	from osutils import splitpath
274
275	for pat in self.get_ignore_list():
276	if '/' in pat or '\\' in pat:
277
278	# as a special case, you can put ./ at the start of a
279	# pattern; this is good to match in the top-level
280	# only;
281
282	if (pat[:2] == './') or (pat[:2] == '.\\'):
283	newpat = pat[2:]
284	else:
285	newpat = pat
286	if fnmatch.fnmatchcase(filename, newpat):
287	return pat
288	else:
289	if fnmatch.fnmatchcase(splitpath(filename)[-1], pat):
290	return pat
291	else:
292	return None
956 by Martin Pool doc	293