5024.1.1
by John Arbash Meinel
Fix bug #303275, return a kind marker for sockets and fifos. |
1 |
# Copyright (C) 2005-2010 Canonical Ltd
|
1185.1.41
by Robert Collins
massive patch from Alexander Belchenko - many PEP8 fixes, removes unused function uuid |
2 |
#
|
1
by mbp at sourcefrog
import from baz patch-364 |
3 |
# This program is free software; you can redistribute it and/or modify
|
4 |
# it under the terms of the GNU General Public License as published by
|
|
5 |
# the Free Software Foundation; either version 2 of the License, or
|
|
6 |
# (at your option) any later version.
|
|
1185.1.41
by Robert Collins
massive patch from Alexander Belchenko - many PEP8 fixes, removes unused function uuid |
7 |
#
|
1
by mbp at sourcefrog
import from baz patch-364 |
8 |
# This program is distributed in the hope that it will be useful,
|
9 |
# but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
10 |
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
11 |
# GNU General Public License for more details.
|
|
1185.1.41
by Robert Collins
massive patch from Alexander Belchenko - many PEP8 fixes, removes unused function uuid |
12 |
#
|
1
by mbp at sourcefrog
import from baz patch-364 |
13 |
# You should have received a copy of the GNU General Public License
|
14 |
# along with this program; if not, write to the Free Software
|
|
4183.7.1
by Sabin Iacob
update FSF mailing address |
15 |
# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
|
1
by mbp at sourcefrog
import from baz patch-364 |
16 |
|
1996.3.14
by John Arbash Meinel
lazy_import osutils and sign_my_commits |
17 |
import os |
18 |
import re |
|
19 |
import stat |
|
20 |
from stat import (S_ISREG, S_ISDIR, S_ISLNK, ST_MODE, ST_SIZE, |
|
21 |
S_ISCHR, S_ISBLK, S_ISFIFO, S_ISSOCK) |
|
22 |
import sys |
|
23 |
import time |
|
5051.2.1
by Benjamin Peterson
move codecs import out of lazy section since it is used on module import |
24 |
import codecs |
4574.3.2
by Martin Pool
Change back to python warnings for failure to load extensions |
25 |
import warnings |
1996.3.14
by John Arbash Meinel
lazy_import osutils and sign_my_commits |
26 |
|
27 |
from bzrlib.lazy_import import lazy_import |
|
28 |
lazy_import(globals(), """ |
|
2215.6.1
by James Henstridge
Don't rely on time.timezone and time.altzone in local_time_offset(), |
29 |
from datetime import datetime
|
1185.1.41
by Robert Collins
massive patch from Alexander Belchenko - many PEP8 fixes, removes unused function uuid |
30 |
import errno
|
1711.4.5
by John Arbash Meinel
the _posix_* routines should use posixpath not os.path, so tests pass on win32 |
31 |
from ntpath import (abspath as _nt_abspath,
|
32 |
join as _nt_join,
|
|
33 |
normpath as _nt_normpath,
|
|
34 |
realpath as _nt_realpath,
|
|
1711.5.2
by John Arbash Meinel
win32 likes to return lowercase drive letters sometimes, and uppercase at other times. normalize this |
35 |
splitdrive as _nt_splitdrive,
|
1711.4.5
by John Arbash Meinel
the _posix_* routines should use posixpath not os.path, so tests pass on win32 |
36 |
)
|
37 |
import posixpath
|
|
1692.7.6
by Martin Pool
[patch] force deletion of trees containing readonly files (alexander) |
38 |
import shutil
|
1996.3.14
by John Arbash Meinel
lazy_import osutils and sign_my_commits |
39 |
from shutil import (
|
40 |
rmtree,
|
|
41 |
)
|
|
4747.5.3
by Vincent Ladeuil
Review feedback: import signal lazily and don't install SIGWINCH on windows. |
42 |
import signal
|
4398.4.3
by Vincent Ladeuil
Detect # cores on win32 and Solaris too. |
43 |
import subprocess
|
1185.31.40
by John Arbash Meinel
Added osutils.mkdtemp() |
44 |
import tempfile
|
1996.3.14
by John Arbash Meinel
lazy_import osutils and sign_my_commits |
45 |
from tempfile import (
|
46 |
mkdtemp,
|
|
47 |
)
|
|
1185.85.75
by John Arbash Meinel
Adding bzrlib.osutils.unicode_filename to handle unicode normalization for file paths. |
48 |
import unicodedata
|
1996.3.25
by John Arbash Meinel
Make importing errors lazy for osutils |
49 |
|
50 |
from bzrlib import (
|
|
2249.5.16
by John Arbash Meinel
[merge] bzr.dev 2283 |
51 |
cache_utf8,
|
1996.3.25
by John Arbash Meinel
Make importing errors lazy for osutils |
52 |
errors,
|
2245.4.6
by Alexander Belchenko
osutils.py: terminal_width() now use win32utils.get_console_size() |
53 |
win32utils,
|
1996.3.25
by John Arbash Meinel
Make importing errors lazy for osutils |
54 |
)
|
1996.3.14
by John Arbash Meinel
lazy_import osutils and sign_my_commits |
55 |
""") |
1
by mbp at sourcefrog
import from baz patch-364 |
56 |
|
3734.2.4
by Vincent Ladeuil
Fix python2.6 deprecation warnings related to hashlib. |
57 |
# sha and md5 modules are deprecated in python2.6 but hashlib is available as
|
58 |
# of 2.5
|
|
2929.3.1
by Vincent Ladeuil
Fix python2.6 deprecation warnings (still 4 failures 5 errors in test suite). |
59 |
if sys.version_info < (2, 5): |
3734.5.2
by Vincent Ladeuil
Martin's review feedback. |
60 |
import md5 as _mod_md5 |
61 |
md5 = _mod_md5.new |
|
62 |
import sha as _mod_sha |
|
63 |
sha = _mod_sha.new |
|
2929.3.1
by Vincent Ladeuil
Fix python2.6 deprecation warnings (still 4 failures 5 errors in test suite). |
64 |
else: |
65 |
from hashlib import ( |
|
66 |
md5, |
|
67 |
sha1 as sha, |
|
68 |
)
|
|
69 |
||
3504.4.1
by John Arbash Meinel
Write an alternative 'walkdirs' implementation that uses win32 apis. |
70 |
|
1185.1.41
by Robert Collins
massive patch from Alexander Belchenko - many PEP8 fixes, removes unused function uuid |
71 |
import bzrlib |
2309.4.3
by John Arbash Meinel
(broken) change safe_*_id to emit a warning. |
72 |
from bzrlib import symbol_versioning |
1185.1.41
by Robert Collins
massive patch from Alexander Belchenko - many PEP8 fixes, removes unused function uuid |
73 |
|
1
by mbp at sourcefrog
import from baz patch-364 |
74 |
|
4889.2.5
by John Arbash Meinel
Review feedback from Andrew. |
75 |
# Cross platform wall-clock time functionality with decent resolution.
|
76 |
# On Linux ``time.clock`` returns only CPU time. On Windows, ``time.time()``
|
|
77 |
# only has a resolution of ~15ms. Note that ``time.clock()`` is not
|
|
78 |
# synchronized with ``time.time()``, this is only meant to be used to find
|
|
79 |
# delta times by subtracting from another call to this function.
|
|
4889.2.1
by John Arbash Meinel
Make -Dhpss log debug information for the server process. |
80 |
# Wall-clock timer used for measuring elapsed time.  time.clock() is chosen
# on win32 and time.time() everywhere else; only ever subtract two readings
# taken from timer_func itself.
if sys.platform == 'win32':
    timer_func = time.clock
else:
    timer_func = time.time


# os.O_BINARY asks win32 to open a file in binary rather than text mode.
# Platforms that always open in binary mode do not define it, so fall back
# to 0 there: OR-ing 0 into the open flags changes nothing.
O_BINARY = getattr(os, 'O_BINARY', 0)
|
90 |
||
91 |
||
4355.2.2
by Alexander Belchenko
osutils.py: get_unicode_argv function (to obtain unicode command line arguments from sys.argv) moved to the beginning of module based on suggestions from review of John Meinel. |
92 |
def get_unicode_argv():
    """Return the command line arguments decoded to unicode.

    Every entry of sys.argv[1:] (the program name is skipped) is decoded
    with the encoding returned by get_user_encoding().

    :return: A list with the decoded arguments, in command line order.
    :raises errors.BzrError: if an argument cannot be decoded with the user
        encoding.
    """
    user_encoding = get_user_encoding()
    decoded = []
    for arg in sys.argv[1:]:
        try:
            decoded.append(arg.decode(user_encoding))
        except UnicodeDecodeError:
            # Name the offending argument explicitly instead of relying on
            # a comprehension variable leaking into the function scope.
            raise errors.BzrError(
                "Parameter '%r' is unsupported by the current "
                "encoding." % arg)
    return decoded
|
99 |
||
100 |
||
1
by mbp at sourcefrog
import from baz patch-364 |
101 |
def make_readonly(filename):
    """Make a filename read-only.

    Clears the owner, group and other write permission bits and leaves every
    other mode bit as it was.  The mode is read with os.lstat(); when
    filename is a symbolic link nothing is changed.

    :param filename: Path of the file to make read-only.
    """
    mode = os.lstat(filename).st_mode
    if stat.S_ISLNK(mode):
        return
    write_bits = stat.S_IWUSR | stat.S_IWGRP | stat.S_IWOTH
    os.chmod(filename, mode & ~write_bits)
|
1
by mbp at sourcefrog
import from baz patch-364 |
107 |
|
108 |
||
109 |
def make_writable(filename):
    """Make a filename writable by its owner.

    Sets the owner write permission bit and leaves every other mode bit as
    it was.  The mode is read with os.lstat(); when filename is a symbolic
    link nothing is changed.

    :param filename: Path of the file to make writable.
    """
    mode = os.lstat(filename).st_mode
    if stat.S_ISLNK(mode):
        return
    os.chmod(filename, mode | stat.S_IWUSR)
|
1
by mbp at sourcefrog
import from baz patch-364 |
114 |
|
115 |
||
2825.7.1
by Robert Collins
* Partial commits are now approximately 40% faster by walking over the |
116 |
def minimum_path_selection(paths):
    """Return the smallest subset of paths that still covers all of them.

    A path is left out when a path that is kept already contains it
    according to is_inside.

    :param paths: A container (and hence not None) of paths.
    :return: A set of paths sufficient to include everything in paths via
        is_inside, drawn from the paths parameter.
    """
    if len(paths) < 2:
        return set(paths)

    # Order by path components rather than by the raw string: 'a/b' then
    # sorts directly after 'a' instead of after 'a-b', so the contents of a
    # directory always follow it without interruption.  The single pass
    # below relies on that, as it only compares with the last kept path.
    ordered = sorted(paths, key=lambda path: path.split('/'))

    selected = [ordered[0]]
    for path in ordered[1:]:
        if not is_inside(selected[-1], path):
            # Not covered by the most recently kept path, so keep it too.
            selected.append(path)
    return set(selected)
2825.7.1
by Robert Collins
* Partial commits are now approximately 40% faster by walking over the |
137 |
|
138 |
||
1077
by Martin Pool
- avoid compiling REs at module load time |
139 |
# Compiled on first use by quotefn(), so that no regular expression has to be
# built at module load time.
_QUOTE_RE = None


def quotefn(f):
    """Return the filename f, quoted if it needs quoting.

    A name made up only of ASCII letters, digits and the characters
    ``. , : / \\ _ ~ -`` is returned unchanged; any other name is returned
    wrapped in double quotes.

    This previously used backslash quoting, but that works poorly on
    Windows.
    """
    # TODO: I'm not really sure this is the best format either.
    global _QUOTE_RE
    pattern = _QUOTE_RE
    if pattern is None:
        pattern = _QUOTE_RE = re.compile(r'([^a-zA-Z0-9.,:/\\_~-])')

    if pattern.search(f) is None:
        return f
    return '"' + f + '"'
|
1
by mbp at sourcefrog
import from baz patch-364 |
156 |
|
157 |
||
1753.1.1
by Robert Collins
(rbc, jam, mbp)Add bzrlib.osutils.walkdirs, an optimised walk-and-stat routine. |
158 |
_directory_kind = 'directory'


def get_umask():
    """Return the current umask.

    The umask is read by setting it to 0 and immediately setting it back to
    the value that call returned.
    """
    # XXX: This is not thread safe, but there is no way to get the
    #      umask without setting it.  Assume that people aren't messing
    #      with the umask while running.
    current = os.umask(0)
    os.umask(current)
    return current
|
168 |
||
169 |
||
2324.2.1
by Dmitry Vasiliev
kind_marker() optimization |
170 |
# Marker string for every kind that kind_marker() knows about.
_kind_marker_map = {
    'file': '',
    _directory_kind: '/',
    'symlink': '@',
    'tree-reference': '+',
}


def kind_marker(kind):
    """Return the marker string for kind, or '' when kind is not known."""
    # Indexing inside try/except is slightly faster than .get(kind, '') when
    # the common case is that kind will be found.
    try:
        marker = _kind_marker_map[kind]
    except KeyError:
        marker = ''
    return marker
|
1
by mbp at sourcefrog
import from baz patch-364 |
185 |
|
2324.2.1
by Dmitry Vasiliev
kind_marker() optimization |
186 |
|
1732.1.2
by John Arbash Meinel
just use os.path.lexists if it exists |
187 |
lexists = getattr(os.path, 'lexists', None) |
188 |
if lexists is None: |
|
189 |
def lexists(f): |
|
190 |
try: |
|
2324.2.2
by Dmitry Vasiliev
Fixed lexists() implementation |
191 |
stat = getattr(os, 'lstat', os.stat) |
192 |
stat(f) |
|
1732.1.2
by John Arbash Meinel
just use os.path.lexists if it exists |
193 |
return True |
2324.2.2
by Dmitry Vasiliev
Fixed lexists() implementation |
194 |
except OSError, e: |
1732.1.2
by John Arbash Meinel
just use os.path.lexists if it exists |
195 |
if e.errno == errno.ENOENT: |
196 |
return False; |
|
197 |
else: |
|
1996.3.25
by John Arbash Meinel
Make importing errors lazy for osutils |
198 |
raise errors.BzrError("lstat/stat of (%r): %r" % (f, e)) |
1732.1.2
by John Arbash Meinel
just use os.path.lexists if it exists |
199 |
|
1
by mbp at sourcefrog
import from baz patch-364 |
200 |
|
1185.31.47
by John Arbash Meinel
Added a fancy footwork rename to osutils, made SftpTransport use it. |
201 |
def fancy_rename(old, new, rename_func, unlink_func): |
202 |
"""A fancy rename, when you don't have atomic rename.
|
|
3943.8.1
by Marius Kruger
remove all trailing whitespace from bzr source |
203 |
|
1185.31.47
by John Arbash Meinel
Added a fancy footwork rename to osutils, made SftpTransport use it. |
204 |
:param old: The old path, to rename from
|
205 |
:param new: The new path, to rename to
|
|
206 |
:param rename_func: The potentially non-atomic rename function
|
|
4935.1.1
by Vincent Ladeuil
Support Unicode paths for ftp transport (encoded as utf8). |
207 |
:param unlink_func: A way to delete the target file if the full rename
|
208 |
succeeds
|
|
1185.31.47
by John Arbash Meinel
Added a fancy footwork rename to osutils, made SftpTransport use it. |
209 |
"""
|
210 |
# sftp rename doesn't allow overwriting, so play tricks:
|
|
211 |
base = os.path.basename(new) |
|
212 |
dirname = os.path.dirname(new) |
|
4935.1.3
by Vincent Ladeuil
Better fix for fancy_rename respecting callers file encoding. |
213 |
# callers use different encodings for the paths so the following MUST
|
214 |
# respect that. We rely on python upcasting to unicode if new is unicode
|
|
215 |
# and keeping a str if not.
|
|
216 |
tmp_name = 'tmp.%s.%.9f.%d.%s' % (base, time.time(), |
|
217 |
os.getpid(), rand_chars(10)) |
|
1185.31.47
by John Arbash Meinel
Added a fancy footwork rename to osutils, made SftpTransport use it. |
218 |
tmp_name = pathjoin(dirname, tmp_name) |
219 |
||
220 |
# Rename the file out of the way, but keep track if it didn't exist
|
|
221 |
# We don't want to grab just any exception
|
|
222 |
# something like EACCES should prevent us from continuing
|
|
223 |
# The downside is that the rename_func has to throw an exception
|
|
224 |
# with an errno = ENOENT, or NoSuchFile
|
|
225 |
file_existed = False |
|
226 |
try: |
|
227 |
rename_func(new, tmp_name) |
|
1996.3.25
by John Arbash Meinel
Make importing errors lazy for osutils |
228 |
except (errors.NoSuchFile,), e: |
1185.31.47
by John Arbash Meinel
Added a fancy footwork rename to osutils, made SftpTransport use it. |
229 |
pass
|
1532
by Robert Collins
Merge in John Meinels integration branch. |
230 |
except IOError, e: |
231 |
# RBC 20060103 abstraction leakage: the paramiko SFTP clients rename
|
|
1963.2.6
by Robey Pointer
pychecker is on crack; go back to using 'is None'. |
232 |
# function raises an IOError with errno is None when a rename fails.
|
1532
by Robert Collins
Merge in John Meinels integration branch. |
233 |
# This then gets caught here.
|
1185.50.37
by John Arbash Meinel
Fixed exception handling for fancy_rename |
234 |
if e.errno not in (None, errno.ENOENT, errno.ENOTDIR): |
1532
by Robert Collins
Merge in John Meinels integration branch. |
235 |
raise
|
1185.31.47
by John Arbash Meinel
Added a fancy footwork rename to osutils, made SftpTransport use it. |
236 |
except Exception, e: |
1963.2.6
by Robey Pointer
pychecker is on crack; go back to using 'is None'. |
237 |
if (getattr(e, 'errno', None) is None |
1185.31.47
by John Arbash Meinel
Added a fancy footwork rename to osutils, made SftpTransport use it. |
238 |
or e.errno not in (errno.ENOENT, errno.ENOTDIR)): |
239 |
raise
|
|
240 |
else: |
|
241 |
file_existed = True |
|
242 |
||
4789.17.1
by John Arbash Meinel
Change fancy_rename slightly. |
243 |
failure_exc = None |
1185.31.47
by John Arbash Meinel
Added a fancy footwork rename to osutils, made SftpTransport use it. |
244 |
success = False |
245 |
try: |
|
2978.8.2
by Alexander Belchenko
teach fancy_rename to handle change case renames in possible case-insensitive filesystem |
246 |
try: |
247 |
# This may throw an exception, in which case success will
|
|
248 |
# not be set.
|
|
249 |
rename_func(old, new) |
|
250 |
success = True |
|
251 |
except (IOError, OSError), e: |
|
2978.8.3
by Alexander Belchenko
Aaron's review |
252 |
# source and target may be aliases of each other (e.g. on a
|
253 |
# case-insensitive filesystem), so we may have accidentally renamed
|
|
254 |
# source by when we tried to rename target
|
|
4789.17.1
by John Arbash Meinel
Change fancy_rename slightly. |
255 |
failure_exc = sys.exc_info() |
256 |
if (file_existed and e.errno in (None, errno.ENOENT) |
|
257 |
and old.lower() == new.lower()): |
|
258 |
# source and target are the same file on a case-insensitive
|
|
259 |
# filesystem, so we don't generate an exception
|
|
260 |
failure_exc = None |
|
1185.31.47
by John Arbash Meinel
Added a fancy footwork rename to osutils, made SftpTransport use it. |
261 |
finally: |
262 |
if file_existed: |
|
263 |
# If the file used to exist, rename it back into place
|
|
264 |
# otherwise just delete it from the tmp location
|
|
265 |
if success: |
|
1551.15.4
by Aaron Bentley
Revert now-unnecessary changes |
266 |
unlink_func(tmp_name) |
1185.31.47
by John Arbash Meinel
Added a fancy footwork rename to osutils, made SftpTransport use it. |
267 |
else: |
1185.31.49
by John Arbash Meinel
Some corrections using the new osutils.rename. **ALL TESTS PASS** |
268 |
rename_func(tmp_name, new) |
4789.17.2
by John Arbash Meinel
Also handle the case when source *and* target does not exist. |
269 |
if failure_exc is not None: |
270 |
raise failure_exc[0], failure_exc[1], failure_exc[2] |
|
1185.31.47
by John Arbash Meinel
Added a fancy footwork rename to osutils, made SftpTransport use it. |
271 |
|
1685.1.9
by John Arbash Meinel
Updated LocalTransport so that it's base is now a URL rather than a local path. This helps consistency with all other functions. To do so, I added local_abspath() which returns the local path, and local_path_to/from_url |
272 |
|
1685.1.20
by John Arbash Meinel
More changes to get 'bzr branch' and 'bzr pull' to work |
273 |
# In Python 2.4.2 and older, os.path.abspath and os.path.realpath
|
274 |
# choke on a Unicode string containing a relative path if
|
|
275 |
# os.getcwd() returns a non-sys.getdefaultencoding()-encoded
|
|
276 |
# string.
|
|
2093.1.1
by John Arbash Meinel
(Bart Teeuwisse) if sys.getfilesystemencoding() is None, use 'utf-8' |
277 |
# Filesystem encoding, with 'utf-8' as the fallback when Python reports none.
_fs_enc = sys.getfilesystemencoding() or 'utf-8'


def _posix_abspath(path):
    """Return the normalized absolute form of path, using posixpath rules."""
    # jam 20060426 rather than encoding to fsencoding
    # copy posixpath.abspath, but use this module's getcwd() instead
    if posixpath.isabs(path):
        absolute = path
    else:
        absolute = posixpath.join(getcwd(), path)
    return posixpath.normpath(absolute)


def _posix_realpath(path):
    """Return posixpath.realpath() of path.

    The path is encoded to the filesystem encoding for the call and the
    result is decoded from it again.
    """
    encoded = path.encode(_fs_enc)
    resolved = posixpath.realpath(encoded)
    return resolved.decode(_fs_enc)
1685.1.20
by John Arbash Meinel
More changes to get 'bzr branch' and 'bzr pull' to work |
288 |
|
289 |
||
1711.5.2
by John Arbash Meinel
win32 likes to return lowercase drive letters sometimes, and uppercase at other times. normalize this |
290 |
def _win32_fixdrive(path):
    """Return path with its drive part forced to upper case.

    win32 is inconsistent about whether it returns a lower or an upper case
    drive letter, and even if it were consistent the user might type the
    other one, so it is always upper-cased here:
    running python.exe under cmd.exe returns capital C:\\
    running win32 python inside a cygwin shell returns lowercase c:\\
    """
    drive, rest = _nt_splitdrive(path)
    return drive.upper() + rest
|
301 |
||
302 |
||
1685.1.20
by John Arbash Meinel
More changes to get 'bzr branch' and 'bzr pull' to work |
303 |
def _win32_abspath(path):
    """Return the absolute path, with '/' separators and an upper case drive."""
    # Real _nt_abspath doesn't have a problem with a unicode cwd
    absolute = _nt_abspath(unicode(path))
    return _win32_fixdrive(absolute.replace('\\', '/'))
1685.1.20
by John Arbash Meinel
More changes to get 'bzr branch' and 'bzr pull' to work |
306 |
|
307 |
||
2279.4.1
by Alexander Belchenko
Reimplementation of ntpath.abspath in Python for Windows98: unicode safe, UNC path safe |
308 |
def _win98_abspath(path):
    """Return the absolute version of a path.

    Windows 98 safe implementation (python reimplementation
    of Win32 API function GetFullPathNameW)
    """
    # Corner cases:
    #   C:\path     => C:/path
    #   C:/path     => C:/path
    #   \\HOST\path => //HOST/path
    #   //HOST/path => //HOST/path
    #   path        => C:/cwd/path
    #   /path       => C:/path
    path = unicode(path)
    drive = _nt_splitdrive(path)[0]
    starts_with_two_slashes = path[:2] in ('//', '\\\\')
    if drive == '' and not starts_with_two_slashes:
        # Not absolute yet: complete it from the current directory.
        cwd = os.getcwdu()
        # we cannot simply os.path.join cwd and path
        # because os.path.join('C:','/path') produce '/path'
        # and this is incorrect
        if path[:1] in ('/', '\\'):
            # Rooted but without a drive: only borrow the drive of the cwd.
            cwd = _nt_splitdrive(cwd)[0]
            path = path[1:]
        path = cwd + '\\' + path
    normalized = _nt_normpath(path).replace('\\', '/')
    return _win32_fixdrive(normalized)
|
333 |
||
334 |
||
1685.1.20
by John Arbash Meinel
More changes to get 'bzr branch' and 'bzr pull' to work |
335 |
def _win32_realpath(path):
    """Return ntpath.realpath() of path, '/'-separated, upper case drive."""
    # Real _nt_realpath doesn't have a problem with a unicode cwd
    resolved = _nt_realpath(unicode(path))
    return _win32_fixdrive(resolved.replace('\\', '/'))
1685.1.20
by John Arbash Meinel
More changes to get 'bzr branch' and 'bzr pull' to work |
338 |
|
339 |
||
340 |
def _win32_pathjoin(*args):
    """Join the path components with ntpath.join, then use '/' separators."""
    joined = _nt_join(*args)
    return joined.replace('\\', '/')
1685.1.20
by John Arbash Meinel
More changes to get 'bzr branch' and 'bzr pull' to work |
342 |
|
343 |
||
344 |
def _win32_normpath(path):
    """Return ntpath.normpath() of path, '/'-separated, upper case drive."""
    normalized = _nt_normpath(unicode(path))
    return _win32_fixdrive(normalized.replace('\\', '/'))
1685.1.20
by John Arbash Meinel
More changes to get 'bzr branch' and 'bzr pull' to work |
346 |
|
347 |
||
348 |
def _win32_getcwd():
    """Return os.getcwdu(), '/'-separated and with an upper case drive."""
    cwd = os.getcwdu()
    return _win32_fixdrive(cwd.replace('\\', '/'))
1685.1.20
by John Arbash Meinel
More changes to get 'bzr branch' and 'bzr pull' to work |
350 |
|
351 |
||
352 |
def _win32_mkdtemp(*args, **kwargs):
    """Call tempfile.mkdtemp() and return its path in this module's style.

    All arguments are passed straight through to tempfile.mkdtemp(); the
    resulting path gets '/' separators and an upper case drive.
    """
    created = tempfile.mkdtemp(*args, **kwargs)
    return _win32_fixdrive(created.replace('\\', '/'))
1685.1.20
by John Arbash Meinel
More changes to get 'bzr branch' and 'bzr pull' to work |
354 |
|
355 |
||
356 |
def _win32_rename(old, new): |
|
1711.7.6
by John Arbash Meinel
Change _win32_rename() so that it raises ENOENT *before* it tries any renaming. |
357 |
"""We expect to be able to atomically replace 'new' with old.
|
358 |
||
1711.7.17
by John Arbash Meinel
Delay the extra syscall in _win32_rename until we get a failure. |
359 |
On win32, if new exists, it must be moved out of the way first,
|
3943.8.1
by Marius Kruger
remove all trailing whitespace from bzr source |
360 |
and then deleted.
|
1711.7.6
by John Arbash Meinel
Change _win32_rename() so that it raises ENOENT *before* it tries any renaming. |
361 |
"""
|
1711.7.17
by John Arbash Meinel
Delay the extra syscall in _win32_rename until we get a failure. |
362 |
try: |
363 |
fancy_rename(old, new, rename_func=os.rename, unlink_func=os.unlink) |
|
364 |
except OSError, e: |
|
1830.3.15
by John Arbash Meinel
On Mac we get EINVAL when renaming cwd |
365 |
if e.errno in (errno.EPERM, errno.EACCES, errno.EBUSY, errno.EINVAL): |
3943.8.1
by Marius Kruger
remove all trailing whitespace from bzr source |
366 |
# If we try to rename a non-existant file onto cwd, we get
|
367 |
# EPERM or EACCES instead of ENOENT, this will raise ENOENT
|
|
1830.3.15
by John Arbash Meinel
On Mac we get EINVAL when renaming cwd |
368 |
# if the old path doesn't exist, sometimes we get EACCES
|
369 |
# On Linux, we seem to get EBUSY, on Mac we get EINVAL
|
|
1711.7.17
by John Arbash Meinel
Delay the extra syscall in _win32_rename until we get a failure. |
370 |
os.lstat(old) |
371 |
raise
|
|
1685.1.20
by John Arbash Meinel
More changes to get 'bzr branch' and 'bzr pull' to work |
372 |
|
373 |
||
1830.3.11
by John Arbash Meinel
Create a mac version of 'getcwd()' which normalizes the path. |
374 |
def _mac_getcwd():
    """Return os.getcwdu() normalized to unicode form NFC."""
    cwd = os.getcwdu()
    return unicodedata.normalize('NFC', cwd)
1830.3.11
by John Arbash Meinel
Create a mac version of 'getcwd()' which normalizes the path. |
376 |
|
377 |
||
1692.7.6
by Martin Pool
[patch] force deletion of trees containing readonly files (alexander) |
378 |
# Default is to just use the python builtins, but these can be rebound on
|
379 |
# particular platforms.
|
|
1685.1.20
by John Arbash Meinel
More changes to get 'bzr branch' and 'bzr pull' to work |
380 |
# Implemented in this module.
abspath = _posix_abspath
realpath = _posix_realpath

# Taken as they are from the standard library.
getcwd = os.getcwdu
rename = os.rename
pathjoin = os.path.join
normpath = os.path.normpath
dirname = os.path.dirname
basename = os.path.basename
split = os.path.split
splitext = os.path.splitext
# mkdtemp and rmtree need no binding here: the import section of this
# module already brings both names into the module namespace.

# Default value; the win32 setup of this module replaces it.
MIN_ABS_PATHLENGTH = 1
395 |
||
1685.1.9
by John Arbash Meinel
Updated LocalTransport so that it's base is now a URL rather than a local path. This helps consistency with all other functions. To do so, I added local_abspath() which returns the local path, and local_path_to/from_url |
396 |
|
1185.31.47
by John Arbash Meinel
Added a fancy footwork rename to osutils, made SftpTransport use it. |
397 |
if sys.platform == 'win32':
    # Rebind the generic names to the win32 implementations.
    if win32utils.winver == 'Windows 98':
        abspath = _win98_abspath
    else:
        abspath = _win32_abspath
    realpath = _win32_realpath
    pathjoin = _win32_pathjoin
    normpath = _win32_normpath
    getcwd = _win32_getcwd
    mkdtemp = _win32_mkdtemp
    rename = _win32_rename

    MIN_ABS_PATHLENGTH = 3

    def _win32_delete_readonly(function, path, excinfo):
        """Error handler for shutil.rmtree function [for win32]

        Helps to remove files and dirs marked as read-only: when os.remove
        or os.rmdir failed with an OSError whose errno is EACCES, the path
        is made writable and the same function is called once more.  Any
        other failure is re-raised.

        :param function: The function that failed.
        :param path: The path that function was called with.
        :param excinfo: The exc_info tuple describing the failure.
        """
        exception = excinfo[1]
        can_retry = (function in (os.remove, os.rmdir)
                     and isinstance(exception, OSError)
                     and exception.errno == errno.EACCES)
        if not can_retry:
            # Re-raises the exception that is currently being handled.
            raise
        make_writable(path)
        function(path)

    def rmtree(path, ignore_errors=False, onerror=_win32_delete_readonly):
        """Replacer for shutil.rmtree: could remove readonly dirs/files"""
        return shutil.rmtree(path, ignore_errors, onerror)

    f = win32utils.get_unicode_argv     # special function or None
    if f is not None:
        get_unicode_argv = f

elif sys.platform == 'darwin':
    getcwd = _mac_getcwd
|
1692.7.6
by Martin Pool
[patch] force deletion of trees containing readonly files (alexander) |
434 |
|
1685.1.31
by John Arbash Meinel
Adding tests for the rest of the _win32 functions. |
435 |
|
1711.4.10
by John Arbash Meinel
Pull out sys.stdout.encoding handling into a separate function so it can be tested, and used elsewhere. |
436 |
def get_terminal_encoding():
    """Pick the encoding to use when printing to the screen.

    The candidates are tried in this order: sys.stdout.encoding,
    sys.stdin.encoding, then osutils.get_user_encoding().  The decision
    is logged with mutter().

    On Windows, locale.getpreferredencoding() is not the same encoding as
    the one used by the console:
    http://mail.python.org/pipermail/python-list/2003-May/162357.html
    (e.g. on a standard US Windows XP the preferred encoding is cp1252 but
    the console is cp437).

    :return: The name of an encoding.  If the chosen name is 'cp0' or is
        unknown to the codecs module, get_user_encoding() is returned
        instead (with a warning on stderr in the unknown-codec case).
    """
    from bzrlib.trace import mutter
    output_encoding = getattr(sys.stdout, 'encoding', None)
    if output_encoding:
        mutter('encoding stdout as sys.stdout encoding %r', output_encoding)
    else:
        input_encoding = getattr(sys.stdin, 'encoding', None)
        if input_encoding:
            output_encoding = input_encoding
            mutter('encoding stdout as sys.stdin encoding %r',
                   output_encoding)
        else:
            output_encoding = get_user_encoding()
            mutter('encoding stdout as osutils.get_user_encoding() %r',
                   output_encoding)
    if output_encoding == 'cp0':
        # invalid encoding (cp0 means 'no codepage' on Windows)
        output_encoding = get_user_encoding()
        mutter('cp0 is invalid encoding.'
               ' encoding stdout as osutils.get_user_encoding() %r',
               output_encoding)
    # Make sure Python actually has a codec for the chosen name.
    try:
        codecs.lookup(output_encoding)
    except LookupError:
        sys.stderr.write('bzr: warning:'
                         ' unknown terminal encoding %s.\n'
                         ' Using encoding %s instead.\n'
                         % (output_encoding, get_user_encoding())
                        )
        output_encoding = get_user_encoding()

    return output_encoding
480 |
||
481 |
||
1185.31.32
by John Arbash Meinel
Updated the bzr sourcecode to use bzrlib.osutils.pathjoin rather than os.path.join to enforce internal use of / instead of \ |
482 |
def normalizepath(f):
    """Return f with its directory part resolved.

    The resolver is realpath when os.path provides a realpath attribute,
    otherwise abspath.  When the last component of f is empty, '.' or
    '..', the whole path is resolved; otherwise only the parent directory
    is resolved and the last component is joined back on unchanged.
    """
    if getattr(os.path, 'realpath', None) is None:
        resolve = abspath
    else:
        resolve = realpath
    parent, leaf = os.path.split(f)
    if leaf in ("", ".", ".."):
        return resolve(f)
    return pathjoin(resolve(parent), leaf)
|
492 |
||
1
by mbp at sourcefrog
import from baz patch-364 |
493 |
|
494 |
def isdir(f):
    """True if f is an accessible directory.

    Uses lstat, so a symlink is judged by its own mode, not its target's.
    An OSError from lstat is reported as False.
    """
    try:
        mode = os.lstat(f)[ST_MODE]
    except OSError:
        return False
    return S_ISDIR(mode)
|
500 |
||
501 |
||
502 |
def isfile(f):
    """True if f is a regular file.

    Uses lstat, so a symlink is judged by its own mode, not its target's.
    An OSError from lstat is reported as False.
    """
    try:
        mode = os.lstat(f)[ST_MODE]
    except OSError:
        return False
    return S_ISREG(mode)
|
508 |
||
1092.2.6
by Robert Collins
symlink support updated to work |
509 |
def islink(f):
    """True if f is a symlink.

    An OSError from lstat is reported as False.
    """
    try:
        mode = os.lstat(f)[ST_MODE]
    except OSError:
        return False
    return S_ISLNK(mode)
|
1
by mbp at sourcefrog
import from baz patch-364 |
515 |
|
485
by Martin Pool
- move commit code into its own module |
516 |
def is_inside(dir, fname):
    """True if fname is inside dir.

    This is a purely textual test: fname is inside dir when the two are
    equal or when fname starts with dir followed by '/'.

    The parameters should typically be passed to osutils.normpath first, so
    that . and .. and repeated slashes are eliminated, and the separators
    are canonical for the platform.

    The empty string as a dir name is taken as top-of-tree and matches
    everything.
    """
    # XXX: Most callers of this can actually do something smarter by
    # looking at the inventory
    if dir == fname or dir == '':
        return True

    # Compare against "dir/" so that 'src' does not match 'srccontrol'.
    if not dir.endswith('/'):
        dir = dir + '/'

    return fname.startswith(dir)
538 |
||
485
by Martin Pool
- move commit code into its own module |
539 |
|
540 |
def is_inside_any(dir_list, fname):
    """True if fname is inside any of given dirs.

    Each entry of dir_list is tested with is_inside(); the scan stops at
    the first match.
    """
    for dirname in dir_list:
        if is_inside(dirname, fname):
            break
    else:
        # Loop ran to completion: no directory contained fname.
        return False
    return True
485
by Martin Pool
- move commit code into its own module |
546 |
|
547 |
||
1740.3.4
by Jelmer Vernooij
Move inventory to commit builder. |
548 |
def is_inside_or_parent_of_any(dir_list, fname):
    """True if fname is a child or a parent of any of the given files.

    For each entry, is_inside() is tried in both directions; the scan
    stops at the first match.
    """
    for dirname in dir_list:
        if is_inside(dirname, fname):
            break
        if is_inside(fname, dirname):
            break
    else:
        return False
    return True
1740.3.4
by Jelmer Vernooij
Move inventory to commit builder. |
554 |
|
555 |
||
3956.2.1
by John Arbash Meinel
Add report_activity to osutils.pumpfile |
556 |
def pumpfile(from_file, to_file, read_length=-1, buff_size=32768,
             report_activity=None, direction='read'):
    """Copy contents of one file to another.

    The read_length can either be -1 to read to end-of-file (EOF) or
    it can specify the maximum number of bytes to read.

    The buff_size represents the maximum size for each read operation
    performed on from_file.

    :param report_activity: Call this as bytes are read, see
        Transport._report_activity
    :param direction: Will be passed to report_activity

    :return: The number of bytes copied.
    """
    # A negative read_length means "copy until EOF"; otherwise it is a
    # budget that shrinks with every block copied.
    bounded = read_length >= 0
    copied = 0
    while True:
        if bounded:
            if read_length <= 0:
                break
            request = min(read_length, buff_size)
        else:
            request = buff_size

        block = from_file.read(request)
        if not block:
            # EOF reached
            break
        block_len = len(block)
        # Activity is reported before the block is written out.
        if report_activity is not None:
            report_activity(block_len, direction)
        to_file.write(block)

        copied += block_len
        if bounded:
            read_length -= block_len
    return copied
1
by mbp at sourcefrog
import from baz patch-364 |
602 |
|
603 |
||
3635.1.2
by Robert Collins
Add osutils.pump_string_file helper function. |
604 |
def pump_string_file(bytes, file_handle, segment_size=None):
    """Write bytes to file_handle in many smaller writes.

    :param bytes: The string to write.
    :param file_handle: The file to write to.
    :param segment_size: Maximum number of bytes per write() call.  A
        false value (None, 0) selects the default of 5MB.
    """
    # Write data in chunks rather than all at once, because very large
    # writes fail on some platforms (e.g. Windows with SMB mounted
    # drives).
    if not segment_size:
        segment_size = 5242880 # 5MB
    write = file_handle.write
    # Step through the data by offset.  This needs no division (so it does
    # not depend on '/' meaning integer division) and never issues a
    # trailing empty write when the length is an exact multiple of
    # segment_size.
    for offset in range(0, len(bytes), segment_size):
        # buffer() gives a view onto the data without copying the segment.
        write(buffer(bytes, offset, segment_size))
|
620 |
||
621 |
||
1185.67.7
by Aaron Bentley
Refactored a bit |
622 |
def file_iterator(input_file, readsize=32768):
    """Yield successive chunks read from input_file.

    :param input_file: Object with a read(size) method.
    :param readsize: Size passed to each read() call.

    Iteration stops at the first read that returns a zero-length result.
    """
    chunk = input_file.read(readsize)
    while len(chunk) != 0:
        yield chunk
        chunk = input_file.read(readsize)
|
628 |
||
629 |
||
1
by mbp at sourcefrog
import from baz patch-364 |
630 |
def sha_file(f):
    """Calculate the hexdigest of an open file.

    The file cursor should be already at the start.  The file is read in
    128kB blocks until read() returns an empty result.
    """
    digest = sha()
    BUFSIZE = 128<<10
    chunk = f.read(BUFSIZE)
    while chunk:
        digest.update(chunk)
        chunk = f.read(BUFSIZE)
    return digest.hexdigest()
643 |
||
644 |
||
3368.2.49
by Ian Clatworthy
added osutils.size_sha_file() with tests |
645 |
def size_sha_file(f):
    """Calculate the size and hexdigest of an open file.

    The file cursor should be already at the start and
    the caller is responsible for closing the file afterwards.

    :return: A (size, hexdigest) tuple, where size is the total length of
        the blocks read.
    """
    total = 0
    digest = sha()
    BUFSIZE = 128<<10
    chunk = f.read(BUFSIZE)
    while chunk:
        total += len(chunk)
        digest.update(chunk)
        chunk = f.read(BUFSIZE)
    return total, digest.hexdigest()
|
661 |
||
662 |
||
2872.3.1
by Martin Pool
Add -Dhashcache option; clean up dirstate sha1 code |
663 |
def sha_file_by_name(fname):
    """Calculate the SHA1 of a file by reading the full text

    The file is opened with os.open (read-only, O_BINARY) and read with
    os.read in 64kB blocks; the descriptor is always closed.
    """
    digest = sha()
    fd = os.open(fname, os.O_RDONLY | O_BINARY)
    try:
        chunk = os.read(fd, 1<<16)
        while chunk:
            digest.update(chunk)
            chunk = os.read(fd, 1<<16)
    finally:
        os.close(fd)
    return digest.hexdigest()
2872.3.1
by Martin Pool
Add -Dhashcache option; clean up dirstate sha1 code |
675 |
|
676 |
||
2929.3.1
by Vincent Ladeuil
Fix python2.6 deprecation warnings (still 4 failures 5 errors in test suite). |
677 |
def sha_strings(strings, _factory=sha):
    """Return the sha-1 of concatenation of strings

    :param strings: Iterable of strings, fed to the hash in order.
    :param _factory: Callable returning a new hash object.
    """
    hasher = _factory()
    update = hasher.update
    for chunk in strings:
        update(chunk)
    return hasher.hexdigest()
|
682 |
||
683 |
||
2929.3.1
by Vincent Ladeuil
Fix python2.6 deprecation warnings (still 4 failures 5 errors in test suite). |
684 |
def sha_string(f, _factory=sha):
    """Return the hexdigest of the single string f.

    :param _factory: Callable that builds a hash object from a string.
    """
    hasher = _factory(f)
    return hasher.hexdigest()
1
by mbp at sourcefrog
import from baz patch-364 |
686 |
|
687 |
||
124
by mbp at sourcefrog
- check file text for past revisions is correct |
688 |
def fingerprint_file(f):
    """Return the size and sha1 of the remaining content of f.

    The content is obtained with a single f.read() call.

    :return: A dict with keys 'size' and 'sha1' (a hexdigest).
    """
    content = f.read()
    fingerprint = {}
    fingerprint['size'] = len(content)
    fingerprint['sha1'] = sha(content).hexdigest()
    return fingerprint
124
by mbp at sourcefrog
- check file text for past revisions is correct |
692 |
|
693 |
||
1
by mbp at sourcefrog
import from baz patch-364 |
694 |
def compare_files(a, b):
    """Returns true if equal in contents

    :param a: Object with a read(size) method.
    :param b: Object with a read(size) method.

    Both files are read one 4096-byte block at a time and the blocks are
    compared pairwise, so the comparison stops at the first difference.
    """
    BUFSIZE = 4096
    while True:
        ai = a.read(BUFSIZE)
        bi = b.read(BUFSIZE)
        if ai != bi:
            return False
        # Both blocks are equal here, so an empty block means both files
        # hit EOF together.  Test for emptiness rather than equality with
        # '' so that any empty read result (str, unicode, bytes, ...) ends
        # the loop instead of spinning forever.
        if not ai:
            return True
|
1
by mbp at sourcefrog
import from baz patch-364 |
704 |
|
705 |
||
49
by mbp at sourcefrog
fix local-time-offset calculation |
706 |
def local_time_offset(t=None):
    """Return offset of local zone from GMT, either at present or at time t.

    :param t: Seconds since the epoch; None means time.time().
    :return: The difference, in seconds, between the local and the UTC
        rendering of t.
    """
    if t is None:
        t = time.time()
    local_naive = datetime.fromtimestamp(t)
    utc_naive = datetime.utcfromtimestamp(t)
    delta = local_naive - utc_naive
    return delta.days * 86400 + delta.seconds
|
8
by mbp at sourcefrog
store committer's timezone in revision and show |
712 |
|
3512.3.1
by Martin von Gagern
Hand-selected minimalistic set of changes from my setlocale branch. |
713 |
weekdays = ['Mon', 'Tue', 'Wed', 'Thu', 'Fri', 'Sat', 'Sun'] |
4379.4.1
by Ian Clatworthy
make log --long faster |
714 |
_default_format_by_weekday_num = [wd + " %Y-%m-%d %H:%M:%S" for wd in weekdays] |
715 |
||
3943.8.1
by Marius Kruger
remove all trailing whitespace from bzr source |
716 |
|
2425.6.2
by Martin Pool
Make timestamps use existing format_date; document that function more |
717 |
def format_date(t, offset=0, timezone='original', date_fmt=None,
                show_offset=True):
    """Return a formatted date string.

    Any '%a' in the format is replaced by the entry of the module-level
    weekdays list for that day before strftime is called.

    :param t: Seconds since the epoch.
    :param offset: Timezone offset in seconds east of utc.
    :param timezone: How to display the time: 'utc', 'original' for the
         timezone specified by offset, or 'local' for the process's current
         timezone.
    :param date_fmt: strftime format.
    :param show_offset: Whether to append the timezone.
    """
    parts = _format_date(t, offset, timezone, date_fmt, show_offset)
    date_fmt, tt, offset_str = parts
    day_name = weekdays[tt[6]]
    date_fmt = date_fmt.replace('%a', day_name)
    return time.strftime(date_fmt, tt) + offset_str
|
734 |
||
4379.4.1
by Ian Clatworthy
make log --long faster |
735 |
|
736 |
# Cache of formatted offset strings
_offset_cache = {}


def format_date_with_offset_in_original_timezone(t, offset=0,
    _cache=_offset_cache):
    """Return a formatted date string in the original timezone.

    This routine may be faster than format_date.

    :param t: Seconds since the epoch.
    :param offset: Timezone offset in seconds east of utc.  None is
        treated as 0.
    :param _cache: Dict mapping offset to its formatted ' +HHMM' string.
    """
    if offset is None:
        offset = 0
    tt = time.gmtime(t + offset)
    date_fmt = _default_format_by_weekday_num[tt[6]]
    date_str = time.strftime(date_fmt, tt)
    offset_str = _cache.get(offset, None)
    if offset_str is None:
        # Format sign and magnitude separately.  Dividing a negative
        # offset directly floors towards minus infinity, which renders
        # e.g. -12600 (-03:30) as '-0430' and -1800 as '+0030'.
        if offset < 0:
            sign = '-'
        else:
            sign = '+'
        hours, minutes = divmod(int(abs(offset)) // 60, 60)
        offset_str = ' %s%02d%02d' % (sign, hours, minutes)
        _cache[offset] = offset_str
    return date_str + offset_str
|
759 |
||
760 |
||
3526.5.4
by Martin von Gagern
Use separate function format_local_date for local weekday formats in unicode. |
761 |
def format_local_date(t, offset=0, timezone='original', date_fmt=None,
                      show_offset=True):
    """Return a unicode date string formatted according to the current locale.

    Unlike format_date, the format is handed to strftime untouched.  If
    strftime does not return unicode, the result is decoded with
    get_user_encoding(), replacing undecodable bytes.

    :param t: Seconds since the epoch.
    :param offset: Timezone offset in seconds east of utc.
    :param timezone: How to display the time: 'utc', 'original' for the
         timezone specified by offset, or 'local' for the process's current
         timezone.
    :param date_fmt: strftime format.
    :param show_offset: Whether to append the timezone.
    """
    parts = _format_date(t, offset, timezone, date_fmt, show_offset)
    date_fmt, tt, offset_str = parts
    date_str = time.strftime(date_fmt, tt)
    if isinstance(date_str, unicode):
        return date_str + offset_str
    decoded = date_str.decode(get_user_encoding(), 'replace')
    return decoded + offset_str
779 |
||
4379.4.1
by Ian Clatworthy
make log --long faster |
780 |
|
3526.5.4
by Martin von Gagern
Use separate function format_local_date for local weekday formats in unicode. |
781 |
def _format_date(t, offset, timezone, date_fmt, show_offset): |
8
by mbp at sourcefrog
store committer's timezone in revision and show |
782 |
if timezone == 'utc': |
1
by mbp at sourcefrog
import from baz patch-364 |
783 |
tt = time.gmtime(t) |
784 |
offset = 0 |
|
8
by mbp at sourcefrog
store committer's timezone in revision and show |
785 |
elif timezone == 'original': |
1963.2.6
by Robey Pointer
pychecker is on crack; go back to using 'is None'. |
786 |
if offset is None: |
23
by mbp at sourcefrog
format_date: handle revisions with no timezone offset |
787 |
offset = 0 |
16
by mbp at sourcefrog
fix inverted calculation for original timezone -> utc |
788 |
tt = time.gmtime(t + offset) |
12
by mbp at sourcefrog
new --timezone option for bzr log |
789 |
elif timezone == 'local': |
1
by mbp at sourcefrog
import from baz patch-364 |
790 |
tt = time.localtime(t) |
49
by mbp at sourcefrog
fix local-time-offset calculation |
791 |
offset = local_time_offset(t) |
12
by mbp at sourcefrog
new --timezone option for bzr log |
792 |
else: |
3144.1.1
by Lukáš Lalinský
Fixed error reporting of unsupported timezone format. |
793 |
raise errors.UnsupportedTimezoneFormat(timezone) |
1185.12.24
by Aaron Bentley
Made format_date more flexible |
794 |
if date_fmt is None: |
795 |
date_fmt = "%a %Y-%m-%d %H:%M:%S" |
|
796 |
if show_offset: |
|
797 |
offset_str = ' %+03d%02d' % (offset / 3600, (offset / 60) % 60) |
|
798 |
else: |
|
799 |
offset_str = '' |
|
3526.5.4
by Martin von Gagern
Use separate function format_local_date for local weekday formats in unicode. |
800 |
return (date_fmt, tt, offset_str) |
1
by mbp at sourcefrog
import from baz patch-364 |
801 |
|
802 |
||
803 |
def compact_date(when):
    """Return when as a 14-digit YYYYMMDDHHMMSS string in UTC.

    :param when: Seconds since the epoch.
    """
    utc_tuple = time.gmtime(when)
    return time.strftime('%Y%m%d%H%M%S', utc_tuple)
|
3943.8.1
by Marius Kruger
remove all trailing whitespace from bzr source |
805 |
|
1
by mbp at sourcefrog
import from baz patch-364 |
806 |
|
1957.1.4
by John Arbash Meinel
create a helper for formatting a time delta |
807 |
def format_delta(delta):
    """Get a nice looking string for a time delta.

    :param delta: The time difference in seconds, can be positive or negative.
        positive indicates time in the past, negative indicates time in the
        future. (usually time.time() - stored_time)
    :return: String formatted to show approximate resolution: plain
        seconds below 90 seconds, minutes and seconds below 90 minutes,
        hours and minutes beyond that.
    """
    delta = int(delta)
    if delta < 0:
        direction = 'in the future'
        delta = -delta
    else:
        direction = 'ago'

    if delta < 90: # print seconds up to 90 seconds
        if delta == 1:
            return '%d second %s' % (delta, direction,)
        return '%d seconds %s' % (delta, direction)

    minutes, seconds = divmod(delta, 60)
    if seconds == 1:
        plural_seconds = ''
    else:
        plural_seconds = 's'
    if minutes < 90: # print minutes, seconds up to 90 minutes
        if minutes == 1:
            return '%d minute, %d second%s %s' % (
                    minutes, seconds, plural_seconds, direction)
        return '%d minutes, %d second%s %s' % (
                minutes, seconds, plural_seconds, direction)

    # From here on the leftover seconds are no longer shown.
    hours, minutes = divmod(minutes, 60)
    if minutes == 1:
        plural_minutes = ''
    else:
        plural_minutes = 's'

    if hours == 1:
        return '%d hour, %d minute%s %s' % (hours, minutes,
                                            plural_minutes, direction)
    return '%d hours, %d minute%s %s' % (hours, minutes,
                                         plural_minutes, direction)
|
1
by mbp at sourcefrog
import from baz patch-364 |
855 |
|
856 |
def filesize(f):
    """Return size of given open file.

    :param f: Object with a fileno() method; the size is taken from
        os.fstat on that descriptor.
    """
    descriptor = f.fileno()
    return os.fstat(descriptor)[ST_SIZE]
|
859 |
||
1553.5.5
by Martin Pool
New utility routine rand_chars |
860 |
|
1185.1.7
by Robert Collins
Nathaniel McCallums patch for urandom friendliness on aix. |
861 |
# Define rand_bytes based on platform.
|
862 |
# rand_bytes(n) returns a string of n random bytes.  The source is chosen
# once, at import time, from best to worst.
try:
    # Python 2.4 and later have os.urandom,
    # but it doesn't work on some arches
    os.urandom(1)
    rand_bytes = os.urandom
except (NotImplementedError, AttributeError):
    # If python doesn't have os.urandom, or it doesn't work,
    # then try to first pull random data from /dev/urandom
    try:
        # The file is deliberately left open: its bound read method *is*
        # rand_bytes.
        rand_bytes = file('/dev/urandom', 'rb').read
    # Otherwise, use this hack as a last resort
    except (IOError, OSError):
        # not well seeded, but better than nothing
        def rand_bytes(n):
            """Return n pseudo-random bytes from the random module."""
            import random
            # Build the result in one join instead of repeated '+=', and
            # iterate over range(n) so that a negative n yields an empty
            # string instead of looping forever.
            return ''.join([chr(random.randint(0, 255))
                            for _ in range(n)])
|
1
by mbp at sourcefrog
import from baz patch-364 |
882 |
|
1553.5.5
by Martin Pool
New utility routine rand_chars |
883 |
|
884 |
ALNUM = '0123456789abcdefghijklmnopqrstuvwxyz'
def rand_chars(num):
    """Return a random string of num alphanumeric characters

    The result only contains lowercase chars because it may be used on
    case-insensitive filesystems.

    Each byte from rand_bytes(num) selects one ALNUM character by its
    ordinal modulo 36.
    """
    picks = [ALNUM[ord(raw_byte) % 36] for raw_byte in rand_bytes(num)]
    return ''.join(picks)
|
895 |
||
896 |
||
1
by mbp at sourcefrog
import from baz patch-364 |
897 |
## TODO: We could later have path objects that remember their list
|
1759.2.2
by Jelmer Vernooij
Revert some of my spelling fixes and fix some typos after review by Aaron. |
898 |
## decomposition (might be too tricksy though.)
|
1
by mbp at sourcefrog
import from baz patch-364 |
899 |
|
900 |
def splitpath(p):
    """Turn string into list of parts.

    Empty and '.' components are dropped.

    :raises errors.BzrError: if any component is '..'.
    """
    # split on either delimiter because people might use either on
    # Windows
    kept = []
    for piece in re.split(r'[\\/]', p):
        if piece == '..':
            raise errors.BzrError("sorry, %r not allowed in path" % piece)
        if piece in ('.', ''):
            continue
        kept.append(piece)
    return kept
|
1
by mbp at sourcefrog
import from baz patch-364 |
915 |
|
3890.2.4
by John Arbash Meinel
Add a new function that can convert 'chunks' format to a 'lines' format. |
916 |
|
1
by mbp at sourcefrog
import from baz patch-364 |
917 |
def joinpath(p):
    """Join the components in p with pathjoin after validating them.

    :param p: Sequence of path components.
    :raises errors.BzrError: if any component is '..', None or ''.
    """
    for part in p:
        if part is None or part in ('..', ''):
            raise errors.BzrError("sorry, %r not allowed in path" % part)
    return pathjoin(*p)
1
by mbp at sourcefrog
import from baz patch-364 |
922 |
|
923 |
||
4370.1.1
by Ian Clatworthy
add osutils.parent_directories() API |
924 |
def parent_directories(filename):
    """Return the list of parent directories, deepest first.

    For example, parent_directories("a/b/c") -> ["a/b", "a"].
    """
    parts = splitpath(dirname(filename))
    # Join ever shorter prefixes of the directory's components.
    return [joinpath(parts[:depth]) for depth in range(len(parts), 0, -1)]
|
935 |
||
936 |
||
4574.3.8
by Martin Pool
Only mutter extension load errors when they occur, and record for later |
937 |
# str() of every distinct extension import failure seen so far.
_extension_load_failures = []


def failed_to_load_extension(exception):
    """Handle failing to load a binary extension.

    This should be called from the ImportError block guarding the attempt to
    import the native extension.  If this function returns, the pure-Python
    implementation should be loaded instead::

    >>> try:
    >>>     import bzrlib._fictional_extension_pyx
    >>> except ImportError, e:
    >>>     bzrlib.osutils.failed_to_load_extension(e)
    >>>     import bzrlib._fictional_extension_py

    :param exception: The exception that was caught; only its str() is
        used.
    """
    # NB: This docstring is just an example, not a doctest, because doctest
    # currently can't cope with the use of lazy imports in this namespace --
    # mbp 20090729

    # This currently doesn't report the failure at the time it occurs, because
    # they tend to happen very early in startup when we can't check config
    # files etc, and also we want to report all failures but not spam the user
    # with 10 warnings.
    from bzrlib import trace
    exception_str = str(exception)
    if exception_str in _extension_load_failures:
        # Already recorded; mutter each distinct failure only once.
        return
    trace.mutter("failed to load compiled extension: %s" % exception_str)
    _extension_load_failures.append(exception_str)
|
966 |
||
967 |
||
968 |
def report_extension_load_failures():
    """Warn the user if any compiled extension failed to load.

    Does nothing when no failure has been recorded, or when the
    'ignore_missing_extensions' option is true in the global configuration.
    """
    if not _extension_load_failures:
        return
    # Only consult the configuration once we know there is something to say.
    from bzrlib.config import GlobalConfig
    ignore_missing = GlobalConfig().get_user_option_as_bool(
        'ignore_missing_extensions')
    if ignore_missing:
        return
    # the warnings framework should by default show this only once
    from bzrlib.trace import warning
    # The individual missing extensions are intentionally not listed: that
    # made the message too long and scary, see
    # https://bugs.launchpad.net/bzr/+bug/430529
    warning(
        "bzr: warning: some compiled extensions could not be loaded; "
        "see <https://answers.launchpad.net/bzr/+faq/703>")
|
|
4574.3.1
by Martin Pool
Give a warning when failing to load _chunks_to_lines_pyx |
982 |
|
983 |
||
3890.2.7
by John Arbash Meinel
A Pyrex extension is about 5x faster than the fastest python code I could write. |
984 |
# Prefer the compiled (Pyrex) chunks_to_lines.  If it cannot be imported,
# record the failure via failed_to_load_extension() and fall back to the
# pure-Python implementation, which is bound to the same name.
try:
    from bzrlib._chunks_to_lines_pyx import chunks_to_lines
except ImportError, e:
    failed_to_load_extension(e)
    from bzrlib._chunks_to_lines_py import chunks_to_lines
3890.2.7
by John Arbash Meinel
A Pyrex extension is about 5x faster than the fastest python code I could write. |
989 |
|
990 |
||
1231
by Martin Pool
- more progress on fetch on top of weaves |
991 |
def split_lines(s):
    """Split s into lines, keeping the newline characters.

    :param s: The text to split, either a plain (8-bit) str or another
        string type such as unicode.
    :return: The lines of s, each still carrying its trailing newline.
    """
    if not isinstance(s, str):
        # chunks_to_lines only supports 8-bit strings, so anything else goes
        # through the generic implementation.
        return _split_lines(s)
    # Trivially turn the fulltext into a one-element 'chunked' representation
    # and let chunks_to_lines do the heavy lifting.
    return chunks_to_lines([s])
|
1000 |
||
1001 |
||
1002 |
def _split_lines(s):
    """Split s into lines, keeping the newline characters.

    Works on both Unicode and plain string objects.

    :return: A list of lines.  Every line except possibly the last ends with
        a newline character; no empty trailing element is produced.
    """
    pieces = s.split('\n')
    # split() always yields at least one element; the last one is whatever
    # follows the final newline (possibly the empty string).
    remainder = pieces.pop()
    result = [piece + '\n' for piece in pieces]
    if remainder:
        result.append(remainder)
    return result
|
1391
by Robert Collins
merge from integration |
1012 |
|
1013 |
||
1185.10.4
by Aaron Bentley
Disabled hardlinks on cygwin, mac OS |
1014 |
def hardlinks_good():
    """Return False on win32, cygwin and darwin, True on any other platform.

    link_or_copy() uses this to decide whether to attempt a hardlink at all.
    """
    excluded_platforms = ('win32', 'cygwin', 'darwin')
    return sys.platform not in excluded_platforms
1185.10.4
by Aaron Bentley
Disabled hardlinks on cygwin, mac OS |
1016 |
|
1185.1.46
by Robert Collins
Aarons branch --basis patch |
1017 |
|
1185.10.3
by Aaron Bentley
Made copy_multi_immutable create hardlinks opportunistically |
1018 |
def link_or_copy(src, dest): |
1019 |
"""Hardlink a file, or copy it if it can't be hardlinked."""
|
|
1185.10.4
by Aaron Bentley
Disabled hardlinks on cygwin, mac OS |
1020 |
if not hardlinks_good(): |
1996.3.14
by John Arbash Meinel
lazy_import osutils and sign_my_commits |
1021 |
shutil.copyfile(src, dest) |
1185.10.3
by Aaron Bentley
Made copy_multi_immutable create hardlinks opportunistically |
1022 |
return
|
1023 |
try: |
|
1024 |
os.link(src, dest) |
|
1025 |
except (OSError, IOError), e: |
|
1026 |
if e.errno != errno.EXDEV: |
|
1027 |
raise
|
|
1996.3.14
by John Arbash Meinel
lazy_import osutils and sign_my_commits |
1028 |
shutil.copyfile(src, dest) |
1399.1.4
by Robert Collins
move diff and symlink conditionals into inventory.py from diff.py |
1029 |
|
2831.5.2
by Vincent Ladeuil
Review feedback. |
1030 |
|
1031 |
def delete_any(path): |
|
4490.1.1
by Martin Pool
merge fix for forcing readonly deletion, and tweak |
1032 |
"""Delete a file, symlink or directory.
|
1033 |
|
|
1034 |
Will delete even if readonly.
|
|
1035 |
"""
|
|
4440.1.2
by Craig Hewetson
Fixes made after first code review. |
1036 |
try: |
4490.1.1
by Martin Pool
merge fix for forcing readonly deletion, and tweak |
1037 |
_delete_file_or_dir(path) |
4440.1.2
by Craig Hewetson
Fixes made after first code review. |
1038 |
except (OSError, IOError), e: |
1039 |
if e.errno in (errno.EPERM, errno.EACCES): |
|
4490.1.1
by Martin Pool
merge fix for forcing readonly deletion, and tweak |
1040 |
# make writable and try again
|
1041 |
try: |
|
4440.1.2
by Craig Hewetson
Fixes made after first code review. |
1042 |
make_writable(path) |
4490.1.1
by Martin Pool
merge fix for forcing readonly deletion, and tweak |
1043 |
except (OSError, IOError): |
4440.1.2
by Craig Hewetson
Fixes made after first code review. |
1044 |
pass
|
4490.1.1
by Martin Pool
merge fix for forcing readonly deletion, and tweak |
1045 |
_delete_file_or_dir(path) |
1046 |
else: |
|
1047 |
raise
|
|
1048 |
||
1049 |
||
1050 |
def _delete_file_or_dir(path):
    """Remove path with os.rmdir() if it is a directory, else os.unlink()."""
    # Checking the kind first (Look Before You Leap) is preferred here over
    # just calling unlink and handling the failure, because:
    # - root can damage a solaris file system by using unlink,
    # - unlink raises different exceptions on different OSes (linux: EISDIR,
    #   win32: EACCES, OSX: EPERM) when invoked on a directory.
    if not isdir(path): # Takes care of symlinks
        os.unlink(path)
    else:
        os.rmdir(path)
|
1558.12.9
by Aaron Bentley
Handle resolving conflicts with directories properly |
1060 |
|
1399.1.4
by Robert Collins
move diff and symlink conditionals into inventory.py from diff.py |
1061 |
|
1062 |
def has_symlinks():
    """Return True if the os module provides a (non-None) symlink function."""
    return getattr(os, 'symlink', None) is not None
|
2831.5.2
by Vincent Ladeuil
Review feedback. |
1067 |
|
1185.16.38
by Martin Pool
- move contains_whitespace and contains_linebreaks to osutils |
1068 |
|
3136.1.1
by Aaron Bentley
Add support for hardlinks to TreeTransform |
1069 |
def has_hardlinks():
    """Return True if the os module provides a (non-None) link function."""
    return getattr(os, 'link', None) is not None
|
1074 |
||
1075 |
||
3287.18.14
by Matt McClure
Extracted a host_os_dereferences_symlinks method. |
1076 |
def host_os_dereferences_symlinks():
    """Return True if symlinks are available and we are not on cygwin/win32."""
    if not has_symlinks():
        return False
    return sys.platform not in ('cygwin', 'win32')
3287.18.14
by Matt McClure
Extracted a host_os_dereferences_symlinks method. |
1079 |
|
1080 |
||
4241.14.14
by Vincent Ladeuil
Test and implements osutils.readlink(). |
1081 |
def readlink(abspath):
    """Return a string representing the path to which the symbolic link points.

    :param abspath: The link absolute unicode path.

    This is guaranteed to return the symbolic link in unicode in all python
    versions.
    """
    # Encode with the filesystem encoding for the OS call, then decode the
    # answer with the same encoding.
    encoded_target = os.readlink(abspath.encode(_fs_enc))
    return encoded_target.decode(_fs_enc)
|
1093 |
||
1094 |
||
1185.16.38
by Martin Pool
- move contains_whitespace and contains_linebreaks to osutils |
1095 |
def contains_whitespace(s):
    """True if there are any whitespace characters in s."""
    # The set of characters is hard-coded rather than taken from
    # string.whitespace, which can include '\xa0' in certain locales because
    # it is the ISO-8859-1 "non-breaking-space".  That character
    # 1) isn't a breaking whitespace,
    # 2) isn't one of ' \t\r\n', which we sometimes use as separators, and
    # 3) isn't unicode safe since it is >128.
    #
    # The literal below must *not* be a unicode string: its ascii characters
    # can be up-cast automatically when s is Unicode, but we don't want s
    # itself to be up-cast in case it is utf-8.
    for candidate in ' \t\n\r\v\f':
        if candidate in s:
            return True
    return False
|
1113 |
||
1114 |
||
1115 |
def contains_linebreaks(s):
    """True if there is any vertical whitespace in s.

    The characters tested for are form feed, newline and carriage return.
    """
    for candidate in '\f\n\r':
        if candidate in s:
            return True
    return False
|
1457.1.2
by Robert Collins
move branch._relpath into osutils as relpath |
1122 |
|
1123 |
||
1124 |
def relpath(base, path):
    """Return path relative to base, or raise exception.

    The path may be either an absolute path or a path relative to the
    current working directory.

    This walks up from the absolute path one component at a time rather than
    using os.path.commonprefix, which (python2.4) has a bad bug: it works
    just on string prefixes, assuming that '/u' is a prefix of '/u2'.

    :param base: The directory the result is relative to.
    :param path: The path to convert.
    :return: The relative path, or '' when path is base itself.
    :raises ValueError: if base is shorter than MIN_ABS_PATHLENGTH.
    :raises errors.PathNotChild: if path is not located under base.
    """
    if len(base) < MIN_ABS_PATHLENGTH:
        # must have space for e.g. a drive letter
        raise ValueError('%r is too short to calculate a relative path'
            % (base,))

    rp = abspath(path)

    # Strip trailing components off the absolute path until what is left is
    # exactly base, collecting the stripped components deepest first.
    components = []
    head = rp
    while head != base:
        if len(head) <= len(base):
            # Not longer than base and still different from it: stripping
            # further can never produce base.
            raise errors.PathNotChild(rp, base)
        head, tail = split(head)
        if tail:
            components.append(tail)

    if not components:
        return ''
    return pathjoin(*reversed(components))
|
1185.33.60
by Martin Pool
Use full terminal width for verbose test output. |
1157 |
|
1158 |
||
3794.5.29
by Mark Hammond
cicp_canonical_relpath -> _cicp_canonical_relpath |
1159 |
def _cicp_canonical_relpath(base, path):
    """Return the canonical path relative to base.

    Like relpath, but on case-insensitive-case-preserving file-systems, this
    will return the relpath as stored on the file-system rather than in the
    case specified in the input string, for all existing portions of the path.

    This will cause O(N) behaviour if called for every path in a tree; if you
    have a number of paths to convert, you should use canonical_relpaths().

    :param base: The directory the result is relative to.
    :param path: The path to convert; it is first passed through relpath().
    :return: The relative path, with each component that matches a directory
        entry case-insensitively replaced by that entry's name.  Components
        from the first unmatched (or unlistable) one onwards are returned as
        given.
    """
    # TODO: it should be possible to optimize this for Windows by using the
    # win32 API FindFiles function to look for the specified name - but using
    # os.listdir() still gives us the correct, platform agnostic semantics in
    # the short term.

    rel = relpath(base, path)
    # '.' will have been turned into ''
    if not rel:
        return rel

    abs_base = abspath(base)
    current = abs_base
    _listdir = os.listdir

    # use an explicit iterator so we can easily consume the rest on early exit.
    bit_iter = iter(rel.split('/'))
    for bit in bit_iter:
        lbit = bit.lower()
        try:
            next_entries = _listdir(current)
        except OSError: # enoent, eperm, etc
            # We can't find this in the filesystem, so just append the
            # remaining bits.
            current = pathjoin(current, bit, *list(bit_iter))
            break
        # Take the first directory entry whose lower-cased name equals the
        # lower-cased component.
        for look in next_entries:
            if lbit == look.lower():
                current = pathjoin(current, look)
                break
        else:
            # got to the end, nothing matched, so we just return the
            # non-existing bits as they were specified (the filename may be
            # the target of a move, for example).
            current = pathjoin(current, bit, *list(bit_iter))
            break
    # Drop the absolute base prefix (and the separator after it) again.
    return current[len(abs_base):].lstrip('/')
3794.5.1
by Mark Hammond
Add canonical_relpath api function |
1205 |
|
3794.5.13
by Mark Hammond
Tweaks suggested by Martin |
1206 |
# XXX - TODO - we need better detection/integration of case-insensitive
# file-systems; Linux often sees FAT32 devices (or NFS-mounted OSX
# filesystems), for example, so could probably benefit from the same basic
# support there.  For now though, only Windows and OSX get that support, and
# they get it for *all* file-systems!
#
# canonical_relpath(base, path) is bound once, at import time, to the
# case-correcting implementation on win32/darwin and to plain relpath()
# on every other platform.
if sys.platform in ('win32', 'darwin'):
    canonical_relpath = _cicp_canonical_relpath
else:
    canonical_relpath = relpath
|
1215 |
||
3794.5.15
by Mark Hammond
Add canonical_relpaths() as a placeholder for a future caching implementation. |
1216 |
def canonical_relpaths(base, paths):
    """Canonicalize a sequence of paths relative to base.

    The intent is for this implementation to eventually use a cache, vastly
    speeding up multiple transformations in the same directory; for now each
    path is simply converted on its own with canonical_relpath().

    :param base: The directory the results are relative to.
    :param paths: An iterable of paths to convert.
    :return: A list with one canonical relative path per input path, in the
        same order.
    """
    canonical = []
    for p in paths:
        canonical.append(canonical_relpath(base, p))
    return canonical
|
3794.5.1
by Mark Hammond
Add canonical_relpath api function |
1224 |
|
1534.3.1
by Robert Collins
* bzrlib.osutils.safe_unicode now exists to provide parameter coercion |
1225 |
def safe_unicode(unicode_or_utf8_string):
    """Coerce unicode_or_utf8_string into unicode.

    :param unicode_or_utf8_string: A unicode object, or a string holding
        utf-8 encoded text.
    :return: The argument itself if it is already unicode, otherwise the
        result of decoding it from utf-8.
    :raises errors.BzrBadParameterNotUnicode: if the utf-8 decoding fails.
    """
    if not isinstance(unicode_or_utf8_string, unicode):
        try:
            return unicode_or_utf8_string.decode('utf8')
        except UnicodeDecodeError:
            raise errors.BzrBadParameterNotUnicode(unicode_or_utf8_string)
    return unicode_or_utf8_string
1534.3.1
by Robert Collins
* bzrlib.osutils.safe_unicode now exists to provide parameter coercion |
1238 |
|
1239 |
||
2249.5.8
by John Arbash Meinel
Add osutils.safe_utf8 and safe_revision_id for the new revision_id work. |
1240 |
def safe_utf8(unicode_or_utf8_string):
    """Coerce unicode_or_utf8_string to a utf8 string.

    :param unicode_or_utf8_string: A str or a Unicode object.
    :return: The argument itself if it is a str holding valid utf-8,
        otherwise the argument encoded into a utf-8 string.
    :raises errors.BzrBadParameterNotUnicode: if a str argument is not valid
        utf-8.
    """
    if not isinstance(unicode_or_utf8_string, str):
        return unicode_or_utf8_string.encode('utf-8')
    # TODO: jam 20070209 This is overkill, and probably has an impact on
    #       performance if we are dealing with lots of apis that want a
    #       utf-8 revision id
    try:
        # Decoding is done purely as validation; the result is discarded.
        unicode_or_utf8_string.decode('utf-8')
    except UnicodeDecodeError:
        raise errors.BzrBadParameterNotUnicode(unicode_or_utf8_string)
    return unicode_or_utf8_string
|
1257 |
||
1258 |
||
2309.4.4
by John Arbash Meinel
Change what warnings are raised, and add tests that they are used. |
1259 |
# Deprecation message that safe_revision_id() passes to
# symbol_versioning.warn() when it has to encode a revision id.
_revision_id_warning = ('Unicode revision ids were deprecated in bzr 0.15.'
                        ' Revision id generators should be creating utf8'
                        ' revision ids.')
|
1262 |
||
1263 |
||
1264 |
def safe_revision_id(unicode_or_utf8_string, warn=True):
    """Revision ids should now be utf8, but at one point they were unicode.

    :param unicode_or_utf8_string: A possibly Unicode revision_id. (can also be
        utf8 or None).
    :param warn: Functions that are sanitizing user data can set warn=False
        to suppress the DeprecationWarning issued when encoding is needed.
    :return: None or a utf8 revision id.
    """
    if unicode_or_utf8_string is None:
        return None
    # An exact class comparison (not isinstance) decides whether the value
    # can be returned untouched.
    if unicode_or_utf8_string.__class__ == str:
        return unicode_or_utf8_string
    if warn:
        symbol_versioning.warn(_revision_id_warning, DeprecationWarning,
                               stacklevel=2)
    return cache_utf8.encode(unicode_or_utf8_string)
1279 |
||
1280 |
||
2309.4.4
by John Arbash Meinel
Change what warnings are raised, and add tests that they are used. |
1281 |
# Deprecation message that safe_file_id() passes to symbol_versioning.warn()
# when it has to encode a file id.
_file_id_warning = ('Unicode file ids were deprecated in bzr 0.15. File id'
                    ' generators should be creating utf8 file ids.')
|
1283 |
||
1284 |
||
1285 |
def safe_file_id(unicode_or_utf8_string, warn=True):
    """File ids should now be utf8, but at one point they were unicode.

    This is the same as safe_utf8, except it uses the cached encode functions
    to save a little bit of performance.

    :param unicode_or_utf8_string: A possibly Unicode file_id. (can also be
        utf8 or None).
    :param warn: Functions that are sanitizing user data can set warn=False
        to suppress the DeprecationWarning issued when encoding is needed.
    :return: None or a utf8 file id.
    """
    if unicode_or_utf8_string is None:
        return None
    # An exact class comparison (not isinstance) decides whether the value
    # can be returned untouched.
    if unicode_or_utf8_string.__class__ == str:
        return unicode_or_utf8_string
    if warn:
        symbol_versioning.warn(_file_id_warning, DeprecationWarning,
                               stacklevel=2)
    return cache_utf8.encode(unicode_or_utf8_string)
2294.1.4
by John Arbash Meinel
Add safe_file_id as a helper in osutils. |
1303 |
|
1304 |
||
1185.85.75
by John Arbash Meinel
Adding bzrlib.osutils.unicode_filename to handle unicode normalization for file paths. |
1305 |
# True only on darwin; read by normalizes_filenames() and used to pick the
# implementation of normalized_filename.
_platform_normalizes_filenames = (sys.platform == 'darwin')
|
1308 |
||
1309 |
||
1310 |
def normalizes_filenames():
    """Return True if this platform normalizes unicode filenames.

    Mac OSX does, Windows/Linux do not.

    The answer is the module-level _platform_normalizes_filenames flag.
    """
    return _platform_normalizes_filenames
|
1316 |
||
1317 |
||
1830.3.2
by John Arbash Meinel
normalized_filename is a much better name |
1318 |
def _accessible_normalized_filename(path):
    """Get the unicode normalized path, and if you can access the file.

    On platforms where the system normalizes filenames (Mac OSX),
    you can access a file by any path which will normalize correctly.
    On platforms where the system does not normalize filenames
    (Windows, Linux), you have to access a file by its exact path.

    Internally, bzr only supports NFC normalization, since that is
    the standard for XML documents.

    :param path: The path to normalize.
    :return: A (normalized_path, accessible) tuple.  This variant always
        reports the path as accessible.
    """
    nfc_path = unicodedata.normalize('NFC', unicode(path))
    return nfc_path, True
1830.3.1
by John Arbash Meinel
Change the return value of unicode_filename, and make it testable on all platforms |
1334 |
|
1335 |
||
1830.3.2
by John Arbash Meinel
normalized_filename is a much better name |
1336 |
def _inaccessible_normalized_filename(path):
    """Get the unicode normalized path, and if you can access the file.

    On platforms where the system normalizes filenames (Mac OSX),
    you can access a file by any path which will normalize correctly.
    On platforms where the system does not normalize filenames
    (Windows, Linux), you have to access a file by its exact path.

    Internally, bzr only supports NFC normalization, since that is
    the standard for XML documents.

    :param path: The path to normalize.
    :return: A (normalized_path, accessible) tuple.  In this variant the
        flag is True only when the NFC-normalized path equals the given
        path.
    """
    # A real docstring is used here: assigning to ``__doc__`` inside the
    # function body only binds a local variable and documents nothing.
    normalized = unicodedata.normalize('NFC', unicode(path))
    return normalized, normalized == path
1341 |
||
1342 |
||
1185.85.75
by John Arbash Meinel
Adding bzrlib.osutils.unicode_filename to handle unicode normalization for file paths. |
1343 |
# normalized_filename(path) -> (NFC-normalized path, accessible flag).
# Bound once at import time: platforms that normalize filenames get the
# variant that always reports the path as accessible, all others the
# variant that compares the normalized path with the original.
if _platform_normalizes_filenames:
    normalized_filename = _accessible_normalized_filename
else:
    normalized_filename = _inaccessible_normalized_filename
1185.85.75
by John Arbash Meinel
Adding bzrlib.osutils.unicode_filename to handle unicode normalization for file paths. |
1347 |
|
1348 |
||
4747.3.6
by Vincent Ladeuil
terminal_width can now returns None. |
1349 |
# Fallback width, in columns, for callers to use when terminal_width()
# returns None.
default_terminal_width = 80
"""The default terminal width for ttys.

This is defined so that higher levels can share a common fallback value when
terminal_width() returns None.
"""
|
|
1355 |
||
1356 |
||
1185.33.60
by Martin Pool
Use full terminal width for verbose test output. |
1357 |
def terminal_width():
    """Return terminal width.

    None is returned if the width can't be established precisely.

    The rules are:
    - if BZR_COLUMNS is set to an integer, returns its value
    - if sys.stdout is not a tty, returns None
    - if COLUMNS is set to an integer, returns its value,

    From there, we need to query the OS to get the size of the controlling
    terminal.

    Unices:
    - get termios.TIOCGWINSZ
    - if an error occurs or a non-positive value is obtained, returns None

    Windows:
    - win32utils.get_console_size() decides,
    - returns None on error (provided default value)

    :return: The width in columns as an int, or None.
    """
    # If BZR_COLUMNS is set, take it, user is always right
    try:
        return int(os.environ['BZR_COLUMNS'])
    except (KeyError, ValueError):
        pass

    isatty = getattr(sys.stdout, 'isatty', None)
    if isatty is None or not isatty():
        # Don't guess, setting BZR_COLUMNS is the recommended way to override.
        return None

    # If COLUMNS is set, take it, the terminal knows better (even inside a
    # given terminal, the application can decide to set COLUMNS to a lower
    # value (splitted screen) or a bigger value (scroll bars))
    try:
        return int(os.environ['COLUMNS'])
    except (KeyError, ValueError):
        pass

    width, height = _terminal_size(None, None)
    # None is the default handed to _terminal_size and comes back when the
    # query fails.  Test for it explicitly instead of relying on how None
    # happens to order against integers.
    if width is None or width <= 0:
        # Consider invalid values as meaning no width
        return None

    return width
|
1405 |
||
1406 |
||
1407 |
def _win32_terminal_size(width, height):
    """Return the console size as (width, height) on win32.

    :param width: Passed to win32utils.get_console_size() as ``defaultx``.
    :param height: Passed to win32utils.get_console_size() as ``defaulty``.
    """
    # NOTE(review): the defaults are presumably what get_console_size()
    # hands back when the console cannot be queried -- confirm in win32utils.
    columns, rows = win32utils.get_console_size(defaultx=width,
                                                defaulty=height)
    return columns, rows
|
1410 |
||
1411 |
||
1412 |
def _ioctl_terminal_size(width, height):
    """Return the terminal size as (width, height) using TIOCGWINSZ.

    The ioctl is issued on file descriptor 1.

    :param width: Value returned as the width if the query fails.
    :param height: Value returned as the height if the query fails.
    """
    try:
        import struct
        import fcntl
        import termios
        winsize_format = 'HHHH'
        request = struct.pack(winsize_format, 0, 0, 0, 0)
        reply = fcntl.ioctl(1, termios.TIOCGWINSZ, request)
        # The first two fields of the reply are the height, then the width.
        rows, columns = struct.unpack(winsize_format, reply)[0:2]
    except (IOError, AttributeError):
        # Query failed or not supported: hand back the caller's defaults.
        return width, height
    return columns, rows
|
1421 |
||
1422 |
# Platform-specific terminal size query, called as
# _terminal_size(default_width, default_height).  It is rebound below to
# _win32_terminal_size on win32 and to _ioctl_terminal_size elsewhere.
_terminal_size = None
"""Returns the terminal size as (width, height).

:param width: Default value for width.
:param height: Default value for height.

This is defined specifically for each OS and query the size of the controlling
terminal. If any error occurs, the provided default values should be returned.
"""
if sys.platform == 'win32':
    _terminal_size = _win32_terminal_size
else:
    _terminal_size = _ioctl_terminal_size
|
1534.7.25
by Aaron Bentley
Added set_executability |
1435 |
|
1963.1.5
by John Arbash Meinel
Create an osutils helper function for modifying the environment |
1436 |
|
4747.5.1
by Vincent Ladeuil
catch SIGWINCH, but that means soem IO can be interrupted and the code |
1437 |
def _terminal_size_changed(signum, frame):
    """Set COLUMNS upon receiving a SIGnal for WINdow size CHange.

    :param signum: Signal number (unused).
    :param frame: Interrupted stack frame (unused).
    """
    columns, _rows = _terminal_size(None, None)
    if columns is None:
        # Size could not be determined; leave COLUMNS alone.
        return
    os.environ['COLUMNS'] = str(columns)
|
4747.5.3
by Vincent Ladeuil
Review feedback: import signal lazily and don't install SIGWINCH on windows. |
1442 |
|
4797.20.2
by
Register SIGWINCH only when creating a TextUIFactory |
1443 |
|
1444 |
# Set to True by watch_sigwinch() after its first call.
_registered_sigwinch = False


def watch_sigwinch():
    """Register for SIGWINCH, once and only once.

    On win32 no handler is installed, but the call is still remembered so
    later calls return immediately.
    """
    global _registered_sigwinch
    if _registered_sigwinch:
        return
    if sys.platform != 'win32':
        signal.signal(signal.SIGWINCH, _terminal_size_changed)
    # On win32 nothing is registered: Martin (gz) mentioned
    # WINDOW_BUFFER_SIZE_RECORD from ReadConsoleInput, but it is unclear how
    # to plug that into the current design -- vila 20091216
    _registered_sigwinch = True
|
4747.5.1
by Vincent Ladeuil
catch SIGWINCH, but that means soem IO can be interrupted and the code |
1458 |
|
1459 |
||
1534.7.25
by Aaron Bentley
Added set_executability |
1460 |
def supports_executable():
    """Return True on every platform except win32."""
    if sys.platform == "win32":
        return False
    return True
1551.2.53
by abentley
Strip trailing slashes in a platform-sensible way |
1462 |
|
1463 |
||
1551.10.4
by Aaron Bentley
Update to skip on win32 |
1464 |
def supports_posix_readonly():
    """Tell whether the 'readonly' flag follows POSIX rules on this platform.

    The two models differ noticeably:

    * POSIX: creating, deleting and renaming entries is governed by the
      permissions of the containing directory, so a readonly file can still
      be deleted, while nothing can be added to, removed from or renamed
      inside a readonly directory.
    * win32: a readonly file cannot be deleted, and a readonly directory
      cannot itself be deleted although its contents can still be changed.

    :return: False on win32, True otherwise.
    """
    on_windows = (sys.platform == "win32")
    return not on_windows
|
1475 |
||
1476 |
||
1963.1.5
by John Arbash Meinel
Create an osutils helper function for modifying the environment |
1477 |
def set_or_unset_env(env_variable, value):
    """Set an environment variable, or remove it when value is None.

    :param env_variable: Name of the environment variable to change.
    :param value: New value for the variable.  A unicode value is encoded
        with the user encoding before being stored.  None removes the
        variable (removing an unset variable is not an error).
    :return: The value the variable had before the call, or None if it was
        not set.
    """
    previous = os.environ.get(env_variable)
    if value is not None:
        if isinstance(value, unicode):
            # os.environ holds byte strings; encode as the user would see it.
            value = value.encode(get_user_encoding())
        os.environ[env_variable] = value
        return previous
    if previous is not None:
        del os.environ[env_variable]
    return previous
|
1494 |
||
1495 |
||
1551.2.56
by Aaron Bentley
Better illegal pathname check for Windows |
1496 |
# A legal win32 path: an optional drive prefix ("C:/" or "C:\") followed by
# any run of characters that excludes : < > * " ? \ and |
_validWin32PathRE = re.compile(r'^([A-Za-z]:[/\\])?[^:<>*"?\|]*$')


def check_legal_path(path):
    """Raise if path is not a legal path on the current platform.

    Only win32 paths are checked; on every other platform this returns
    immediately without looking at the path.

    :param path: The path to check.
    :raises errors.IllegalPath: on win32, when path does not match
        _validWin32PathRE.
    """
    if sys.platform == "win32" and _validWin32PathRE.match(path) is None:
        raise errors.IllegalPath(path)
1753.1.1
by Robert Collins
(rbc, jam, mbp)Add bzrlib.osutils.walkdirs, an optimised walk-and-stat routine. |
1508 |
|
1509 |
||
3596.2.2
by John Arbash Meinel
Factor out the common exception handling looking for ENOTDIR and use it |
1510 |
_WIN32_ERROR_DIRECTORY = 267 # Similar to errno.ENOTDIR |
1511 |
||
1512 |
def _is_error_enotdir(e): |
|
1513 |
"""Check if this exception represents ENOTDIR.
|
|
1514 |
||
1515 |
Unfortunately, python is very inconsistent about the exception
|
|
1516 |
here. The cases are:
|
|
1517 |
1) Linux, Mac OSX all versions seem to set errno == ENOTDIR
|
|
1518 |
2) Windows, Python2.4, uses errno == ERROR_DIRECTORY (267)
|
|
1519 |
which is the windows error code.
|
|
1520 |
3) Windows, Python2.5 uses errno == EINVAL and
|
|
1521 |
winerror == ERROR_DIRECTORY
|
|
1522 |
||
1523 |
:param e: An Exception object (expected to be OSError with an errno
|
|
1524 |
attribute, but we should be able to cope with anything)
|
|
1525 |
:return: True if this represents an ENOTDIR error. False otherwise.
|
|
1526 |
"""
|
|
1527 |
en = getattr(e, 'errno', None) |
|
1528 |
if (en == errno.ENOTDIR |
|
1529 |
or (sys.platform == 'win32' |
|
1530 |
and (en == _WIN32_ERROR_DIRECTORY |
|
1531 |
or (en == errno.EINVAL |
|
1532 |
and getattr(e, 'winerror', None) == _WIN32_ERROR_DIRECTORY) |
|
1533 |
))):
|
|
1534 |
return True |
|
1535 |
return False |
|
1536 |
||
1537 |
||
1757.2.8
by Robert Collins
Teach walkdirs to walk a subdir of a tree. |
1538 |
def walkdirs(top, prefix=""): |
1753.1.1
by Robert Collins
(rbc, jam, mbp)Add bzrlib.osutils.walkdirs, an optimised walk-and-stat routine. |
1539 |
"""Yield data about all the directories in a tree.
|
3943.8.1
by Marius Kruger
remove all trailing whitespace from bzr source |
1540 |
|
1753.1.1
by Robert Collins
(rbc, jam, mbp)Add bzrlib.osutils.walkdirs, an optimised walk-and-stat routine. |
1541 |
This yields all the data about the contents of a directory at a time.
|
1542 |
After each directory has been yielded, if the caller has mutated the list
|
|
1543 |
to exclude some directories, they are then not descended into.
|
|
3943.8.1
by Marius Kruger
remove all trailing whitespace from bzr source |
1544 |
|
1753.1.1
by Robert Collins
(rbc, jam, mbp)Add bzrlib.osutils.walkdirs, an optimised walk-and-stat routine. |
1545 |
The data yielded is of the form:
|
1897.1.2
by Robert Collins
cleanup osutils.walkdirs changes after review. |
1546 |
((directory-relpath, directory-path-from-top),
|
2694.4.1
by Alexander Belchenko
trivial fix for docstring of osutils.walkdirs() |
1547 |
[(relpath, basename, kind, lstat, path-from-top), ...]),
|
1897.1.2
by Robert Collins
cleanup osutils.walkdirs changes after review. |
1548 |
- directory-relpath is the relative path of the directory being returned
|
1549 |
with respect to top. prefix is prepended to this.
|
|
3943.8.1
by Marius Kruger
remove all trailing whitespace from bzr source |
1550 |
- directory-path-from-root is the path including top for this directory.
|
1897.1.2
by Robert Collins
cleanup osutils.walkdirs changes after review. |
1551 |
It is suitable for use with os functions.
|
1897.1.1
by Robert Collins
Add some useful summary data to osutils.walkdirs output. |
1552 |
- relpath is the relative path within the subtree being walked.
|
1553 |
- basename is the basename of the path
|
|
1897.1.2
by Robert Collins
cleanup osutils.walkdirs changes after review. |
1554 |
- kind is the kind of the file now. If unknown then the file is not
|
1897.1.1
by Robert Collins
Add some useful summary data to osutils.walkdirs output. |
1555 |
present within the tree - but it may be recorded as versioned. See
|
1556 |
versioned_kind.
|
|
1557 |
- lstat is the stat data *if* the file was statted.
|
|
3943.8.1
by Marius Kruger
remove all trailing whitespace from bzr source |
1558 |
- planned, not implemented:
|
1897.1.1
by Robert Collins
Add some useful summary data to osutils.walkdirs output. |
1559 |
path_from_tree_root is the path from the root of the tree.
|
1753.1.1
by Robert Collins
(rbc, jam, mbp)Add bzrlib.osutils.walkdirs, an optimised walk-and-stat routine. |
1560 |
|
3943.8.1
by Marius Kruger
remove all trailing whitespace from bzr source |
1561 |
:param prefix: Prefix the relpaths that are yielded with 'prefix'. This
|
1757.2.16
by Robert Collins
Review comments. |
1562 |
allows one to walk a subtree but get paths that are relative to a tree
|
1563 |
rooted higher up.
|
|
1753.1.1
by Robert Collins
(rbc, jam, mbp)Add bzrlib.osutils.walkdirs, an optimised walk-and-stat routine. |
1564 |
:return: an iterator over the dirs.
|
1565 |
"""
|
|
1897.1.1
by Robert Collins
Add some useful summary data to osutils.walkdirs output. |
1566 |
#TODO there is a bit of a smell where the results of the directory-
|
3943.8.1
by Marius Kruger
remove all trailing whitespace from bzr source |
1567 |
# summary in this, and the path from the root, may not agree
|
1897.1.1
by Robert Collins
Add some useful summary data to osutils.walkdirs output. |
1568 |
# depending on top and prefix - i.e. ./foo and foo as a pair leads to
|
1569 |
# potentially confusing output. We should make this more robust - but
|
|
1897.1.2
by Robert Collins
cleanup osutils.walkdirs changes after review. |
1570 |
# not at a speed cost. RBC 20060731
|
2255.7.33
by John Arbash Meinel
More inner loop tuning of walkdirs, can save as much as 5% |
1571 |
_lstat = os.lstat |
1753.1.1
by Robert Collins
(rbc, jam, mbp)Add bzrlib.osutils.walkdirs, an optimised walk-and-stat routine. |
1572 |
_directory = _directory_kind |
1996.3.14
by John Arbash Meinel
lazy_import osutils and sign_my_commits |
1573 |
_listdir = os.listdir |
3696.3.5
by Robert Collins
Streamline _walkdirs_utf8 for utf8 file systems, reducing time to traverse a mozilla tree from 1s to .6 seconds. (Robert Collins) |
1574 |
_kind_from_mode = file_kind_from_stat_mode |
2255.7.32
by John Arbash Meinel
Add tests that the walkdirs variants work on unicode paths. |
1575 |
pending = [(safe_unicode(prefix), "", _directory, None, safe_unicode(top))] |
1753.1.1
by Robert Collins
(rbc, jam, mbp)Add bzrlib.osutils.walkdirs, an optimised walk-and-stat routine. |
1576 |
while pending: |
1577 |
# 0 - relpath, 1- basename, 2- kind, 3- stat, 4-toppath
|
|
2255.7.33
by John Arbash Meinel
More inner loop tuning of walkdirs, can save as much as 5% |
1578 |
relroot, _, _, _, top = pending.pop() |
2255.7.32
by John Arbash Meinel
Add tests that the walkdirs variants work on unicode paths. |
1579 |
if relroot: |
1580 |
relprefix = relroot + u'/' |
|
1753.1.1
by Robert Collins
(rbc, jam, mbp)Add bzrlib.osutils.walkdirs, an optimised walk-and-stat routine. |
1581 |
else: |
2255.7.33
by John Arbash Meinel
More inner loop tuning of walkdirs, can save as much as 5% |
1582 |
relprefix = '' |
2255.7.32
by John Arbash Meinel
Add tests that the walkdirs variants work on unicode paths. |
1583 |
top_slash = top + u'/' |
2255.7.33
by John Arbash Meinel
More inner loop tuning of walkdirs, can save as much as 5% |
1584 |
|
1585 |
dirblock = [] |
|
1586 |
append = dirblock.append |
|
3585.2.4
by Robert Collins
* Deleting directories by hand before running ``bzr rm`` will not |
1587 |
try: |
1588 |
names = sorted(_listdir(top)) |
|
3596.2.2
by John Arbash Meinel
Factor out the common exception handling looking for ENOTDIR and use it |
1589 |
except OSError, e: |
1590 |
if not _is_error_enotdir(e): |
|
3585.2.4
by Robert Collins
* Deleting directories by hand before running ``bzr rm`` will not |
1591 |
raise
|
1592 |
else: |
|
1593 |
for name in names: |
|
1594 |
abspath = top_slash + name |
|
1595 |
statvalue = _lstat(abspath) |
|
3696.3.5
by Robert Collins
Streamline _walkdirs_utf8 for utf8 file systems, reducing time to traverse a mozilla tree from 1s to .6 seconds. (Robert Collins) |
1596 |
kind = _kind_from_mode(statvalue.st_mode) |
3585.2.4
by Robert Collins
* Deleting directories by hand before running ``bzr rm`` will not |
1597 |
append((relprefix + name, name, kind, statvalue, abspath)) |
2255.7.32
by John Arbash Meinel
Add tests that the walkdirs variants work on unicode paths. |
1598 |
yield (relroot, top), dirblock |
2255.7.33
by John Arbash Meinel
More inner loop tuning of walkdirs, can save as much as 5% |
1599 |
|
1753.1.1
by Robert Collins
(rbc, jam, mbp)Add bzrlib.osutils.walkdirs, an optimised walk-and-stat routine. |
1600 |
# push the user specified dirs from dirblock
|
2255.7.32
by John Arbash Meinel
Add tests that the walkdirs variants work on unicode paths. |
1601 |
pending.extend(d for d in reversed(dirblock) if d[2] == _directory) |
1773.3.1
by Robert Collins
Add path_prefix_key and compare_paths_prefix_order utility functions. |
1602 |
|
1603 |
||
3696.3.1
by Robert Collins
Refactor bzrlib.osutils._walkdirs_utf8 to aid API migration in future. |
1604 |
class DirReader(object):
    """Abstract interface for directory readers.

    Both methods raise NotImplementedError here and are meant to be
    provided by subclasses.
    """

    def top_prefix_to_starting_dir(self, top, prefix=""):
        """Build the starting directory entry for a walk.

        :param top: A utf8 path
        :param prefix: An optional utf8 path to prefix output relative paths
            with.
        :return: A tuple starting with prefix, and ending with the native
            encoding of top.
        """
        raise NotImplementedError(self.top_prefix_to_starting_dir)

    def read_dir(self, prefix, top):
        """Read the contents of a single directory.

        :param prefix: A utf8 prefix to be prepended to the path basenames.
        :param top: A natively encoded path to read.
        :return: A list of the directory's contents. Each item contains:
            (utf8_relpath, utf8_name, kind, lstatvalue, native_abspath)
        """
        raise NotImplementedError(self.read_dir)
|
1627 |
||
1628 |
||
1629 |
_selected_dir_reader = None |
|
1630 |
||
3557.2.3
by John Arbash Meinel
Change the logic for selecting a real _walkdirs_utf8 implementation, |
1631 |
|
2255.7.27
by John Arbash Meinel
Add a _walkdirs_utf8 which returns utf8 paths instead of Unicode. Approx 20% faster in walking utf8 filesystems |
1632 |
def _walkdirs_utf8(top, prefix=""): |
1633 |
"""Yield data about all the directories in a tree.
|
|
1634 |
||
1635 |
This yields the same information as walkdirs() only each entry is yielded
|
|
1636 |
in utf-8. On platforms which have a filesystem encoding of utf8 the paths
|
|
1637 |
are returned as exact byte-strings.
|
|
2255.7.32
by John Arbash Meinel
Add tests that the walkdirs variants work on unicode paths. |
1638 |
|
1639 |
:return: yields a tuple of (dir_info, [file_info])
|
|
1640 |
dir_info is (utf8_relpath, path-from-top)
|
|
1641 |
file_info is (utf8_relpath, utf8_name, kind, lstat, path-from-top)
|
|
1642 |
if top is an absolute path, path-from-top is also an absolute path.
|
|
1643 |
path-from-top might be unicode or utf8, but it is the correct path to
|
|
1644 |
pass to os functions to affect the file in question. (such as os.lstat)
|
|
1645 |
"""
|
|
3696.3.1
by Robert Collins
Refactor bzrlib.osutils._walkdirs_utf8 to aid API migration in future. |
1646 |
global _selected_dir_reader |
1647 |
if _selected_dir_reader is None: |
|
3557.2.3
by John Arbash Meinel
Change the logic for selecting a real _walkdirs_utf8 implementation, |
1648 |
fs_encoding = _fs_enc.upper() |
3224.5.17
by Andrew Bennetts
Avoid importing win32utils when sys.platform != win32 |
1649 |
if sys.platform == "win32" and win32utils.winver == 'Windows NT': |
3557.2.4
by John Arbash Meinel
Cleanup the tests a bit, and add a test that we downgrade if os.name isn't 'nt' |
1650 |
# Win98 doesn't have unicode apis like FindFirstFileW
|
1651 |
# TODO: We possibly could support Win98 by falling back to the
|
|
1652 |
# original FindFirstFile, and using TCHAR instead of WCHAR,
|
|
1653 |
# but that gets a bit tricky, and requires custom compiling
|
|
1654 |
# for win98 anyway.
|
|
3557.2.3
by John Arbash Meinel
Change the logic for selecting a real _walkdirs_utf8 implementation, |
1655 |
try: |
3696.3.1
by Robert Collins
Refactor bzrlib.osutils._walkdirs_utf8 to aid API migration in future. |
1656 |
from bzrlib._walkdirs_win32 import Win32ReadDir |
1657 |
_selected_dir_reader = Win32ReadDir() |
|
4241.14.6
by Vincent Ladeuil
Start DirReader parametrized tests. |
1658 |
except ImportError: |
1659 |
pass
|
|
1660 |
elif fs_encoding in ('UTF-8', 'US-ASCII', 'ANSI_X3.4-1968'): |
|
3557.2.3
by John Arbash Meinel
Change the logic for selecting a real _walkdirs_utf8 implementation, |
1661 |
# ANSI_X3.4-1968 is a form of ASCII
|
3696.3.5
by Robert Collins
Streamline _walkdirs_utf8 for utf8 file systems, reducing time to traverse a mozilla tree from 1s to .6 seconds. (Robert Collins) |
1662 |
try: |
1663 |
from bzrlib._readdir_pyx import UTF8DirReader |
|
1664 |
_selected_dir_reader = UTF8DirReader() |
|
4574.3.6
by Martin Pool
More warnings when failing to load extensions |
1665 |
except ImportError, e: |
4574.3.8
by Martin Pool
Only mutter extension load errors when they occur, and record for later |
1666 |
failed_to_load_extension(e) |
4241.14.6
by Vincent Ladeuil
Start DirReader parametrized tests. |
1667 |
pass
|
1668 |
||
1669 |
if _selected_dir_reader is None: |
|
1670 |
# Fallback to the python version
|
|
1671 |
_selected_dir_reader = UnicodeDirReader() |
|
1672 |
||
2255.7.33
by John Arbash Meinel
More inner loop tuning of walkdirs, can save as much as 5% |
1673 |
# 0 - relpath, 1- basename, 2- kind, 3- stat, 4-toppath
|
1674 |
# But we don't actually uses 1-3 in pending, so set them to None
|
|
3696.3.5
by Robert Collins
Streamline _walkdirs_utf8 for utf8 file systems, reducing time to traverse a mozilla tree from 1s to .6 seconds. (Robert Collins) |
1675 |
pending = [[_selected_dir_reader.top_prefix_to_starting_dir(top, prefix)]] |
3696.3.1
by Robert Collins
Refactor bzrlib.osutils._walkdirs_utf8 to aid API migration in future. |
1676 |
read_dir = _selected_dir_reader.read_dir |
1677 |
_directory = _directory_kind |
|
2255.7.27
by John Arbash Meinel
Add a _walkdirs_utf8 which returns utf8 paths instead of Unicode. Approx 20% faster in walking utf8 filesystems |
1678 |
while pending: |
3696.3.5
by Robert Collins
Streamline _walkdirs_utf8 for utf8 file systems, reducing time to traverse a mozilla tree from 1s to .6 seconds. (Robert Collins) |
1679 |
relroot, _, _, _, top = pending[-1].pop() |
1680 |
if not pending[-1]: |
|
1681 |
pending.pop() |
|
1682 |
dirblock = sorted(read_dir(relroot, top)) |
|
3696.3.1
by Robert Collins
Refactor bzrlib.osutils._walkdirs_utf8 to aid API migration in future. |
1683 |
yield (relroot, top), dirblock |
1684 |
# push the user specified dirs from dirblock
|
|
3696.3.5
by Robert Collins
Streamline _walkdirs_utf8 for utf8 file systems, reducing time to traverse a mozilla tree from 1s to .6 seconds. (Robert Collins) |
1685 |
next = [d for d in reversed(dirblock) if d[2] == _directory] |
1686 |
if next: |
|
1687 |
pending.append(next) |
|
3696.3.1
by Robert Collins
Refactor bzrlib.osutils._walkdirs_utf8 to aid API migration in future. |
1688 |
|
1689 |
||
1690 |
class UnicodeDirReader(DirReader):
    """Directory reader that lists with unicode paths and transcodes to utf8.

    It is meant for file systems whose encoding is not utf8.
    """

    __slots__ = ['_utf8_encode']

    def __init__(self):
        # Look the utf8 encoder up once; read_dir uses it for every name.
        self._utf8_encode = codecs.getencoder('utf8')

    def top_prefix_to_starting_dir(self, top, prefix=""):
        """See DirReader.top_prefix_to_starting_dir."""
        start_relpath = safe_utf8(prefix)
        start_abspath = safe_unicode(top)
        return (start_relpath, None, None, None, start_abspath)

    def read_dir(self, prefix, top):
        """Read one directory, returning utf8 names and unicode abspaths.

        top, and the abspath element of every returned entry, are unicode;
        all other paths are utf8.  Local disk IO is done via unicode calls to
        listdir etc.

        This is currently the fallback code path when the filesystem encoding
        is not UTF-8.  It may be better to implement an alternative so that
        we can safely handle paths that are not properly decodable in the
        current encoding.

        See DirReader.read_dir for details.

        :raises errors.BadFilenameEncoding: when encoding a listed name to
            utf8 raises UnicodeDecodeError.
        """
        encode_utf8 = self._utf8_encode
        lstat = os.lstat
        listdir = os.listdir
        kind_from_mode = file_kind_from_stat_mode

        relprefix = ''
        if prefix:
            relprefix = prefix + '/'
        top_slash = top + u'/'

        entries = []
        for name in sorted(listdir(top)):
            try:
                name_utf8 = encode_utf8(name)[0]
            except UnicodeDecodeError:
                # NOTE(review): presumably listdir handed back a byte string
                # it could not decode, so encoding it fails -- confirm.
                raise errors.BadFilenameEncoding(
                    encode_utf8(relprefix)[0] + name, _fs_enc)
            abspath = top_slash + name
            statvalue = lstat(abspath)
            kind = kind_from_mode(statvalue.st_mode)
            entries.append(
                (relprefix + name_utf8, name_utf8, kind, statvalue, abspath))
        return entries
2255.7.27
by John Arbash Meinel
Add a _walkdirs_utf8 which returns utf8 paths instead of Unicode. Approx 20% faster in walking utf8 filesystems |
1739 |
|
1740 |
||
1907.3.2
by John Arbash Meinel
Updated the copy_tree function to allow overriding functionality. |
1741 |
def copy_tree(from_path, to_path, handlers=None):
    """Copy all of the entries in from_path into to_path.

    :param from_path: The base directory to copy.
    :param to_path: The target directory. If it does not exist, it will
        be created (using the 'directory' handler).
    :param handlers: An optional dictionary of functions, each taking a
        source path and a destination path.  It is keyed on the file kind,
        such as 'file', 'directory', or 'symlink'.  Kinds that are not
        supplied use these defaults:

        - 'file': shutil.copy2()
        - 'directory': os.mkdir()
        - 'symlink': os.readlink() + os.symlink()

        None (the default) means no overrides.  The dictionary passed in is
        not modified.
    :raises KeyError: if an entry has a kind for which there is neither a
        default nor a supplied handler.
    """
    def copy_dir(source, dest):
        """Create dest as a new, empty directory; source is not consulted."""
        os.mkdir(dest)

    def copy_link(source, dest):
        """Copy the contents of a symlink"""
        link_to = os.readlink(source)
        os.symlink(link_to, dest)

    real_handlers = {'file': shutil.copy2,
                     'symlink': copy_link,
                     'directory': copy_dir,
                    }
    if handlers is not None:
        real_handlers.update(handlers)

    if not os.path.exists(to_path):
        real_handlers['directory'](from_path, to_path)

    # We use a cheap trick here: walkdirs() builds each entry's abspath from
    # its first argument and each relpath from its prefix.  Walking from_path
    # with to_path as the prefix therefore gives us both the source and the
    # target of every entry without any extra work.
    for dir_info, entries in walkdirs(from_path, prefix=to_path):
        for relpath, name, kind, st, abspath in entries:
            real_handlers[kind](abspath, relpath)
1907.3.1
by John Arbash Meinel
create a copy_tree wrapper around walkdirs() |
1781 |
|
1782 |
||
1773.3.1
by Robert Collins
Add path_prefix_key and compare_paths_prefix_order utility functions. |
1783 |
def path_prefix_key(path):
    """Return a sort key that orders paths in prefix order.

    Sorting paths with this key groups them by containing directory, which
    is the same order that walkdirs uses.

    :param path: The path to build a key for.
    :return: A (dirname-of-path, path) tuple.
    """
    parent = dirname(path)
    return (parent, path)
1773.3.1
by Robert Collins
Add path_prefix_key and compare_paths_prefix_order utility functions. |
1789 |
|
1790 |
||
1791 |
def compare_paths_prefix_order(path_a, path_b):
    """cmp-style comparison of two paths in the order walkdirs uses.

    :param path_a: The first path.
    :param path_b: The second path.
    :return: The result of cmp() on the two paths' path_prefix_key values.
    """
    return cmp(path_prefix_key(path_a), path_prefix_key(path_b))
|
1955.2.2
by John Arbash Meinel
Change the name of the test classes (test_lang => test_locale), move the function into osutils.py |
1796 |
|
1797 |
||
1798 |
_cached_user_encoding = None |
|
1799 |
||
1800 |
||
2192.1.3
by Alexander Belchenko
Tests for osutils.get_user_encoding |
1801 |
def get_user_encoding(use_cache=True): |
1955.2.2
by John Arbash Meinel
Change the name of the test classes (test_lang => test_locale), move the function into osutils.py |
1802 |
"""Find out what the preferred user encoding is.
|
1803 |
||
1804 |
This is generally the encoding that is used for command line parameters
|
|
1805 |
and file contents. This may be different from the terminal encoding
|
|
1806 |
or the filesystem encoding.
|
|
1807 |
||
2192.1.3
by Alexander Belchenko
Tests for osutils.get_user_encoding |
1808 |
:param use_cache: Enable cache for detected encoding.
|
1809 |
(This parameter is turned on by default,
|
|
1810 |
and required only for selftesting)
|
|
1811 |
||
1955.2.2
by John Arbash Meinel
Change the name of the test classes (test_lang => test_locale), move the function into osutils.py |
1812 |
:return: A string defining the preferred user encoding
|
1813 |
"""
|
|
1814 |
global _cached_user_encoding |
|
2192.1.3
by Alexander Belchenko
Tests for osutils.get_user_encoding |
1815 |
if _cached_user_encoding is not None and use_cache: |
1955.2.2
by John Arbash Meinel
Change the name of the test classes (test_lang => test_locale), move the function into osutils.py |
1816 |
return _cached_user_encoding |
1817 |
||
1818 |
if sys.platform == 'darwin': |
|
3638.3.10
by Vincent Ladeuil
Provides a better default encoding on OSX. |
1819 |
# python locale.getpreferredencoding() always return
|
1820 |
# 'mac-roman' on darwin. That's a lie.
|
|
1955.2.2
by John Arbash Meinel
Change the name of the test classes (test_lang => test_locale), move the function into osutils.py |
1821 |
sys.platform = 'posix' |
1822 |
try: |
|
3638.3.10
by Vincent Ladeuil
Provides a better default encoding on OSX. |
1823 |
if os.environ.get('LANG', None) is None: |
1824 |
# If LANG is not set, we end up with 'ascii', which is bad
|
|
1825 |
# ('mac-roman' is more than ascii), so we set a default which
|
|
1826 |
# will give us UTF-8 (which appears to work in all cases on
|
|
1827 |
# OSX). Users are still free to override LANG of course, as
|
|
1828 |
# long as it give us something meaningful. This work-around
|
|
1829 |
# *may* not be needed with python 3k and/or OSX 10.5, but will
|
|
1830 |
# work with them too -- vila 20080908
|
|
1831 |
os.environ['LANG'] = 'en_US.UTF-8' |
|
1955.2.2
by John Arbash Meinel
Change the name of the test classes (test_lang => test_locale), move the function into osutils.py |
1832 |
import locale |
1833 |
finally: |
|
1834 |
sys.platform = 'darwin' |
|
1835 |
else: |
|
1836 |
import locale |
|
1837 |
||
1838 |
try: |
|
2192.1.3
by Alexander Belchenko
Tests for osutils.get_user_encoding |
1839 |
user_encoding = locale.getpreferredencoding() |
1955.2.2
by John Arbash Meinel
Change the name of the test classes (test_lang => test_locale), move the function into osutils.py |
1840 |
except locale.Error, e: |
1955.2.3
by John Arbash Meinel
Change error message text |
1841 |
sys.stderr.write('bzr: warning: %s\n' |
2001.2.1
by Jelmer Vernooij
Fix typo in encoding warning. |
1842 |
' Could not determine what text encoding to use.\n' |
1955.2.3
by John Arbash Meinel
Change error message text |
1843 |
' This error usually means your Python interpreter\n' |
1844 |
' doesn\'t support the locale set by $LANG (%s)\n' |
|
1845 |
" Continuing with ascii encoding.\n" |
|
1955.2.2
by John Arbash Meinel
Change the name of the test classes (test_lang => test_locale), move the function into osutils.py |
1846 |
% (e, os.environ.get('LANG'))) |
2192.1.7
by Alexander Belchenko
get_user_encoding: if locale.Error raised we need to set user_encoding to 'ascii' as warning says |
1847 |
user_encoding = 'ascii' |
1955.2.2
by John Arbash Meinel
Change the name of the test classes (test_lang => test_locale), move the function into osutils.py |
1848 |
|
2127.4.1
by Alexander Belchenko
(jam, bialix) Workaround for cp0 console encoding on Windows |
1849 |
# Windows returns 'cp0' to indicate there is no code page. So we'll just
|
1850 |
# treat that as ASCII, and not support printing unicode characters to the
|
|
1851 |
# console.
|
|
3405.3.1
by Neil Martinsen-Burrell
accept for an encoding to mean ascii |
1852 |
#
|
1853 |
# For python scripts run under vim, we get '', so also treat that as ASCII
|
|
1854 |
if user_encoding in (None, 'cp0', ''): |
|
2192.1.3
by Alexander Belchenko
Tests for osutils.get_user_encoding |
1855 |
user_encoding = 'ascii' |
2192.1.1
by Alexander Belchenko
Before actually using encoding need to check that Python has corresponding codec |
1856 |
else: |
1857 |
# check encoding
|
|
1858 |
try: |
|
2192.1.3
by Alexander Belchenko
Tests for osutils.get_user_encoding |
1859 |
codecs.lookup(user_encoding) |
2192.1.1
by Alexander Belchenko
Before actually using encoding need to check that Python has corresponding codec |
1860 |
except LookupError: |
1861 |
sys.stderr.write('bzr: warning:' |
|
1862 |
' unknown encoding %s.' |
|
1863 |
' Continuing with ascii encoding.\n' |
|
2192.1.3
by Alexander Belchenko
Tests for osutils.get_user_encoding |
1864 |
% user_encoding |
2192.1.1
by Alexander Belchenko
Before actually using encoding need to check that Python has corresponding codec |
1865 |
)
|
2192.1.3
by Alexander Belchenko
Tests for osutils.get_user_encoding |
1866 |
user_encoding = 'ascii' |
1867 |
||
1868 |
if use_cache: |
|
1869 |
_cached_user_encoding = user_encoding |
|
1870 |
||
1871 |
return user_encoding |
|
2091.1.1
by Martin Pool
Avoid MSG_WAITALL as it doesn't work on Windows |
1872 |
|
1873 |
||
3626.1.1
by Mark Hammond
Add osutils.get_host_name() to return a unicode hostname to prevent |
1874 |
def get_host_name():
    """Return the name of the current host as unicode.

    This is meant to be used in place of socket.gethostname() because that
    behaves inconsistently on different platforms.

    On win32 the lookup is delegated to win32utils.get_host_name(); on other
    platforms the result of socket.gethostname() is decoded with the user
    encoding.
    """
    if sys.platform != "win32":
        import socket
        raw_name = socket.gethostname()
        return raw_name.decode(get_user_encoding())
    import win32utils
    return win32utils.get_host_name()
|
1886 |
||
1887 |
||
2091.1.1
by Martin Pool
Avoid MSG_WAITALL as it doesn't work on Windows |
1888 |
def recv_all(socket, bytes):
    """Read exactly ``bytes`` bytes from ``socket`` unless it closes first.

    A plain socket.recv() may hand back fewer bytes than were asked for,
    depending on what is in the OS buffer. MSG_WAITALL is not available on
    all platforms, so this keeps calling recv() until the requested amount
    has arrived. If the remote end closes, whatever was received so far
    (possibly less than requested) is returned.

    This isn't optimized and is intended mostly for use in testing.

    :param socket: Object providing a recv(count) method.
    :param bytes: Number of bytes wanted.
    :return: The received data as a single string.
    """
    pieces = []
    remaining = bytes
    while remaining > 0:
        piece = until_no_eintr(socket.recv, remaining)
        if piece == '':
            # eof
            break
        pieces.append(piece)
        remaining -= len(piece)
    return ''.join(pieces)
|
1905 |
||
3118.2.1
by Andrew Bennetts
(andrew) Fix #115781 by passing no more than 64k at a time to socket.sendall. |
1906 |
|
3958.1.5
by Andrew Bennetts
Remove unnecessary 'direction' argument to osutils.send_all. |
1907 |
def send_all(socket, bytes, report_activity=None):
    """Write every byte of ``bytes`` to ``socket`` in bounded chunks.

    Regular socket.sendall() can give socket error 10053 on Windows. This
    implementation passes no more than 64k at a time to sendall(), which
    avoids that problem.

    :param socket: Object providing a sendall(data) method.
    :param bytes: The data to send.
    :param report_activity: Optional callable invoked as
        report_activity(length, 'write') before each chunk is sent, see
        Transport._report_activity
    """
    chunk_size = 2**16
    total = len(bytes)
    offset = 0
    while offset < total:
        block = bytes[offset:offset + chunk_size]
        if report_activity is not None:
            report_activity(len(block), 'write')
        until_no_eintr(socket.sendall, block)
        offset += chunk_size
3118.2.1
by Andrew Bennetts
(andrew) Fix #115781 by passing no more than 64k at a time to socket.sendall. |
1922 |
|
1923 |
||
2091.3.7
by Aaron Bentley
Rename real_parent to dereferenced_path |
1924 |
def dereference_path(path):
    """Return the real path leading to a file.

    Every parent element of the path is dereferenced, but the final
    element (the file itself) is left as given.

    :param path: The original path. May be absolute or relative.
    :return: the real path *to* the file
    """
    parent_part, final_part = os.path.split(path)
    # The pathjoin for '.' is a workaround for Python bug #1213894.
    # (initial path components aren't dereferenced)
    anchored_parent = pathjoin('.', parent_part)
    real_parent = realpath(anchored_parent)
    return pathjoin(real_parent, final_part)
|
2681.3.4
by Lukáš Lalinsky
- Rename 'windows' to 'mapi' |
1936 |
|
1937 |
||
1938 |
def supports_mapi():
    """Tell whether MAPI can be used to launch a mail client.

    :return: True when running on win32, False otherwise.
    """
    running_on_windows = (sys.platform == "win32")
    return running_on_windows
|
3089.3.8
by Ian Clatworthy
move resource loading into a reusable function |
1941 |
|
1942 |
||
1943 |
def resource_string(package, resource_name):
    """Load a resource from a package and return it as a string.

    Note: Only packages that start with bzrlib are currently supported.

    This is designed to be a lightweight implementation of resource
    loading in a way which is API compatible with the same API from
    pkg_resources. See
    http://peak.telecommunity.com/DevCenter/PkgResources#basic-resource-access.
    If and when pkg_resources becomes a standard library, this routine
    can delegate to it.

    :param package: Dotted package name, either 'bzrlib' itself or a name
        beginning with 'bzrlib.'.
    :param resource_name: Path of the resource relative to the package.
    :return: The contents of the resource file, opened in 'rU' mode.
    :raises errors.BzrError: if package is not within bzrlib.
    """
    # Check package name is within bzrlib
    if package == "bzrlib":
        resource_relpath = resource_name
    elif package.startswith("bzrlib."):
        package = package[len("bzrlib."):].replace('.', os.sep)
        resource_relpath = pathjoin(package, resource_name)
    else:
        raise errors.BzrError('resource package %s not in bzrlib' % package)

    # Map the resource to a file and read its contents
    base = dirname(bzrlib.__file__)
    if getattr(sys, 'frozen', None):    # bzr.exe
        base = abspath(pathjoin(base, '..', '..'))
    filename = pathjoin(base, resource_relpath)
    resource_file = open(filename, 'rU')
    try:
        return resource_file.read()
    finally:
        # Close explicitly rather than relying on garbage collection to
        # release the file handle.
        resource_file.close()
|
1739.2.7
by Robert Collins
Update readdir pyrex source files and usage in line with current practice. |
1970 |
|
1971 |
||
3696.3.5
by Robert Collins
Streamline _walkdirs_utf8 for utf8 file systems, reducing time to traverse a mozilla tree from 1s to .6 seconds. (Robert Collins) |
1972 |
def file_kind_from_stat_mode_thunk(mode):
    """Pick the real file_kind_from_stat_mode implementation, then call it.

    The module-level name file_kind_from_stat_mode starts out bound to this
    function. While it is still bound to this function, a call tries to take
    kind_from_mode from bzrlib._readdir_pyx.UTF8DirReader and, if that import
    fails, falls back to bzrlib._readdir_py._kind_from_mode. Either way the
    module-level name is rebound to the chosen implementation, so later calls
    made through that name no longer pass through this function.

    :param mode: Value passed straight on to the chosen implementation
        (file_kind() passes the st_mode of an lstat result).
    :return: Whatever the chosen implementation returns for mode.
    """
    # Needed so that both the assignment and the 'import ... as' below rebind
    # the module-level name rather than creating a local.
    global file_kind_from_stat_mode
    if file_kind_from_stat_mode is file_kind_from_stat_mode_thunk:
        try:
            from bzrlib._readdir_pyx import UTF8DirReader
            file_kind_from_stat_mode = UTF8DirReader().kind_from_mode
        except ImportError, e:
            # This is one time where we won't warn that an extension failed to
            # load. The extension is never available on Windows anyway.
            from bzrlib._readdir_py import (
                _kind_from_mode as file_kind_from_stat_mode
                )
    return file_kind_from_stat_mode(mode)
# Start with the thunk installed; the first call replaces it.
file_kind_from_stat_mode = file_kind_from_stat_mode_thunk
|
1986 |
||
1987 |
||
1988 |
def file_kind(f, _lstat=os.lstat):
    """Return the kind of the file at ``f``, judged from its lstat mode.

    :param f: Path to examine.
    :param _lstat: Function used to stat the path; defaults to os.lstat.
    :return: The result of file_kind_from_stat_mode() for the path's st_mode.
    :raises errors.NoSuchFile: if an OSError with errno ENOENT or ENOTDIR
        occurs. Any other OSError is re-raised unchanged.
    """
    try:
        stat_mode = _lstat(f).st_mode
        return file_kind_from_stat_mode(stat_mode)
    except OSError:
        # Fetch the active exception explicitly instead of binding it in
        # the except clause.
        err = sys.exc_info()[1]
        missing_codes = (errno.ENOENT, errno.ENOTDIR)
        if getattr(err, 'errno', None) not in missing_codes:
            raise
        raise errors.NoSuchFile(f)
|
|
1995 |
||
3923.3.1
by Andrew Bennetts
Quick attempt at adding some EINTR-proofing to smart protocol code. |
1996 |
|
1997 |
def until_no_eintr(f, *a, **kw):
    """Call f(*a, **kw) and return its result, retrying after EINTR.

    When the call raises an IOError or OSError whose errno is EINTR it is
    made again with the same arguments; any other error is re-raised to the
    caller.
    """
    # Borrowed from Twisted's twisted.python.util.untilConcludes function.
    while True:
        try:
            result = f(*a, **kw)
        except (IOError, OSError):
            # Fetch the active exception explicitly instead of binding it
            # in the except clause.
            if sys.exc_info()[1].errno != errno.EINTR:
                raise
        else:
            return result
|
|
2007 |
||
4183.6.4
by Martin Pool
Separate out re_compile_checked |
2008 |
def re_compile_checked(re_string, flags=0, where=""):
    """Compile a regular expression, turning failures into a clear error.

    This should only be used when compiling user-supplied REs.

    :param re_string: Text form of regular expression.
    :param flags: eg re.IGNORECASE
    :param where: Message explaining to the user the context where
        it occurred, eg 'log search filter'.
    :return: The compiled regular expression object.
    :raises errors.BzrCommandError: if compiling the expression, or a trial
        search of the empty string with it, raises re.error.
    """
    # from https://bugs.launchpad.net/bzr/+bug/251352
    try:
        compiled = re.compile(re_string, flags)
        compiled.search("")
    except re.error:
        # despite the name 'error' is a type
        problem = sys.exc_info()[1]
        context = where
        if where:
            context = ' in ' + where
        raise errors.BzrCommandError('Invalid regular expression%s: %r: %s'
            % (context, re_string, problem))
    else:
        return compiled
|
2029 |
||
3923.3.1
by Andrew Bennetts
Quick attempt at adding some EINTR-proofing to smart protocol code. |
2030 |
|
0.16.79
by Aaron Bentley
Remove dependencies on bzrtools |
2031 |
if sys.platform != "win32":
    import termios
    import tty
    def getchar():
        """Read one character from stdin with the terminal in raw mode.

        The terminal attributes in effect beforehand are saved and restored
        (with TCSADRAIN) once the read finishes, whether or not it succeeds.
        """
        stdin_fd = sys.stdin.fileno()
        saved_attrs = termios.tcgetattr(stdin_fd)
        try:
            tty.setraw(stdin_fd)
            return sys.stdin.read(1)
        finally:
            termios.tcsetattr(stdin_fd, termios.TCSADRAIN, saved_attrs)
else:
    import msvcrt
    def getchar():
        """Return the result of msvcrt.getch()."""
        return msvcrt.getch()
|
4398.4.3
by Vincent Ladeuil
Detect # cores on win32 and Solaris too. |
2047 |
|
2048 |
||
2049 |
# Platform specific ways of asking how many processors are available. Each
# variant returns either None or a value that local_concurrency() converts
# with int().
if sys.platform.startswith('linux'):
    def _local_concurrency():
        """Derive the processor count from /proc/cpuinfo.

        :return: The index on the last 'processor' line plus one, or None
            when no such line is found.
        """
        concurrency = None
        prefix = 'processor'
        cpuinfo = open('/proc/cpuinfo', 'rb')
        try:
            for line in cpuinfo:
                if line.startswith(prefix):
                    concurrency = int(line[line.find(':')+1:]) + 1
        finally:
            # Close explicitly rather than relying on garbage collection.
            cpuinfo.close()
        return concurrency
elif sys.platform == 'darwin':
    def _local_concurrency():
        """Return the raw output of 'sysctl -n hw.availcpu'."""
        return subprocess.Popen(['sysctl', '-n', 'hw.availcpu'],
                                stdout=subprocess.PIPE).communicate()[0]
elif sys.platform[0:7] == 'freebsd':
    def _local_concurrency():
        """Return the raw output of 'sysctl -n hw.ncpu'."""
        return subprocess.Popen(['sysctl', '-n', 'hw.ncpu'],
                                stdout=subprocess.PIPE).communicate()[0]
elif sys.platform == 'sunos5':
    def _local_concurrency():
        """Return the raw output of 'psrinfo -p'."""
        return subprocess.Popen(['psrinfo', '-p'],
                                stdout=subprocess.PIPE).communicate()[0]
elif sys.platform == "win32":
    def _local_concurrency():
        """Return the NUMBER_OF_PROCESSORS environment value, or None."""
        # This appears to return the number of cores.
        return os.environ.get('NUMBER_OF_PROCESSORS')
else:
    def _local_concurrency():
        """Return None: no detection method for this platform."""
        # Who knows ?
        return None
|
2077 |
||
2078 |
||
4398.4.4
by Vincent Ladeuil
Fixed as per John's review. |
2079 |
# Result of the last cached local_concurrency() computation, or None if
# nothing has been cached yet.
_cached_local_concurrency = None

def local_concurrency(use_cache=True):
    """Return how many processes can be run concurrently.

    The BZR_CONCURRENCY environment variable takes precedence when it is
    set. Otherwise rely on platform specific implementations and default to
    1 (one) if anything goes wrong.

    :param use_cache: When true, return the previously cached value if there
        is one, and cache the value computed by this call. When false, always
        recompute and leave the cache untouched.
    :return: The concurrency as an int.
    """
    global _cached_local_concurrency

    if _cached_local_concurrency is not None and use_cache:
        return _cached_local_concurrency

    concurrency = os.environ.get('BZR_CONCURRENCY', None)
    if concurrency is None:
        try:
            concurrency = _local_concurrency()
        except (OSError, IOError):
            # Detection failed; concurrency stays None and becomes 1 below.
            pass
    try:
        concurrency = int(concurrency)
    except (TypeError, ValueError):
        concurrency = 1
    if use_cache:
        # Store into the module-level cache that is consulted above.
        _cached_local_concurrency = concurrency
    return concurrency
4794.1.12
by Robert Collins
Create a StreamWriter helper that doesn't trigger implicit decode('ascii') on write(a_str). |
2105 |
|
2106 |
||
4794.1.15
by Robert Collins
Review feedback. |
2107 |
class UnicodeOrBytesToBytesWriter(codecs.StreamWriter):
    """A stream writer that passes str arguments through without decoding.

    Objects whose type is exactly str are written to the underlying stream
    as they are; anything else is first run through the supplied encode
    function.
    """

    def __init__(self, encode, stream, errors='strict'):
        """Create the writer.

        :param encode: Callable taking (object, errors) and returning a
            tuple whose first item is the encoded data.
        :param stream: Object with a write() method that receives output.
        :param errors: Error handling scheme handed to encode.
        """
        codecs.StreamWriter.__init__(self, stream, errors)
        self.encode = encode

    def write(self, object):
        """Write object to the stream, encoding it unless it is a str."""
        payload = object
        if type(object) is not str:
            payload, _ = self.encode(object, self.errors)
        self.stream.write(payload)