697
671
:param timezone: How to display the time: 'utc', 'original' for the
698
672
timezone specified by offset, or 'local' for the process's current
700
:param date_fmt: strftime format.
701
:param show_offset: Whether to append the timezone.
703
(date_fmt, tt, offset_str) = \
704
_format_date(t, offset, timezone, date_fmt, show_offset)
705
date_fmt = date_fmt.replace('%a', weekdays[tt[6]])
706
date_str = time.strftime(date_fmt, tt)
707
return date_str + offset_str
709
def format_local_date(t, offset=0, timezone='original', date_fmt=None,
711
"""Return a unicode date string formatted according to the current locale.
713
:param t: Seconds since the epoch.
714
:param offset: Timezone offset in seconds east of utc.
715
:param timezone: How to display the time: 'utc', 'original' for the
716
timezone specified by offset, or 'local' for the process's current
718
:param date_fmt: strftime format.
719
:param show_offset: Whether to append the timezone.
721
(date_fmt, tt, offset_str) = \
722
_format_date(t, offset, timezone, date_fmt, show_offset)
723
date_str = time.strftime(date_fmt, tt)
724
if not isinstance(date_str, unicode):
725
date_str = date_str.decode(get_user_encoding(), 'replace')
726
return date_str + offset_str
728
def _format_date(t, offset, timezone, date_fmt, show_offset):
674
:param show_offset: Whether to append the timezone.
675
:param date_fmt: strftime format.
729
677
if timezone == 'utc':
730
678
tt = time.gmtime(t)
927
843
shutil.copyfile(src, dest)
846
# Look Before You Leap (LBYL) is appropriate here instead of Easier to Ask for
847
# Forgiveness than Permission (EAFP) because:
848
# - root can damage a solaris file system by using unlink,
849
# - unlink raises different exceptions on different OSes (linux: EISDIR, win32:
850
# EACCES, OSX: EPERM) when invoked on a directory.
930
851
def delete_any(path):
931
"""Delete a file, symlink or directory.
933
Will delete even if readonly.
936
_delete_file_or_dir(path)
937
except (OSError, IOError), e:
938
if e.errno in (errno.EPERM, errno.EACCES):
939
# make writable and try again
942
except (OSError, IOError):
944
_delete_file_or_dir(path)
949
def _delete_file_or_dir(path):
950
# Look Before You Leap (LBYL) is appropriate here instead of Easier to Ask for
951
# Forgiveness than Permission (EAFP) because:
952
# - root can damage a solaris file system by using unlink,
953
# - unlink raises different exceptions on different OSes (linux: EISDIR, win32:
954
# EACCES, OSX: EPERM) when invoked on a directory.
852
"""Delete a file or directory."""
955
853
if isdir(path): # Takes care of symlinks
1044
if len(head) <= len(base) and head != base:
1045
raise errors.PathNotChild(rp, base)
927
while len(head) >= len(base):
1046
928
if head == base:
1048
head, tail = split(head)
930
head, tail = os.path.split(head)
934
raise errors.PathNotChild(rp, base)
1053
return pathjoin(*reversed(s))
1058
def _cicp_canonical_relpath(base, path):
1059
"""Return the canonical path relative to base.
1061
Like relpath, but on case-insensitive-case-preserving file-systems, this
1062
will return the relpath as stored on the file-system rather than in the
1063
case specified in the input string, for all existing portions of the path.
1065
This will cause O(N) behaviour if called for every path in a tree; if you
1066
have a number of paths to convert, you should use canonical_relpaths().
1068
# TODO: it should be possible to optimize this for Windows by using the
1069
# win32 API FindFiles function to look for the specified name - but using
1070
# os.listdir() still gives us the correct, platform agnostic semantics in
1073
rel = relpath(base, path)
1074
# '.' will have been turned into ''
1078
abs_base = abspath(base)
1080
_listdir = os.listdir
1082
# use an explicit iterator so we can easily consume the rest on early exit.
1083
bit_iter = iter(rel.split('/'))
1084
for bit in bit_iter:
1086
for look in _listdir(current):
1087
if lbit == look.lower():
1088
current = pathjoin(current, look)
1091
# got to the end, nothing matched, so we just return the
1092
# non-existing bits as they were specified (the filename may be
1093
# the target of a move, for example).
1094
current = pathjoin(current, bit, *list(bit_iter))
1096
return current[len(abs_base)+1:]
1098
# XXX - TODO - we need better detection/integration of case-insensitive
1099
# file-systems; Linux often sees FAT32 devices (or NFS-mounted OSX
1100
# filesystems), for example, so could probably benefit from the same basic
1101
# support there. For now though, only Windows and OSX get that support, and
1102
# they get it for *all* file-systems!
1103
if sys.platform in ('win32', 'darwin'):
1104
canonical_relpath = _cicp_canonical_relpath
1106
canonical_relpath = relpath
1108
def canonical_relpaths(base, paths):
1109
"""Create an iterable to canonicalize a sequence of relative paths.
1111
The intent is for this implementation to use a cache, vastly speeding
1112
up multiple transformations in the same directory.
1114
# but for now, we haven't optimized...
1115
return [canonical_relpath(base, p) for p in paths]
1117
942
def safe_unicode(unicode_or_utf8_string):
1118
943
"""Coerce unicode_or_utf8_string into unicode.
1120
945
If it is unicode, it is returned.
1121
Otherwise it is decoded from utf-8. If decoding fails, the exception is
1122
wrapped in a BzrBadParameterNotUnicode exception.
946
Otherwise it is decoded from utf-8. If a decoding error
947
occurs, the exception is wrapped
948
as a BzrBadParameter exception.
1124
950
if isinstance(unicode_or_utf8_string, unicode):
1125
951
return unicode_or_utf8_string
1342
1168
def walkdirs(top, prefix=""):
1343
1169
"""Yield data about all the directories in a tree.
1345
1171
This yields all the data about the contents of a directory at a time.
1346
1172
After each directory has been yielded, if the caller has mutated the list
1347
1173
to exclude some directories, they are then not descended into.
1349
1175
The data yielded is of the form:
1350
1176
((directory-relpath, directory-path-from-top),
1351
1177
[(relpath, basename, kind, lstat, path-from-top), ...]),
1352
1178
- directory-relpath is the relative path of the directory being returned
1353
1179
with respect to top. prefix is prepended to this.
1354
- directory-path-from-top is the path including top for this directory.
1180
- directory-path-from-top is the path including top for this directory.
1355
1181
It is suitable for use with os functions.
1356
1182
- relpath is the relative path within the subtree being walked.
1357
1183
- basename is the basename of the path
1359
1185
present within the tree - but it may be recorded as versioned. See
1360
1186
versioned_kind.
1361
1187
- lstat is the stat data *if* the file was statted.
1362
- planned, not implemented:
1188
- planned, not implemented:
1363
1189
path_from_tree_root is the path from the root of the tree.
1365
:param prefix: Prefix the relpaths that are yielded with 'prefix'. This
1191
:param prefix: Prefix the relpaths that are yielded with 'prefix'. This
1366
1192
allows one to walk a subtree but get paths that are relative to a tree
1367
1193
rooted higher up.
1368
1194
:return: an iterator over the dirs.
1370
1196
#TODO there is a bit of a smell where the results of the directory-
1371
# summary in this, and the path from the root, may not agree
1197
# summary in this, and the path from the root, may not agree
1372
1198
# depending on top and prefix - i.e. ./foo and foo as a pair leads to
1373
1199
# potentially confusing output. We should make this more robust - but
1374
1200
# not at a speed cost. RBC 20060731
1375
1201
_lstat = os.lstat
1376
1202
_directory = _directory_kind
1377
1203
_listdir = os.listdir
1378
_kind_from_mode = file_kind_from_stat_mode
1204
_kind_from_mode = _formats.get
1379
1205
pending = [(safe_unicode(prefix), "", _directory, None, safe_unicode(top))]
1381
1207
# 0 - relpath, 1- basename, 2- kind, 3- stat, 4-toppath
1405
1231
pending.extend(d for d in reversed(dirblock) if d[2] == _directory)
1408
class DirReader(object):
1409
"""An interface for reading directories."""
1411
def top_prefix_to_starting_dir(self, top, prefix=""):
1412
"""Converts top and prefix to a starting dir entry
1414
:param top: A utf8 path
1415
:param prefix: An optional utf8 path to prefix output relative paths
1417
:return: A tuple starting with prefix, and ending with the native
1420
raise NotImplementedError(self.top_prefix_to_starting_dir)
1422
def read_dir(self, prefix, top):
1423
"""Read a specific dir.
1425
:param prefix: A utf8 prefix to be prepended to the path basenames.
1426
:param top: A natively encoded path to read.
1427
:return: A list of the directory's contents. Each item contains:
1428
(utf8_relpath, utf8_name, kind, lstatvalue, native_abspath)
1430
raise NotImplementedError(self.read_dir)
1433
_selected_dir_reader = None
1234
_real_walkdirs_utf8 = None
1436
1236
def _walkdirs_utf8(top, prefix=""):
1437
1237
"""Yield data about all the directories in a tree.
1447
1247
path-from-top might be unicode or utf8, but it is the correct path to
1448
1248
pass to os functions to affect the file in question. (such as os.lstat)
1450
global _selected_dir_reader
1451
if _selected_dir_reader is None:
1250
global _real_walkdirs_utf8
1251
if _real_walkdirs_utf8 is None:
1452
1252
fs_encoding = _fs_enc.upper()
1453
if sys.platform == "win32" and win32utils.winver == 'Windows NT':
1253
if win32utils.winver == 'Windows NT':
1454
1254
# Win98 doesn't have unicode apis like FindFirstFileW
1455
1255
# TODO: We possibly could support Win98 by falling back to the
1456
1256
# original FindFirstFile, and using TCHAR instead of WCHAR,
1457
1257
# but that gets a bit tricky, and requires custom compiling
1458
1258
# for win98 anyway.
1460
from bzrlib._walkdirs_win32 import Win32ReadDir
1461
_selected_dir_reader = Win32ReadDir()
1260
from bzrlib._walkdirs_win32 import _walkdirs_utf8_win32_find_file
1462
1261
except ImportError:
1464
elif fs_encoding in ('UTF-8', 'US-ASCII', 'ANSI_X3.4-1968'):
1262
_real_walkdirs_utf8 = _walkdirs_unicode_to_utf8
1264
_real_walkdirs_utf8 = _walkdirs_utf8_win32_find_file
1265
elif fs_encoding not in ('UTF-8', 'US-ASCII', 'ANSI_X3.4-1968'):
1465
1266
# ANSI_X3.4-1968 is a form of ASCII
1467
from bzrlib._readdir_pyx import UTF8DirReader
1468
_selected_dir_reader = UTF8DirReader()
1472
if _selected_dir_reader is None:
1473
# Fallback to the python version
1474
_selected_dir_reader = UnicodeDirReader()
1267
_real_walkdirs_utf8 = _walkdirs_unicode_to_utf8
1269
_real_walkdirs_utf8 = _walkdirs_fs_utf8
1270
return _real_walkdirs_utf8(top, prefix=prefix)
1273
def _walkdirs_fs_utf8(top, prefix=""):
1274
"""See _walkdirs_utf8.
1276
This sub-function is called when we know the filesystem is already in utf8
1277
encoding. So we don't need to transcode filenames.
1280
_directory = _directory_kind
1281
# Use C accelerated directory listing.
1282
_listdir = _read_dir
1283
_kind_from_mode = _formats.get
1476
1285
# 0 - relpath, 1- basename, 2- kind, 3- stat, 4-toppath
1477
1286
# But we don't actually use 1-3 in pending, so set them to None
1478
pending = [[_selected_dir_reader.top_prefix_to_starting_dir(top, prefix)]]
1479
read_dir = _selected_dir_reader.read_dir
1480
_directory = _directory_kind
1287
pending = [(safe_utf8(prefix), None, None, None, safe_utf8(top))]
1482
relroot, _, _, _, top = pending[-1].pop()
1485
dirblock = sorted(read_dir(relroot, top))
1289
relroot, _, _, _, top = pending.pop()
1291
relprefix = relroot + '/'
1294
top_slash = top + '/'
1297
append = dirblock.append
1298
# read_dir supplies in should-stat order.
1299
for _, name in sorted(_listdir(top)):
1300
abspath = top_slash + name
1301
statvalue = _lstat(abspath)
1302
kind = _kind_from_mode(statvalue.st_mode & 0170000, 'unknown')
1303
append((relprefix + name, name, kind, statvalue, abspath))
1486
1305
yield (relroot, top), dirblock
1487
1307
# push the user specified dirs from dirblock
1488
next = [d for d in reversed(dirblock) if d[2] == _directory]
1490
pending.append(next)
1493
class UnicodeDirReader(DirReader):
1494
"""A dir reader for non-utf8 file systems, which transcodes."""
1496
__slots__ = ['_utf8_encode']
1499
self._utf8_encode = codecs.getencoder('utf8')
1501
def top_prefix_to_starting_dir(self, top, prefix=""):
1502
"""See DirReader.top_prefix_to_starting_dir."""
1503
return (safe_utf8(prefix), None, None, None, safe_unicode(top))
1505
def read_dir(self, prefix, top):
1506
"""Read a single directory from a non-utf8 file system.
1508
top, and the abspath element in the output are unicode, all other paths
1509
are utf8. Local disk IO is done via unicode calls to listdir etc.
1511
This is currently the fallback code path when the filesystem encoding is
1512
not UTF-8. It may be better to implement an alternative so that we can
1513
safely handle paths that are not properly decodable in the current
1516
See DirReader.read_dir for details.
1518
_utf8_encode = self._utf8_encode
1520
_listdir = os.listdir
1521
_kind_from_mode = file_kind_from_stat_mode
1524
relprefix = prefix + '/'
1308
pending.extend(d for d in reversed(dirblock) if d[2] == _directory)
1311
def _walkdirs_unicode_to_utf8(top, prefix=""):
1312
"""See _walkdirs_utf8
1314
Because Win32 has a Unicode api, all of the 'path-from-top' entries will be
1316
This is currently the fallback code path when the filesystem encoding is
1317
not UTF-8. It may be better to implement an alternative so that we can
1318
safely handle paths that are not properly decodable in the current
1321
_utf8_encode = codecs.getencoder('utf8')
1323
_directory = _directory_kind
1324
_listdir = os.listdir
1325
_kind_from_mode = _formats.get
1327
pending = [(safe_utf8(prefix), None, None, None, safe_unicode(top))]
1329
relroot, _, _, _, top = pending.pop()
1331
relprefix = relroot + '/'
1527
1334
top_slash = top + u'/'
1530
1337
append = dirblock.append
1531
1338
for name in sorted(_listdir(top)):
1533
name_utf8 = _utf8_encode(name)[0]
1534
except UnicodeDecodeError:
1535
raise errors.BadFilenameEncoding(
1536
_utf8_encode(relprefix)[0] + name, _fs_enc)
1339
name_utf8 = _utf8_encode(name)[0]
1537
1340
abspath = top_slash + name
1538
1341
statvalue = _lstat(abspath)
1539
kind = _kind_from_mode(statvalue.st_mode)
1342
kind = _kind_from_mode(statvalue.st_mode & 0170000, 'unknown')
1540
1343
append((relprefix + name_utf8, name_utf8, kind, statvalue, abspath))
1344
yield (relroot, top), dirblock
1346
# push the user specified dirs from dirblock
1347
pending.extend(d for d in reversed(dirblock) if d[2] == _directory)
1544
1350
def copy_tree(from_path, to_path, handlers={}):
1545
1351
"""Copy all of the entries in from_path into to_path.
1547
:param from_path: The base directory to copy.
1353
:param from_path: The base directory to copy.
1548
1354
:param to_path: The target directory. If it does not exist, it will
1550
1356
:param handlers: A dictionary of functions, which takes a source and
1702
1498
while len(b) < bytes:
1703
new = until_no_eintr(socket.recv, bytes - len(b))
1499
new = socket.recv(bytes - len(b))
1710
def send_all(socket, bytes, report_activity=None):
1506
def send_all(socket, bytes):
1711
1507
"""Send all bytes on a socket.
1713
1509
Regular socket.sendall() can give socket error 10053 on Windows. This
1714
1510
implementation sends no more than 64k at a time, which avoids this problem.
1716
:param report_activity: Call this as bytes are written, see
1717
Transport._report_activity
1719
1512
chunk_size = 2**16
1720
1513
for pos in xrange(0, len(bytes), chunk_size):
1721
block = bytes[pos:pos+chunk_size]
1722
if report_activity is not None:
1723
report_activity(len(block), 'write')
1724
until_no_eintr(socket.sendall, block)
1514
socket.sendall(bytes[pos:pos+chunk_size])
1727
1517
def dereference_path(path):
1772
1562
return open(filename, 'rU').read()
1775
def file_kind_from_stat_mode_thunk(mode):
1776
global file_kind_from_stat_mode
1777
if file_kind_from_stat_mode is file_kind_from_stat_mode_thunk:
1779
from bzrlib._readdir_pyx import UTF8DirReader
1780
file_kind_from_stat_mode = UTF8DirReader().kind_from_mode
1782
from bzrlib._readdir_py import (
1783
_kind_from_mode as file_kind_from_stat_mode
1785
return file_kind_from_stat_mode(mode)
1786
file_kind_from_stat_mode = file_kind_from_stat_mode_thunk
1789
def file_kind(f, _lstat=os.lstat):
1791
return file_kind_from_stat_mode(_lstat(f).st_mode)
1793
if getattr(e, 'errno', None) in (errno.ENOENT, errno.ENOTDIR):
1794
raise errors.NoSuchFile(f)
1798
def until_no_eintr(f, *a, **kw):
1799
"""Run f(*a, **kw), retrying if an EINTR error occurs."""
1800
# Borrowed from Twisted's twisted.python.util.untilConcludes function.
1804
except (IOError, OSError), e:
1805
if e.errno == errno.EINTR:
1809
def re_compile_checked(re_string, flags=0, where=""):
1810
"""Return a compiled re, or raise a sensible error.
1812
This should only be used when compiling user-supplied REs.
1814
:param re_string: Text form of regular expression.
1815
:param flags: eg re.IGNORECASE
1816
:param where: Message explaining to the user the context where
1817
it occurred, eg 'log search filter'.
1819
# from https://bugs.launchpad.net/bzr/+bug/251352
1821
re_obj = re.compile(re_string, flags)
1826
where = ' in ' + where
1827
# despite the name, 'error' is a type
1828
raise errors.BzrCommandError('Invalid regular expression%s: %r: %s'
1829
% (where, re_string, e))
1832
if sys.platform == "win32":
1835
return msvcrt.getch()
1840
fd = sys.stdin.fileno()
1841
settings = termios.tcgetattr(fd)
1844
ch = sys.stdin.read(1)
1846
termios.tcsetattr(fd, termios.TCSADRAIN, settings)
1850
if sys.platform == 'linux2':
1851
def _local_concurrency():
1853
prefix = 'processor'
1854
for line in file('/proc/cpuinfo', 'rb'):
1855
if line.startswith(prefix):
1856
concurrency = int(line[line.find(':')+1:]) + 1
1858
elif sys.platform == 'darwin':
1859
def _local_concurrency():
1860
return subprocess.Popen(['sysctl', '-n', 'hw.availcpu'],
1861
stdout=subprocess.PIPE).communicate()[0]
1862
elif sys.platform[0:7] == 'freebsd':
1863
def _local_concurrency():
1864
return subprocess.Popen(['sysctl', '-n', 'hw.ncpu'],
1865
stdout=subprocess.PIPE).communicate()[0]
1866
elif sys.platform == 'sunos5':
1867
def _local_concurrency():
1868
return subprocess.Popen(['psrinfo', '-p',],
1869
stdout=subprocess.PIPE).communicate()[0]
1870
elif sys.platform == "win32":
1871
def _local_concurrency():
1872
# This appears to return the number of cores.
1873
return os.environ.get('NUMBER_OF_PROCESSORS')
1875
def _local_concurrency():
1880
_cached_local_concurrency = None
1882
def local_concurrency(use_cache=True):
1883
"""Return how many processes can be run concurrently.
1885
Rely on platform specific implementations and default to 1 (one) if
1886
anything goes wrong.
1888
global _cached_local_concurrency
1889
if _cached_local_concurrency is not None and use_cache:
1890
return _cached_local_concurrency
1893
concurrency = _local_concurrency()
1894
except (OSError, IOError):
1897
concurrency = int(concurrency)
1898
except (TypeError, ValueError):
1901
_cached_concurrency = concurrency
1566
from bzrlib._readdir_pyx import read_dir as _read_dir
1568
from bzrlib._readdir_py import read_dir as _read_dir