14
14
# along with this program; if not, write to the Free Software
15
15
# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
17
from __future__ import absolute_import
20
from stat import (S_ISREG, S_ISDIR, S_ISLNK, ST_MODE, ST_SIZE,
21
S_ISCHR, S_ISBLK, S_ISFIFO, S_ISSOCK)
27
from .lazy_import import lazy_import
27
from bzrlib.lazy_import import lazy_import
28
28
lazy_import(globals(), """
29
29
from datetime import datetime
31
from ntpath import (abspath as _nt_abspath,
33
normpath as _nt_normpath,
34
realpath as _nt_realpath,
35
splitdrive as _nt_splitdrive,
35
# We need to import both shutil and rmtree as we export the later on posix
36
# and need the former on windows
38
from shutil import rmtree
41
# We need to import both tempfile and mkdtemp as we export the later on posix
42
# and need the former on windows
44
from tempfile import mkdtemp
45
from tempfile import (
52
from breezy.i18n import gettext
57
# sha and md5 modules are deprecated in python2.6 but hashlib is available as
59
if sys.version_info < (2, 5):
60
import md5 as _mod_md5
62
import sha as _mod_sha
72
from bzrlib import symbol_versioning
73
75
# Cross platform wall-clock time functionality with decent resolution.
83
85
# be opened in binary mode, rather than text mode.
84
86
# On other platforms, O_BINARY doesn't exist, because
85
87
# they always open in binary mode, so it is okay to
86
# OR with 0 on those platforms.
87
# O_NOINHERIT and O_TEXT exists only on win32 too.
88
# OR with 0 on those platforms
88
89
O_BINARY = getattr(os, 'O_BINARY', 0)
89
O_TEXT = getattr(os, 'O_TEXT', 0)
90
O_NOINHERIT = getattr(os, 'O_NOINHERIT', 0)
93
class UnsupportedTimezoneFormat(errors.BzrError):
95
_fmt = ('Unsupported timezone format "%(timezone)s", '
96
'options are "utc", "original", "local".')
98
def __init__(self, timezone):
99
self.timezone = timezone
102
92
def get_unicode_argv():
106
94
user_encoding = get_user_encoding()
107
95
return [a.decode(user_encoding) for a in sys.argv[1:]]
108
96
except UnicodeDecodeError:
109
raise errors.BzrError(gettext("Parameter {0!r} encoding is unsupported by {1} "
110
"application locale.").format(a, user_encoding))
97
raise errors.BzrError(("Parameter '%r' is unsupported by the current "
113
101
def make_readonly(filename):
114
102
"""Make a filename read-only."""
115
103
mod = os.lstat(filename).st_mode
116
104
if not stat.S_ISLNK(mod):
118
chmod_if_possible(filename, mod)
106
os.chmod(filename, mod)
121
109
def make_writable(filename):
122
110
mod = os.lstat(filename).st_mode
123
111
if not stat.S_ISLNK(mod):
125
chmod_if_possible(filename, mod)
128
def chmod_if_possible(filename, mode):
129
# Set file mode if that can be safely done.
130
# Sometimes even on unix the filesystem won't allow it - see
131
# https://bugs.launchpad.net/bzr/+bug/606537
133
# It is probably faster to just do the chmod, rather than
134
# doing a stat, and then trying to compare
135
os.chmod(filename, mode)
136
except (IOError, OSError) as e:
137
# Permission/access denied seems to commonly happen on smbfs; there's
138
# probably no point warning about it.
139
# <https://bugs.launchpad.net/bzr/+bug/606537>
140
if getattr(e, 'errno') in (errno.EPERM, errno.EACCES):
141
trace.mutter("ignore error on chmod of %r: %r" % (
113
os.chmod(filename, mod)
147
116
def minimum_path_selection(paths):
256
225
file_existed = False
258
227
rename_func(new, tmp_name)
259
except (errors.NoSuchFile,) as e:
228
except (errors.NoSuchFile,), e:
262
231
# RBC 20060103 abstraction leakage: the paramiko SFTP clients rename
263
232
# function raises an IOError with errno is None when a rename fails.
264
233
# This then gets caught here.
265
234
if e.errno not in (None, errno.ENOENT, errno.ENOTDIR):
267
except Exception as e:
268
237
if (getattr(e, 'errno', None) is None
269
238
or e.errno not in (errno.ENOENT, errno.ENOTDIR)):
272
241
file_existed = True
276
# This may throw an exception, in which case success will
278
rename_func(old, new)
280
except (IOError, OSError) as e:
281
# source and target may be aliases of each other (e.g. on a
282
# case-insensitive filesystem), so we may have accidentally renamed
283
# source by when we tried to rename target
284
if (file_existed and e.errno in (None, errno.ENOENT)
285
and old.lower() == new.lower()):
286
# source and target are the same file on a case-insensitive
287
# filesystem, so we don't generate an exception
247
# This may throw an exception, in which case success will
249
rename_func(old, new)
251
except (IOError, OSError), e:
252
# source and target may be aliases of each other (e.g. on a
253
# case-insensitive filesystem), so we may have accidentally renamed
254
# source by when we tried to rename target
255
failure_exc = sys.exc_info()
256
if (file_existed and e.errno in (None, errno.ENOENT)
257
and old.lower() == new.lower()):
258
# source and target are the same file on a case-insensitive
259
# filesystem, so we don't generate an exception
293
263
# If the file used to exist, rename it back into place
296
266
unlink_func(tmp_name)
298
268
rename_func(tmp_name, new)
269
if failure_exc is not None:
270
raise failure_exc[0], failure_exc[1], failure_exc[2]
301
273
# In Python 2.4.2 and older, os.path.abspath and os.path.realpath
302
274
# choke on a Unicode string containing a relative path if
303
275
# os.getcwd() returns a non-sys.getdefaultencoding()-encoded
277
_fs_enc = sys.getfilesystemencoding() or 'utf-8'
305
278
def _posix_abspath(path):
306
279
# jam 20060426 rather than encoding to fsencoding
307
280
# copy posixpath.abspath, but use os.getcwdu instead
308
281
if not posixpath.isabs(path):
309
282
path = posixpath.join(getcwd(), path)
310
return _posix_normpath(path)
283
return posixpath.normpath(path)
313
286
def _posix_realpath(path):
314
287
return posixpath.realpath(path.encode(_fs_enc)).decode(_fs_enc)
317
def _posix_normpath(path):
318
path = posixpath.normpath(path)
319
# Bug 861008: posixpath.normpath() returns a path normalized according to
320
# the POSIX standard, which stipulates (for compatibility reasons) that two
321
# leading slashes must not be simplified to one, and only if there are 3 or
322
# more should they be simplified as one. So we treat the leading 2 slashes
323
# as a special case here by simply removing the first slash, as we consider
324
# that breaking POSIX compatibility for this obscure feature is acceptable.
325
# This is not a paranoid precaution, as we notably get paths like this when
326
# the repo is hosted at the root of the filesystem, i.e. in "/".
327
if path.startswith('//'):
332
def _posix_path_from_environ(key):
333
"""Get unicode path from `key` in environment or None if not present
335
Note that posix systems use arbitrary byte strings for filesystem objects,
336
so a path that raises BadFilenameEncoding here may still be accessible.
338
val = os.environ.get(key, None)
339
if PY3 or val is None:
342
return val.decode(_fs_enc)
343
except UnicodeDecodeError:
344
# GZ 2011-12-12:Ideally want to include `key` in the exception message
345
raise errors.BadFilenameEncoding(val, _fs_enc)
348
def _posix_get_home_dir():
349
"""Get the home directory of the current user as a unicode path"""
350
path = posixpath.expanduser("~")
352
return path.decode(_fs_enc)
353
except AttributeError:
355
except UnicodeDecodeError:
356
raise errors.BadFilenameEncoding(path, _fs_enc)
359
def _posix_getuser_unicode():
360
"""Get username from environment or password database as unicode"""
361
name = getpass.getuser()
364
user_encoding = get_user_encoding()
366
return name.decode(user_encoding)
367
except UnicodeDecodeError:
368
raise errors.BzrError("Encoding of username %r is unsupported by %s "
369
"application locale." % (name, user_encoding))
372
290
def _win32_fixdrive(path):
373
291
"""Force drive letters to be consistent.
378
296
running python.exe under cmd.exe return capital C:\\
379
297
running win32 python inside a cygwin shell returns lowercase c:\\
381
drive, path = ntpath.splitdrive(path)
299
drive, path = _nt_splitdrive(path)
382
300
return drive.upper() + path
385
303
def _win32_abspath(path):
386
# Real ntpath.abspath doesn't have a problem with a unicode cwd
387
return _win32_fixdrive(ntpath.abspath(path).replace('\\', '/'))
304
# Real _nt_abspath doesn't have a problem with a unicode cwd
305
return _win32_fixdrive(_nt_abspath(unicode(path)).replace('\\', '/'))
308
def _win98_abspath(path):
309
"""Return the absolute version of a path.
310
Windows 98 safe implementation (python reimplementation
311
of Win32 API function GetFullPathNameW)
316
# \\HOST\path => //HOST/path
317
# //HOST/path => //HOST/path
318
# path => C:/cwd/path
321
# check for absolute path
322
drive = _nt_splitdrive(path)[0]
323
if drive == '' and path[:2] not in('//','\\\\'):
325
# we cannot simply os.path.join cwd and path
326
# because os.path.join('C:','/path') produce '/path'
327
# and this is incorrect
328
if path[:1] in ('/','\\'):
329
cwd = _nt_splitdrive(cwd)[0]
331
path = cwd + '\\' + path
332
return _win32_fixdrive(_nt_normpath(path).replace('\\', '/'))
390
335
def _win32_realpath(path):
391
# Real ntpath.realpath doesn't have a problem with a unicode cwd
392
return _win32_fixdrive(ntpath.realpath(path).replace('\\', '/'))
336
# Real _nt_realpath doesn't have a problem with a unicode cwd
337
return _win32_fixdrive(_nt_realpath(unicode(path)).replace('\\', '/'))
395
340
def _win32_pathjoin(*args):
396
return ntpath.join(*args).replace('\\', '/')
341
return _nt_join(*args).replace('\\', '/')
399
344
def _win32_normpath(path):
400
return _win32_fixdrive(ntpath.normpath(path).replace('\\', '/'))
345
return _win32_fixdrive(_nt_normpath(unicode(path)).replace('\\', '/'))
403
348
def _win32_getcwd():
404
return _win32_fixdrive(_getcwd().replace('\\', '/'))
349
return _win32_fixdrive(os.getcwdu().replace('\\', '/'))
407
352
def _win32_mkdtemp(*args, **kwargs):
429
374
def _mac_getcwd():
430
return unicodedata.normalize('NFC', _getcwd())
433
def _rename_wrap_exception(rename_func):
434
"""Adds extra information to any exceptions that come from rename().
436
The exception has an updated message and 'old_filename' and 'new_filename'
440
def _rename_wrapper(old, new):
442
rename_func(old, new)
444
detailed_error = OSError(e.errno, e.strerror +
445
" [occurred when renaming '%s' to '%s']" %
447
detailed_error.old_filename = old
448
detailed_error.new_filename = new
451
return _rename_wrapper
454
if sys.version_info > (3,):
460
# Default rename wraps os.rename()
461
rename = _rename_wrap_exception(os.rename)
375
return unicodedata.normalize('NFC', os.getcwdu())
463
378
# Default is to just use the python builtins, but these can be rebound on
464
379
# particular platforms.
465
380
abspath = _posix_abspath
466
381
realpath = _posix_realpath
467
382
pathjoin = os.path.join
468
normpath = _posix_normpath
469
path_from_environ = _posix_path_from_environ
470
_get_home_dir = _posix_get_home_dir
471
getuser_unicode = _posix_getuser_unicode
383
normpath = os.path.normpath
473
386
dirname = os.path.dirname
474
387
basename = os.path.basename
475
388
split = os.path.split
476
389
splitext = os.path.splitext
477
# These were already lazily imported into local scope
390
# These were already imported into local scope
478
391
# mkdtemp = tempfile.mkdtemp
479
392
# rmtree = shutil.rmtree
487
394
MIN_ABS_PATHLENGTH = 1
490
397
if sys.platform == 'win32':
491
abspath = _win32_abspath
398
if win32utils.winver == 'Windows 98':
399
abspath = _win98_abspath
401
abspath = _win32_abspath
492
402
realpath = _win32_realpath
493
403
pathjoin = _win32_pathjoin
494
404
normpath = _win32_normpath
495
405
getcwd = _win32_getcwd
496
406
mkdtemp = _win32_mkdtemp
497
rename = _rename_wrap_exception(_win32_rename)
499
from . import _walkdirs_win32
503
lstat = _walkdirs_win32.lstat
504
fstat = _walkdirs_win32.fstat
505
wrap_stat = _walkdirs_win32.wrap_stat
407
rename = _win32_rename
507
409
MIN_ABS_PATHLENGTH = 3
547
446
On my standard US Windows XP, the preferred encoding is
548
447
cp1252, but the console is cp437
550
:param trace: If True trace the selected encoding via mutter().
552
from .trace import mutter
449
from bzrlib.trace import mutter
553
450
output_encoding = getattr(sys.stdout, 'encoding', None)
554
451
if not output_encoding:
555
452
input_encoding = getattr(sys.stdin, 'encoding', None)
556
453
if not input_encoding:
557
454
output_encoding = get_user_encoding()
559
mutter('encoding stdout as osutils.get_user_encoding() %r',
455
mutter('encoding stdout as osutils.get_user_encoding() %r',
562
458
output_encoding = input_encoding
564
mutter('encoding stdout as sys.stdin encoding %r',
459
mutter('encoding stdout as sys.stdin encoding %r', output_encoding)
568
mutter('encoding stdout as sys.stdout encoding %r', output_encoding)
461
mutter('encoding stdout as sys.stdout encoding %r', output_encoding)
569
462
if output_encoding == 'cp0':
570
463
# invalid encoding (cp0 means 'no codepage' on Windows)
571
464
output_encoding = get_user_encoding()
573
mutter('cp0 is invalid encoding.'
465
mutter('cp0 is invalid encoding.'
574
466
' encoding stdout as osutils.get_user_encoding() %r',
578
470
codecs.lookup(output_encoding)
579
471
except LookupError:
580
sys.stderr.write('brz: warning:'
472
sys.stderr.write('bzr: warning:'
581
473
' unknown terminal encoding %s.\n'
582
474
' Using encoding %s instead.\n'
583
475
% (output_encoding, get_user_encoding())
977
857
"""Return size of given open file."""
978
return os.fstat(f.fileno())[stat.ST_SIZE]
981
# Alias os.urandom to support platforms (which?) without /dev/urandom and
982
# override if it doesn't work. Avoid checking on windows where there is
983
# significant initialisation cost that can be avoided for some bzr calls.
985
rand_bytes = os.urandom
987
if rand_bytes.__module__ != "nt":
858
return os.fstat(f.fileno())[ST_SIZE]
861
# Define rand_bytes based on platform.
863
# Python 2.4 and later have os.urandom,
864
# but it doesn't work on some arches
866
rand_bytes = os.urandom
867
except (NotImplementedError, AttributeError):
868
# If python doesn't have os.urandom, or it doesn't work,
869
# then try to first pull random data from /dev/urandom
990
except NotImplementedError:
871
rand_bytes = file('/dev/urandom', 'rb').read
872
# Otherwise, use this hack as a last resort
873
except (IOError, OSError):
991
874
# not well seeded, but better than nothing
992
875
def rand_bytes(n):
1065
945
implementation should be loaded instead::
1068
>>> import breezy._fictional_extension_pyx
948
>>> import bzrlib._fictional_extension_pyx
1069
949
>>> except ImportError, e:
1070
>>> breezy.osutils.failed_to_load_extension(e)
1071
>>> import breezy._fictional_extension_py
950
>>> bzrlib.osutils.failed_to_load_extension(e)
951
>>> import bzrlib._fictional_extension_py
1073
953
# NB: This docstring is just an example, not a doctest, because doctest
1074
954
# currently can't cope with the use of lazy imports in this namespace --
1077
957
# This currently doesn't report the failure at the time it occurs, because
1078
958
# they tend to happen very early in startup when we can't check config
1079
959
# files etc, and also we want to report all failures but not spam the user
1080
960
# with 10 warnings.
961
from bzrlib import trace
1081
962
exception_str = str(exception)
1082
963
if exception_str not in _extension_load_failures:
1083
964
trace.mutter("failed to load compiled extension: %s" % exception_str)
1087
968
def report_extension_load_failures():
1088
969
if not _extension_load_failures:
1090
if config.GlobalConfig().suppress_warning('missing_extensions'):
971
from bzrlib.config import GlobalConfig
972
if GlobalConfig().get_user_option_as_bool('ignore_missing_extensions'):
1092
974
# the warnings framework should by default show this only once
1093
from .trace import warning
975
from bzrlib.trace import warning
1095
"brz: warning: some compiled extensions could not be loaded; "
1096
"see ``brz help missing-extensions``")
977
"bzr: warning: some compiled extensions could not be loaded; "
978
"see <https://answers.launchpad.net/bzr/+faq/703>")
1097
979
# we no longer show the specific missing extensions here, because it makes
1098
980
# the message too long and scary - see
1099
981
# https://bugs.launchpad.net/bzr/+bug/430529
1103
from ._chunks_to_lines_pyx import chunks_to_lines
1104
except ImportError as e:
985
from bzrlib._chunks_to_lines_pyx import chunks_to_lines
986
except ImportError, e:
1105
987
failed_to_load_extension(e)
1106
from ._chunks_to_lines_py import chunks_to_lines
988
from bzrlib._chunks_to_lines_py import chunks_to_lines
1109
991
def split_lines(s):
1394
1256
return unicode_or_utf8_string.encode('utf-8')
1397
def safe_revision_id(unicode_or_utf8_string):
1259
_revision_id_warning = ('Unicode revision ids were deprecated in bzr 0.15.'
1260
' Revision id generators should be creating utf8'
1264
def safe_revision_id(unicode_or_utf8_string, warn=True):
1398
1265
"""Revision ids should now be utf8, but at one point they were unicode.
1400
1267
:param unicode_or_utf8_string: A possibly Unicode revision_id. (can also be
1269
:param warn: Functions that are sanitizing user data can set warn=False
1402
1270
:return: None or a utf8 revision id.
1404
1272
if (unicode_or_utf8_string is None
1405
or unicode_or_utf8_string.__class__ == bytes):
1273
or unicode_or_utf8_string.__class__ == str):
1406
1274
return unicode_or_utf8_string
1407
raise TypeError('Unicode revision ids are no longer supported. '
1408
'Revision id generators should be creating utf8 revision '
1412
def safe_file_id(unicode_or_utf8_string):
1276
symbol_versioning.warn(_revision_id_warning, DeprecationWarning,
1278
return cache_utf8.encode(unicode_or_utf8_string)
1281
_file_id_warning = ('Unicode file ids were deprecated in bzr 0.15. File id'
1282
' generators should be creating utf8 file ids.')
1285
def safe_file_id(unicode_or_utf8_string, warn=True):
1413
1286
"""File ids should now be utf8, but at one point they were unicode.
1415
1288
This is the same as safe_utf8, except it uses the cached encode functions
1474
1346
normalized_filename = _inaccessible_normalized_filename
1477
def set_signal_handler(signum, handler, restart_syscall=True):
1478
"""A wrapper for signal.signal that also calls siginterrupt(signum, False)
1479
on platforms that support that.
1481
:param restart_syscall: if set, allow syscalls interrupted by a signal to
1482
automatically restart (by calling `signal.siginterrupt(signum,
1483
False)`). May be ignored if the feature is not available on this
1484
platform or Python version.
1488
siginterrupt = signal.siginterrupt
1490
# This python implementation doesn't provide signal support, hence no
1493
except AttributeError:
1494
# siginterrupt doesn't exist on this platform, or for this version
1496
siginterrupt = lambda signum, flag: None
1498
def sig_handler(*args):
1499
# Python resets the siginterrupt flag when a signal is
1500
# received. <http://bugs.python.org/issue8354>
1501
# As a workaround for some cases, set it back the way we want it.
1502
siginterrupt(signum, False)
1503
# Now run the handler function passed to set_signal_handler.
1506
sig_handler = handler
1507
old_handler = signal.signal(signum, sig_handler)
1509
siginterrupt(signum, False)
1513
1349
default_terminal_width = 80
1514
1350
"""The default terminal width for ttys.
1530
1360
None is returned if the width can't established precisely.
1533
- if BRZ_COLUMNS is set, returns its value
1363
- if BZR_COLUMNS is set, returns its value
1534
1364
- if there is no controlling terminal, returns None
1535
- query the OS, if the queried size has changed since the last query,
1537
1365
- if COLUMNS is set, returns its value,
1538
- if the OS has a value (even though it's never changed), return its value.
1540
1367
From there, we need to query the OS to get the size of the controlling
1543
On Unices we query the OS by:
1544
1371
- get termios.TIOCGWINSZ
1545
1372
- if an error occurs or a negative value is obtained, returns None
1547
On Windows we query the OS by:
1548
1376
- win32utils.get_console_size() decides,
1549
1377
- returns None on error (provided default value)
1551
# Note to implementors: if changing the rules for determining the width,
1552
# make sure you've considered the behaviour in these cases:
1553
# - M-x shell in emacs, where $COLUMNS is set and TIOCGWINSZ returns 0,0.
1554
# - brz log | less, in bash, where $COLUMNS not set and TIOCGWINSZ returns
1556
# - (add more interesting cases here, if you find any)
1557
# Some programs implement "Use $COLUMNS (if set) until SIGWINCH occurs",
1558
# but we don't want to register a signal handler because it is impossible
1559
# to do so without risking EINTR errors in Python <= 2.6.5 (see
1560
# <http://bugs.python.org/issue8354>). Instead we check TIOCGWINSZ every
1561
# time so we can notice if the reported size has changed, which should have
1564
# If BRZ_COLUMNS is set, take it, user is always right
1565
# Except if they specified 0 in which case, impose no limit here
1380
# If BZR_COLUMNS is set, take it, user is always right
1567
width = int(os.environ['BRZ_COLUMNS'])
1382
return int(os.environ['BZR_COLUMNS'])
1568
1383
except (KeyError, ValueError):
1570
if width is not None:
1576
1386
isatty = getattr(sys.stdout, 'isatty', None)
1577
if isatty is None or not isatty():
1578
# Don't guess, setting BRZ_COLUMNS is the recommended way to override.
1387
if isatty is None or not isatty():
1388
# Don't guess, setting BZR_COLUMNS is the recommended way to override.
1582
width, height = os_size = _terminal_size(None, None)
1583
global _first_terminal_size, _terminal_size_state
1584
if _terminal_size_state == 'no_data':
1585
_first_terminal_size = os_size
1586
_terminal_size_state = 'unchanged'
1587
elif (_terminal_size_state == 'unchanged' and
1588
_first_terminal_size != os_size):
1589
_terminal_size_state = 'changed'
1591
# If the OS claims to know how wide the terminal is, and this value has
1592
# ever changed, use that.
1593
if _terminal_size_state == 'changed':
1594
if width is not None and width > 0:
1597
# If COLUMNS is set, use it.
1391
# If COLUMNS is set, take it, the terminal knows better (even inside a
1392
# given terminal, the application can decide to set COLUMNS to a lower
1393
# value (splitted screen) or a bigger value (scroll bars))
1599
1395
return int(os.environ['COLUMNS'])
1600
1396
except (KeyError, ValueError):
1603
# Finally, use an unchanged size from the OS, if we have one.
1604
if _terminal_size_state == 'unchanged':
1605
if width is not None and width > 0:
1399
width, height = _terminal_size(None, None)
1401
# Consider invalid values as meaning no width
1608
# The width could not be determined.
1612
1407
def _win32_terminal_size(width, height):
1639
1434
_terminal_size = _ioctl_terminal_size
1437
def _terminal_size_changed(signum, frame):
1438
"""Set COLUMNS upon receiving a SIGnal for WINdow size CHange."""
1439
width, height = _terminal_size(None, None)
1440
if width is not None:
1441
os.environ['COLUMNS'] = str(width)
1444
_registered_sigwinch = False
1446
def watch_sigwinch():
1447
"""Register for SIGWINCH, once and only once."""
1448
global _registered_sigwinch
1449
if not _registered_sigwinch:
1450
if sys.platform == 'win32':
1451
# Martin (gz) mentioned WINDOW_BUFFER_SIZE_RECORD from
1452
# ReadConsoleInput but I've no idea how to plug that in
1453
# the current design -- vila 20091216
1456
signal.signal(signal.SIGWINCH, _terminal_size_changed)
1457
_registered_sigwinch = True
1642
1460
def supports_executable():
1643
1461
return sys.platform != "win32"
1828
1646
global _selected_dir_reader
1829
1647
if _selected_dir_reader is None:
1830
if sys.platform == "win32":
1648
fs_encoding = _fs_enc.upper()
1649
if sys.platform == "win32" and win32utils.winver == 'Windows NT':
1650
# Win98 doesn't have unicode apis like FindFirstFileW
1651
# TODO: We possibly could support Win98 by falling back to the
1652
# original FindFirstFile, and using TCHAR instead of WCHAR,
1653
# but that gets a bit tricky, and requires custom compiling
1832
from ._walkdirs_win32 import Win32ReadDir
1656
from bzrlib._walkdirs_win32 import Win32ReadDir
1833
1657
_selected_dir_reader = Win32ReadDir()
1834
1658
except ImportError:
1836
elif _fs_enc in ('utf-8', 'ascii'):
1660
elif fs_encoding in ('UTF-8', 'US-ASCII', 'ANSI_X3.4-1968'):
1661
# ANSI_X3.4-1968 is a form of ASCII
1838
from ._readdir_pyx import UTF8DirReader
1663
from bzrlib._readdir_pyx import UTF8DirReader
1839
1664
_selected_dir_reader = UTF8DirReader()
1840
except ImportError as e:
1665
except ImportError, e:
1841
1666
failed_to_load_extension(e)
1955
1780
real_handlers[kind](abspath, relpath)
1958
def copy_ownership_from_path(dst, src=None):
1959
"""Copy usr/grp ownership from src file/dir to dst file/dir.
1961
If src is None, the containing directory is used as source. If chown
1962
fails, the error is ignored and a warning is printed.
1964
chown = getattr(os, 'chown', None)
1969
src = os.path.dirname(dst)
1975
chown(dst, s.st_uid, s.st_gid)
1976
except OSError as e:
1978
'Unable to copy ownership from "%s" to "%s". '
1979
'You may want to set it manually.', src, dst)
1980
trace.log_exception_quietly()
1983
1783
def path_prefix_key(path):
1984
1784
"""Generate a prefix-order path key for path.
1986
1786
This can be used to sort paths in the same way that walkdirs does.
1988
return (dirname(path), path)
1788
return (dirname(path) , path)
1991
1791
def compare_paths_prefix_order(path_a, path_b):
1998
1798
_cached_user_encoding = None
2001
def get_user_encoding():
1801
def get_user_encoding(use_cache=True):
2002
1802
"""Find out what the preferred user encoding is.
2004
1804
This is generally the encoding that is used for command line parameters
2005
1805
and file contents. This may be different from the terminal encoding
2006
1806
or the filesystem encoding.
1808
:param use_cache: Enable cache for detected encoding.
1809
(This parameter is turned on by default,
1810
and required only for selftesting)
2008
1812
:return: A string defining the preferred user encoding
2010
1814
global _cached_user_encoding
2011
if _cached_user_encoding is not None:
1815
if _cached_user_encoding is not None and use_cache:
2012
1816
return _cached_user_encoding
2014
if os.name == 'posix' and getattr(locale, 'CODESET', None) is not None:
2015
# Use the existing locale settings and call nl_langinfo directly
2016
# rather than going through getpreferredencoding. This avoids
2017
# <http://bugs.python.org/issue6202> on OSX Python 2.6 and the
2018
# possibility of the setlocale call throwing an error.
2019
user_encoding = locale.nl_langinfo(locale.CODESET)
1818
if sys.platform == 'darwin':
1819
# python locale.getpreferredencoding() always return
1820
# 'mac-roman' on darwin. That's a lie.
1821
sys.platform = 'posix'
1823
if os.environ.get('LANG', None) is None:
1824
# If LANG is not set, we end up with 'ascii', which is bad
1825
# ('mac-roman' is more than ascii), so we set a default which
1826
# will give us UTF-8 (which appears to work in all cases on
1827
# OSX). Users are still free to override LANG of course, as
1828
# long as it give us something meaningful. This work-around
1829
# *may* not be needed with python 3k and/or OSX 10.5, but will
1830
# work with them too -- vila 20080908
1831
os.environ['LANG'] = 'en_US.UTF-8'
1834
sys.platform = 'darwin'
2021
# GZ 2011-12-19: On windows could call GetACP directly instead.
2022
user_encoding = locale.getpreferredencoding(False)
2025
user_encoding = codecs.lookup(user_encoding).name
2027
if user_encoding not in ("", "cp0"):
2028
sys.stderr.write('brz: warning:'
1839
user_encoding = locale.getpreferredencoding()
1840
except locale.Error, e:
1841
sys.stderr.write('bzr: warning: %s\n'
1842
' Could not determine what text encoding to use.\n'
1843
' This error usually means your Python interpreter\n'
1844
' doesn\'t support the locale set by $LANG (%s)\n'
1845
" Continuing with ascii encoding.\n"
1846
% (e, os.environ.get('LANG')))
1847
user_encoding = 'ascii'
1849
# Windows returns 'cp0' to indicate there is no code page. So we'll just
1850
# treat that as ASCII, and not support printing unicode characters to the
1853
# For python scripts run under vim, we get '', so also treat that as ASCII
1854
if user_encoding in (None, 'cp0', ''):
1855
user_encoding = 'ascii'
1859
codecs.lookup(user_encoding)
1861
sys.stderr.write('bzr: warning:'
2029
1862
' unknown encoding %s.'
2030
1863
' Continuing with ascii encoding.\n'
2031
1864
% user_encoding
2033
user_encoding = 'ascii'
2035
# Get 'ascii' when setlocale has not been called or LANG=C or unset.
2036
if user_encoding == 'ascii':
2037
if sys.platform == 'darwin':
2038
# OSX is special-cased in Python to have a UTF-8 filesystem
2039
# encoding and previously had LANG set here if not present.
2040
user_encoding = 'utf-8'
2041
# GZ 2011-12-19: Maybe UTF-8 should be the default in this case
2042
# for some other posix platforms as well.
2044
_cached_user_encoding = user_encoding
1866
user_encoding = 'ascii'
1869
_cached_user_encoding = user_encoding
2045
1871
return user_encoding
2048
def get_diff_header_encoding():
2049
return get_terminal_encoding()
2052
1874
def get_host_name():
2053
1875
"""Return the current unicode host name.
2056
1878
behaves inconsistently on different platforms.
2058
1880
if sys.platform == "win32":
2059
1882
return win32utils.get_host_name()
2063
return socket.gethostname()
2064
1885
return socket.gethostname().decode(get_user_encoding())
2067
# We must not read/write any more than 64k at a time from/to a socket so we
2068
# don't risk "no buffer space available" errors on some platforms. Windows in
2069
# particular is likely to throw WSAECONNABORTED or WSAENOBUFS if given too much
2071
MAX_SOCKET_CHUNK = 64 * 1024
2073
_end_of_stream_errors = [errno.ECONNRESET, errno.EPIPE, errno.EINVAL]
2074
for _eno in ['WSAECONNRESET', 'WSAECONNABORTED']:
2075
_eno = getattr(errno, _eno, None)
2076
if _eno is not None:
2077
_end_of_stream_errors.append(_eno)
2081
def read_bytes_from_socket(sock, report_activity=None,
2082
max_read_size=MAX_SOCKET_CHUNK):
2083
"""Read up to max_read_size of bytes from sock and notify of progress.
2085
Translates "Connection reset by peer" into file-like EOF (return an
2086
empty string rather than raise an error), and repeats the recv if
2087
interrupted by a signal.
2091
data = sock.recv(max_read_size)
2092
except socket.error as e:
2094
if eno in _end_of_stream_errors:
2095
# The connection was closed by the other side. Callers expect
2096
# an empty string to signal end-of-stream.
2098
elif eno == errno.EINTR:
2099
# Retry the interrupted recv.
2103
if report_activity is not None:
2104
report_activity(len(data), 'read')
2108
def recv_all(socket, count):
1888
def recv_all(socket, bytes):
2109
1889
"""Receive an exact number of bytes.
2111
1891
Regular Socket.recv() may return less than the requested number of bytes,
2112
depending on what's in the OS buffer. MSG_WAITALL is not available
1892
dependning on what's in the OS buffer. MSG_WAITALL is not available
2113
1893
on all platforms, but this should work everywhere. This will return
2114
1894
less than the requested amount if the remote end closes.
2116
1896
This isn't optimized and is intended mostly for use in testing.
2119
while len(b) < count:
2120
new = read_bytes_from_socket(socket, None, count - len(b))
1899
while len(b) < bytes:
1900
new = until_no_eintr(socket.recv, bytes - len(b))
2127
def send_all(sock, bytes, report_activity=None):
    """Send all bytes on a socket.

    Breaks large blocks in smaller chunks to avoid buffering limitations on
    some platforms, and catches EINTR which may be thrown if the send is
    interrupted by a signal.

    This is preferred to socket.sendall(), because it avoids portability bugs
    and provides activity reporting.

    :param sock: Object providing a socket-style ``send(data)`` method.
    :param bytes: The data to send.
    :param report_activity: Call this as bytes are written, see
        Transport._report_activity
    :raises errors.ConnectionReset: If the send fails with one of
        ``_end_of_stream_errors``, or if ``send`` reports 0 bytes sent.
    """
    sent_total = 0
    byte_count = len(bytes)
    # Slicing a memoryview hands each chunk to send() without copying it.
    view = memoryview(bytes)
    while sent_total < byte_count:
        try:
            sent = sock.send(view[sent_total:sent_total+MAX_SOCKET_CHUNK])
        except (socket.error, IOError) as e:
            if e.args[0] in _end_of_stream_errors:
                raise errors.ConnectionReset(
                    "Error trying to write to socket", e)
            if e.args[0] != errno.EINTR:
                raise
            # EINTR: fall through and retry the same chunk.
        else:
            if sent == 0:
                raise errors.ConnectionReset('Sending to %s returned 0 bytes'
                                             % (sock,))
            sent_total += sent
            if report_activity is not None:
                report_activity(sent, 'write')
2161
def connect_socket(address):
    """Return a stream socket connected to address.

    :param address: A ``(host, port)`` pair.
    :return: The first socket that connects successfully.
    :raises socket.error: The most recent connection error, or a
        'getaddrinfo returns an empty list' error if there was nothing to
        try.
    """
    # Slight variation of the socket.create_connection() function (provided by
    # python-2.6) that can fail if getaddrinfo returns an empty list. We also
    # provide it for previous python versions. Also, we don't use the timeout
    # parameter (provided by the python implementation) so we don't implement
    # it either.
    err = socket.error('getaddrinfo returns an empty list')
    host, port = address
    for res in socket.getaddrinfo(host, port, 0, socket.SOCK_STREAM):
        af, socktype, proto, canonname, sa = res
        sock = None
        try:
            sock = socket.socket(af, socktype, proto)
            sock.connect(sa)
            return sock
        except socket.error as e:
            err = e
            # 'err' is now the most recent error
            if sock is not None:
                sock.close()
    raise err
2185
1924
def dereference_path(path):
2213
1952
If and when pkg_resources becomes a standard library, this routine
2214
1953
can delegate to it.
2216
# Check package name is within breezy
2217
if package == "breezy":
1955
# Check package name is within bzrlib
1956
if package == "bzrlib":
2218
1957
resource_relpath = resource_name
2219
elif package.startswith("breezy."):
2220
package = package[len("breezy."):].replace('.', os.sep)
1958
elif package.startswith("bzrlib."):
1959
package = package[len("bzrlib."):].replace('.', os.sep)
2221
1960
resource_relpath = pathjoin(package, resource_name)
2223
raise errors.BzrError('resource package %s not in breezy' % package)
1962
raise errors.BzrError('resource package %s not in bzrlib' % package)
2225
1964
# Map the resource to a file and read its contents
2226
base = dirname(breezy.__file__)
1965
base = dirname(bzrlib.__file__)
2227
1966
if getattr(sys, 'frozen', None): # bzr.exe
2228
1967
base = abspath(pathjoin(base, '..', '..'))
2229
with open(pathjoin(base, resource_relpath), "rU") as f:
1968
filename = pathjoin(base, resource_relpath)
1969
return open(filename, 'rU').read()
2232
1972
def file_kind_from_stat_mode_thunk(mode):
    """Bind the real file_kind_from_stat_mode on first use, then call it.

    The module-level name ``file_kind_from_stat_mode`` initially points at
    this thunk.  The first call rebinds it to the compiled implementation
    when that can be imported, otherwise to the pure-Python one, and then
    delegates to whichever was chosen.

    :param mode: Value passed straight through to the chosen implementation.
    :return: Whatever the chosen implementation returns for ``mode``.
    """
    global file_kind_from_stat_mode
    if file_kind_from_stat_mode is file_kind_from_stat_mode_thunk:
        try:
            from ._readdir_pyx import UTF8DirReader
            file_kind_from_stat_mode = UTF8DirReader().kind_from_mode
        except ImportError:
            # This is one time where we won't warn that an extension failed to
            # load. The extension is never available on Windows anyway.
            from ._readdir_py import (
                _kind_from_mode as file_kind_from_stat_mode
                )
    return file_kind_from_stat_mode(mode)
file_kind_from_stat_mode = file_kind_from_stat_mode_thunk
2247
def file_stat(f, _lstat=os.lstat):
    """Return the lstat result for f.

    :param f: Path to stat.
    :param _lstat: The stat function to call; defaults to os.lstat.
    :return: Whatever ``_lstat(f)`` returns.
    :raises errors.NoSuchFile: If the stat fails with ENOENT or ENOTDIR.
    :raises OSError: Any other OSError is re-raised unchanged.
    """
    try:
        return _lstat(f)
    except OSError as e:
        if getattr(e, 'errno', None) in (errno.ENOENT, errno.ENOTDIR):
            raise errors.NoSuchFile(f)
        raise
2256
def file_kind(f, _lstat=os.lstat):
    """Return the kind of file at f, derived from its stat mode.

    :param f: Path to inspect.
    :param _lstat: The stat function handed on to file_stat.
    :return: The result of file_kind_from_stat_mode for the file's st_mode.
    """
    stat_value = file_stat(f, _lstat)
    return file_kind_from_stat_mode(stat_value.st_mode)
2260
1997
def until_no_eintr(f, *a, **kw):
    """Run f(*a, **kw), retrying if an EINTR error occurs.

    WARNING: you must be certain that it is safe to retry the call repeatedly
    if EINTR does occur.  This is typically only true for low-level operations
    like os.read.  If in any doubt, don't use this.

    Keep in mind that this is not a complete solution to EINTR.  There is
    probably code in the Python standard library and other dependencies that
    may encounter EINTR if a signal arrives (and there is a signal handler
    for that signal).  So this function can reduce the impact for IO that
    breezy directly controls, but it is not a complete solution.

    :param f: The callable to run.
    :return: Whatever ``f(*a, **kw)`` returns.
    :raises IOError, OSError: Any such error whose errno is not EINTR is
        re-raised unchanged.
    """
    # Borrowed from Twisted's twisted.python.util.untilConcludes function.
    while True:
        try:
            return f(*a, **kw)
        except (IOError, OSError) as e:
            if e.errno == errno.EINTR:
                continue
            raise
2008
def re_compile_checked(re_string, flags=0, where=""):
2009
"""Return a compiled re, or raise a sensible error.
2011
This should only be used when compiling user-supplied REs.
2013
:param re_string: Text form of regular expression.
2014
:param flags: eg re.IGNORECASE
2015
:param where: Message explaining to the user the context where
2016
it occurred, eg 'log search filter'.
2018
# from https://bugs.launchpad.net/bzr/+bug/251352
2020
re_obj = re.compile(re_string, flags)
2025
where = ' in ' + where
2026
# despite the name 'error' is a type
2027
raise errors.BzrCommandError('Invalid regular expression%s: %r: %s'
2028
% (where, re_string, e))
2283
2031
if sys.platform == "win32":
2286
2034
return msvcrt.getch()
2291
2039
fd = sys.stdin.fileno()
2292
2040
settings = termios.tcgetattr(fd)
2297
2045
termios.tcsetattr(fd, termios.TCSADRAIN, settings)
2300
if sys.platform.startswith('linux'):
2049
if sys.platform == 'linux2':
2301
2050
def _local_concurrency():
2303
return os.sysconf('SC_NPROCESSORS_ONLN')
2304
except (ValueError, OSError, AttributeError):
2052
prefix = 'processor'
2053
for line in file('/proc/cpuinfo', 'rb'):
2054
if line.startswith(prefix):
2055
concurrency = int(line[line.find(':')+1:]) + 1
2306
2057
elif sys.platform == 'darwin':
2307
2058
def _local_concurrency():
2308
2059
return subprocess.Popen(['sysctl', '-n', 'hw.availcpu'],
2309
2060
stdout=subprocess.PIPE).communicate()[0]
2310
elif "bsd" in sys.platform:
2061
elif sys.platform[0:7] == 'freebsd':
2311
2062
def _local_concurrency():
2312
2063
return subprocess.Popen(['sysctl', '-n', 'hw.ncpu'],
2313
2064
stdout=subprocess.PIPE).communicate()[0]
2366
2112
self.encode = encode
2368
2114
def write(self, object):
    """Write object to the wrapped stream.

    A ``str`` is written as it is; anything else is first passed through
    ``self.encode`` with ``self.errors`` and the encoded data is written.
    """
    if isinstance(object, str):
        self.stream.write(object)
    else:
        data, _ = self.encode(object, self.errors)
        self.stream.write(data)
2375
if sys.platform == 'win32':
2376
def open_file(filename, mode='r', bufsize=-1):
2377
"""This function is used to override the ``open`` builtin.
2379
But it uses O_NOINHERIT flag so the file handle is not inherited by
2380
child processes. Deleting or renaming a closed file opened with this
2381
function is not blocking child processes.
2383
writing = 'w' in mode
2384
appending = 'a' in mode
2385
updating = '+' in mode
2386
binary = 'b' in mode
2389
# see http://msdn.microsoft.com/en-us/library/yeby3zcb%28VS.71%29.aspx
2390
# for flags for each modes.
2400
flags |= os.O_WRONLY
2401
flags |= os.O_CREAT | os.O_TRUNC
2406
flags |= os.O_WRONLY
2407
flags |= os.O_CREAT | os.O_APPEND
2412
flags |= os.O_RDONLY
2414
return os.fdopen(os.open(filename, flags), mode, bufsize)
2419
def available_backup_name(base, exists):
2420
"""Find a non-existing backup file name.
2422
This will *not* create anything; it only returns a 'free' entry. This
2423
should be used for checking names in a directory below a locked
2424
tree/branch/repo to avoid race conditions. This is LBYL (Look Before You
2425
Leap) and generally discouraged.
2427
:param base: The base name.
2429
:param exists: A callable returning True if the path parameter exists.
2432
name = "%s.~%d~" % (base, counter)
2435
name = "%s.~%d~" % (base, counter)
2439
def set_fd_cloexec(fd):
    """Set a Unix file descriptor's FD_CLOEXEC flag.  Do nothing if platform
    support for this is not available.

    :param fd: The file descriptor to modify.
    """
    try:
        # Imported here so that a missing fcntl module is caught below.
        import fcntl
        old = fcntl.fcntl(fd, fcntl.F_GETFD)
        fcntl.fcntl(fd, fcntl.F_SETFD, old | fcntl.FD_CLOEXEC)
    except (ImportError, AttributeError):
        # Either the fcntl module or specific constants are not present
        pass
2452
def find_executable_on_path(name):
2453
"""Finds an executable on the PATH.
2455
On Windows, this will try to append each extension in the PATHEXT
2456
environment variable to the name, if it cannot be found with the name
2459
:param name: The base name of the executable.
2460
:return: The path to the executable found or None.
2462
if sys.platform == 'win32':
2463
exts = os.environ.get('PATHEXT', '').split(os.pathsep)
2464
exts = [ext.lower() for ext in exts]
2465
base, ext = os.path.splitext(name)
2467
if ext.lower() not in exts:
2473
path = os.environ.get('PATH')
2474
if path is not None:
2475
path = path.split(os.pathsep)
2478
f = os.path.join(d, name) + ext
2479
if os.access(f, os.X_OK):
2481
if sys.platform == 'win32':
2482
app_path = win32utils.get_app_path(name)
2483
if app_path != name:
2488
def _posix_is_local_pid_dead(pid):
    """True if pid doesn't correspond to live process on this machine

    :param pid: Process id to probe.
    :return: True only when the probe fails with ESRCH; False when the
        process exists or when the outcome is unclear.
    """
    try:
        # Special meaning of unix kill: just check if it's there.
        os.kill(pid, 0)
    except OSError as e:
        if e.errno == errno.ESRCH:
            # On this machine, and really not found: as sure as we can be
            # that it's dead.
            return True
        elif e.errno == errno.EPERM:
            # exists, though not ours
            return False
        else:
            mutter("os.kill(%d, 0) failed: %s" % (pid, e))
            # Don't really know.
            return False
    else:
        # Exists and our process: not dead.
        return False
2509
# Pick the liveness check for the running platform: the win32utils version
# on Windows, the os.kill based probe everywhere else.
if sys.platform == "win32":
    is_local_pid_dead = win32utils.is_local_pid_dead
else:
    is_local_pid_dead = _posix_is_local_pid_dead
2514
# Names of errno codes that fdatasync() is allowed to swallow.  They are kept
# as names because not every platform's errno module defines all of them.
_maybe_ignored = ['EAGAIN', 'EINTR', 'ENOTSUP', 'EOPNOTSUPP', 'EACCES']
# The numeric codes for whichever of those names exist on this platform.
_fdatasync_ignored = [getattr(errno, name) for name in _maybe_ignored
                      if getattr(errno, name, None) is not None]
2519
def fdatasync(fileno):
    """Flush file contents to disk if possible.

    Uses os.fdatasync when the platform has it, else os.fsync, and does
    nothing when neither exists.

    :param fileno: Integer OS file handle.
    :raises IOError: If the flush fails with an errno that is not listed in
        ``_fdatasync_ignored``.

    NOTE(review): earlier documentation listed TransportNotPossible as the
    error raised here; nothing in this function raises it - confirm against
    callers.
    """
    fn = getattr(os, 'fdatasync', getattr(os, 'fsync', None))
    if fn is not None:
        try:
            fn(fileno)
        except IOError as e:
            # See bug #1075108, on some platforms fdatasync exists, but can
            # raise ENOTSUP. However, we are calling fdatasync to be helpful
            # and reduce the chance of corruption-on-powerloss situations. It
            # is not a mandatory call, so it is ok to suppress failures.
            trace.mutter("ignoring error calling fdatasync: %s" % (e,))
            if getattr(e, 'errno', None) not in _fdatasync_ignored:
                raise
2539
def ensure_empty_directory_exists(path, exception_class):
    """Make sure a local directory exists and is empty.

    If it does not exist, it is created.  If it exists and is not empty, an
    instance of exception_class is raised.

    :param path: Local path of the directory.
    :param exception_class: Callable invoked as ``exception_class(path)`` to
        build the exception raised for a non-empty directory.
    :raises OSError: If creating the directory fails for any reason other
        than it already existing.
    """
    try:
        os.mkdir(path)
    except OSError as e:
        if e.errno != errno.EEXIST:
            raise
        # The path was already there: it is only acceptable when empty.
        if os.listdir(path):
            raise exception_class(path)
2554
def is_environment_error(evalue):
2555
"""True if exception instance is due to a process environment issue
2557
This includes OSError and IOError, but also other errors that come from
2558
the operating system or core libraries but are not subclasses of those.
2560
if isinstance(evalue, (EnvironmentError, select.error)):
2562
if sys.platform == "win32" and win32utils._is_pywintypes_error(evalue):