bzr branch
http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar
| 2255.7.32
by John Arbash Meinel Add tests that the walkdirs variants work on unicode paths. | 1 | # Copyright (C) 2005, 2006, 2007 Canonical Ltd
 | 
| 1185.1.41
by Robert Collins massive patch from Alexander Belchenko - many PEP8 fixes, removes unused function uuid | 2 | #
 | 
| 1
by mbp at sourcefrog import from baz patch-364 | 3 | # This program is free software; you can redistribute it and/or modify
 | 
| 4 | # it under the terms of the GNU General Public License as published by
 | |
| 5 | # the Free Software Foundation; either version 2 of the License, or
 | |
| 6 | # (at your option) any later version.
 | |
| 1185.1.41
by Robert Collins massive patch from Alexander Belchenko - many PEP8 fixes, removes unused function uuid | 7 | #
 | 
| 1
by mbp at sourcefrog import from baz patch-364 | 8 | # This program is distributed in the hope that it will be useful,
 | 
| 9 | # but WITHOUT ANY WARRANTY; without even the implied warranty of
 | |
| 10 | # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 | |
| 11 | # GNU General Public License for more details.
 | |
| 1185.1.41
by Robert Collins massive patch from Alexander Belchenko - many PEP8 fixes, removes unused function uuid | 12 | #
 | 
| 1
by mbp at sourcefrog import from baz patch-364 | 13 | # You should have received a copy of the GNU General Public License
 | 
| 14 | # along with this program; if not, write to the Free Software
 | |
| 15 | # Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
 | |
| 16 | ||
| 1390
by Robert Collins pair programming worx... merge integration and weave | 17 | from cStringIO import StringIO | 
| 1996.3.14
by John Arbash Meinel lazy_import osutils and sign_my_commits | 18 | import os | 
| 19 | import re | |
| 20 | import stat | |
| 21 | from stat import (S_ISREG, S_ISDIR, S_ISLNK, ST_MODE, ST_SIZE, | |
| 22 | S_ISCHR, S_ISBLK, S_ISFIFO, S_ISSOCK) | |
| 23 | import sys | |
| 24 | import time | |
| 25 | ||
| 26 | from bzrlib.lazy_import import lazy_import | |
| 27 | lazy_import(globals(), """ | |
| 2192.1.1
by Alexander Belchenko Before actually using encoding need to check that Python has corresponding codec | 28 | import codecs
 | 
| 2215.6.1
by James Henstridge Don't rely on time.timezone and time.altzone in local_time_offset(), | 29 | from datetime import datetime
 | 
| 1185.1.41
by Robert Collins massive patch from Alexander Belchenko - many PEP8 fixes, removes unused function uuid | 30 | import errno
 | 
| 1711.4.5
by John Arbash Meinel the _posix_* routines should use posixpath not os.path, so tests pass on win32 | 31 | from ntpath import (abspath as _nt_abspath,
 | 
| 32 |                     join as _nt_join,
 | |
| 33 |                     normpath as _nt_normpath,
 | |
| 34 |                     realpath as _nt_realpath,
 | |
| 1711.5.2
by John Arbash Meinel win32 likes to return lowercase drive letters sometimes, and uppercase at other times. normalize this | 35 |                     splitdrive as _nt_splitdrive,
 | 
| 1711.4.5
by John Arbash Meinel the _posix_* routines should use posixpath not os.path, so tests pass on win32 | 36 |                     )
 | 
| 37 | import posixpath
 | |
| 1236
by Martin Pool - fix up imports | 38 | import sha
 | 
| 1692.7.6
by Martin Pool [patch] force deletion of trees containing readonly files (alexander) | 39 | import shutil
 | 
| 1996.3.14
by John Arbash Meinel lazy_import osutils and sign_my_commits | 40 | from shutil import (
 | 
| 41 |     rmtree,
 | |
| 42 |     )
 | |
| 1185.31.40
by John Arbash Meinel Added osutils.mkdtemp() | 43 | import tempfile
 | 
| 1996.3.14
by John Arbash Meinel lazy_import osutils and sign_my_commits | 44 | from tempfile import (
 | 
| 45 |     mkdtemp,
 | |
| 46 |     )
 | |
| 1185.85.75
by John Arbash Meinel Adding bzrlib.osutils.unicode_filename to handle unicode normalization for file paths. | 47 | import unicodedata
 | 
| 1996.3.25
by John Arbash Meinel Make importing errors lazy for osutils | 48 | |
| 49 | from bzrlib import (
 | |
| 2249.5.16
by John Arbash Meinel [merge] bzr.dev 2283 | 50 |     cache_utf8,
 | 
| 1996.3.25
by John Arbash Meinel Make importing errors lazy for osutils | 51 |     errors,
 | 
| 2245.4.6
by Alexander Belchenko osutils.py: terminal_width() now use win32utils.get_console_size() | 52 |     win32utils,
 | 
| 1996.3.25
by John Arbash Meinel Make importing errors lazy for osutils | 53 |     )
 | 
| 1996.3.14
by John Arbash Meinel lazy_import osutils and sign_my_commits | 54 | """) | 
| 1
by mbp at sourcefrog import from baz patch-364 | 55 | |
| 3504.4.1
by John Arbash Meinel Write an alternative 'walkdirs' implementation that uses win32 apis. | 56 | |
| 1185.1.41
by Robert Collins massive patch from Alexander Belchenko - many PEP8 fixes, removes unused function uuid | 57 | import bzrlib | 
| 2309.4.3
by John Arbash Meinel (broken) change safe_*_id to emit a warning. | 58 | from bzrlib import symbol_versioning | 
| 1996.3.14
by John Arbash Meinel lazy_import osutils and sign_my_commits | 59 | from bzrlib.symbol_versioning import ( | 
| 60 | deprecated_function, | |
| 61 |     )
 | |
| 694
by Martin Pool - weed out all remaining calls to bailout() and remove the function | 62 | from bzrlib.trace import mutter | 
| 1185.1.41
by Robert Collins massive patch from Alexander Belchenko - many PEP8 fixes, removes unused function uuid | 63 | |
| 1
by mbp at sourcefrog import from baz patch-364 | 64 | |
| 1755.3.7
by John Arbash Meinel Clean up and write tests for permissions. Now we use fstat which should be cheap, and lets us check the permissions and the file size | 65 | # On win32, O_BINARY is used to indicate the file should
 | 
| 66 | # be opened in binary mode, rather than text mode.
 | |
| 67 | # On other platforms, O_BINARY doesn't exist, because
 | |
| 68 | # they always open in binary mode, so it is okay to
 | |
| 69 | # OR with 0 on those platforms
 | |
| 70 | O_BINARY = getattr(os, 'O_BINARY', 0) | |
| 71 | ||
| 72 | ||
| 1
by mbp at sourcefrog import from baz patch-364 | 73 | def make_readonly(filename): | 
| 74 | """Make a filename read-only.""" | |
| 2949.6.1
by Alexander Belchenko windows python has os.lstat | 75 | mod = os.lstat(filename).st_mode | 
| 2568.1.1
by John Arbash Meinel (Elliot Murphy) Use os.lstat rather than os.stat for osutils.make_readonly/make_writeable | 76 | if not stat.S_ISLNK(mod): | 
| 77 | mod = mod & 0777555 | |
| 78 | os.chmod(filename, mod) | |
| 1
by mbp at sourcefrog import from baz patch-364 | 79 | |
| 80 | ||
| 81 | def make_writable(filename): | |
| 2949.6.1
by Alexander Belchenko windows python has os.lstat | 82 | mod = os.lstat(filename).st_mode | 
| 2568.1.1
by John Arbash Meinel (Elliot Murphy) Use os.lstat rather than os.stat for osutils.make_readonly/make_writeable | 83 | if not stat.S_ISLNK(mod): | 
| 84 | mod = mod | 0200 | |
| 85 | os.chmod(filename, mod) | |
| 1
by mbp at sourcefrog import from baz patch-364 | 86 | |
| 87 | ||
| 2825.7.1
by Robert Collins * Partial commits are now approximately 40% faster by walking over the | 88 | def minimum_path_selection(paths): | 
| 89 | """Return the smallset subset of paths which are outside paths. | |
| 90 | ||
| 2843.1.1
by Ian Clatworthy Faster partial commits by walking less data (Robert Collins) | 91 |     :param paths: A container (and hence not None) of paths.
 | 
| 2825.7.1
by Robert Collins * Partial commits are now approximately 40% faster by walking over the | 92 |     :return: A set of paths sufficient to include everything in paths via
 | 
| 93 |         is_inside_any, drawn from the paths parameter.
 | |
| 94 |     """
 | |
| 95 | search_paths = set() | |
| 96 | paths = set(paths) | |
| 97 | for path in paths: | |
| 2843.1.1
by Ian Clatworthy Faster partial commits by walking less data (Robert Collins) | 98 | other_paths = paths.difference([path]) | 
| 2825.7.1
by Robert Collins * Partial commits are now approximately 40% faster by walking over the | 99 | if not is_inside_any(other_paths, path): | 
| 100 |             # this is a top level path, we must check it.
 | |
| 101 | search_paths.add(path) | |
| 102 | return search_paths | |
| 103 | ||
| 104 | ||
| 1077
by Martin Pool - avoid compiling REs at module load time | 105 | _QUOTE_RE = None | 
| 969
by Martin Pool - Add less-sucky is_within_any | 106 | |
| 107 | ||
| 1
by mbp at sourcefrog import from baz patch-364 | 108 | def quotefn(f): | 
| 779
by Martin Pool - better quotefn for windows: use doublequotes for strings with | 109 | """Return a quoted filename filename | 
| 110 | ||
| 111 |     This previously used backslash quoting, but that works poorly on
 | |
| 112 |     Windows."""
 | |
| 113 |     # TODO: I'm not really sure this is the best format either.x
 | |
| 1077
by Martin Pool - avoid compiling REs at module load time | 114 | global _QUOTE_RE | 
| 1963.2.6
by Robey Pointer pychecker is on crack; go back to using 'is None'. | 115 | if _QUOTE_RE is None: | 
| 1185.1.41
by Robert Collins massive patch from Alexander Belchenko - many PEP8 fixes, removes unused function uuid | 116 | _QUOTE_RE = re.compile(r'([^a-zA-Z0-9.,:/\\_~-])') | 
| 1077
by Martin Pool - avoid compiling REs at module load time | 117 | |
| 779
by Martin Pool - better quotefn for windows: use doublequotes for strings with | 118 | if _QUOTE_RE.search(f): | 
| 119 | return '"' + f + '"' | |
| 120 | else: | |
| 121 | return f | |
| 1
by mbp at sourcefrog import from baz patch-364 | 122 | |
| 123 | ||
| 1753.1.1
by Robert Collins (rbc, jam, mbp)Add bzrlib.osutils.walkdirs, an optimised walk-and-stat routine. | 124 | _directory_kind = 'directory' | 
| 125 | ||
| 1732.1.10
by John Arbash Meinel Updated version of file_kind. Rather than multiple function calls, one mask + dictionary lookup | 126 | _formats = { | 
| 1753.1.1
by Robert Collins (rbc, jam, mbp)Add bzrlib.osutils.walkdirs, an optimised walk-and-stat routine. | 127 | stat.S_IFDIR:_directory_kind, | 
| 1732.1.10
by John Arbash Meinel Updated version of file_kind. Rather than multiple function calls, one mask + dictionary lookup | 128 | stat.S_IFCHR:'chardev', | 
| 129 | stat.S_IFBLK:'block', | |
| 130 | stat.S_IFREG:'file', | |
| 131 | stat.S_IFIFO:'fifo', | |
| 132 | stat.S_IFLNK:'symlink', | |
| 133 | stat.S_IFSOCK:'socket', | |
| 134 | }
 | |
| 1753.1.1
by Robert Collins (rbc, jam, mbp)Add bzrlib.osutils.walkdirs, an optimised walk-and-stat routine. | 135 | |
| 136 | ||
| 137 | def file_kind_from_stat_mode(stat_mode, _formats=_formats, _unknown='unknown'): | |
| 138 | """Generate a file kind from a stat mode. This is used in walkdirs. | |
| 139 | ||
| 140 |     Its performance is critical: Do not mutate without careful benchmarking.
 | |
| 141 |     """
 | |
| 1732.1.12
by John Arbash Meinel improve bzrlib.osutils.file_kind performance from 324ms => 275ms | 142 | try: | 
| 1753.1.1
by Robert Collins (rbc, jam, mbp)Add bzrlib.osutils.walkdirs, an optimised walk-and-stat routine. | 143 | return _formats[stat_mode & 0170000] | 
| 1732.1.12
by John Arbash Meinel improve bzrlib.osutils.file_kind performance from 324ms => 275ms | 144 | except KeyError: | 
| 1732.1.30
by John Arbash Meinel More file_kind tweaks. Use keyword parameters to make everything a local variable. | 145 | return _unknown | 
| 488
by Martin Pool - new helper function kind_marker() | 146 | |
| 147 | ||
| 1753.1.1
by Robert Collins (rbc, jam, mbp)Add bzrlib.osutils.walkdirs, an optimised walk-and-stat routine. | 148 | def file_kind(f, _lstat=os.lstat, _mapper=file_kind_from_stat_mode): | 
| 1757.2.4
by Robert Collins Teach file_kind about NoSuchFile, reducing duplicate code, and add user files before entering the main loop in smart_add. | 149 | try: | 
| 150 | return _mapper(_lstat(f).st_mode) | |
| 151 | except OSError, e: | |
| 3146.8.18
by Aaron Bentley Merge with dev | 152 | if getattr(e, 'errno', None) in (errno.ENOENT, errno.ENOTDIR): | 
| 1996.3.14
by John Arbash Meinel lazy_import osutils and sign_my_commits | 153 | raise errors.NoSuchFile(f) | 
| 1757.2.4
by Robert Collins Teach file_kind about NoSuchFile, reducing duplicate code, and add user files before entering the main loop in smart_add. | 154 |         raise
 | 
| 155 | ||
| 1753.1.1
by Robert Collins (rbc, jam, mbp)Add bzrlib.osutils.walkdirs, an optimised walk-and-stat routine. | 156 | |
| 1755.3.7
by John Arbash Meinel Clean up and write tests for permissions. Now we use fstat which should be cheap, and lets us check the permissions and the file size | 157 | def get_umask(): | 
| 158 | """Return the current umask""" | |
| 159 |     # Assume that people aren't messing with the umask while running
 | |
| 160 |     # XXX: This is not thread safe, but there is no way to get the
 | |
| 161 |     #      umask without setting it
 | |
| 162 | umask = os.umask(0) | |
| 163 | os.umask(umask) | |
| 164 | return umask | |
| 165 | ||
| 166 | ||
| 2324.2.1
by Dmitry Vasiliev kind_marker() optimization | 167 | _kind_marker_map = { | 
| 168 | "file": "", | |
| 169 | _directory_kind: "/", | |
| 170 | "symlink": "@", | |
| 1551.10.30
by Aaron Bentley Merge from bzr.dev | 171 | 'tree-reference': '+', | 
| 2324.2.1
by Dmitry Vasiliev kind_marker() optimization | 172 | }
 | 
| 1551.10.30
by Aaron Bentley Merge from bzr.dev | 173 | |
| 174 | ||
| 488
by Martin Pool - new helper function kind_marker() | 175 | def kind_marker(kind): | 
| 2324.2.1
by Dmitry Vasiliev kind_marker() optimization | 176 | try: | 
| 177 | return _kind_marker_map[kind] | |
| 178 | except KeyError: | |
| 1996.3.25
by John Arbash Meinel Make importing errors lazy for osutils | 179 | raise errors.BzrError('invalid file kind %r' % kind) | 
| 1
by mbp at sourcefrog import from baz patch-364 | 180 | |
| 2324.2.1
by Dmitry Vasiliev kind_marker() optimization | 181 | |
| 1732.1.2
by John Arbash Meinel just use os.path.lexists if it exists | 182 | lexists = getattr(os.path, 'lexists', None) | 
| 183 | if lexists is None: | |
| 184 | def lexists(f): | |
| 185 | try: | |
| 2324.2.2
by Dmitry Vasiliev Fixed lexists() implementation | 186 | stat = getattr(os, 'lstat', os.stat) | 
| 187 | stat(f) | |
| 1732.1.2
by John Arbash Meinel just use os.path.lexists if it exists | 188 | return True | 
| 2324.2.2
by Dmitry Vasiliev Fixed lexists() implementation | 189 | except OSError, e: | 
| 1732.1.2
by John Arbash Meinel just use os.path.lexists if it exists | 190 | if e.errno == errno.ENOENT: | 
| 191 | return False; | |
| 192 | else: | |
| 1996.3.25
by John Arbash Meinel Make importing errors lazy for osutils | 193 | raise errors.BzrError("lstat/stat of (%r): %r" % (f, e)) | 
| 1732.1.2
by John Arbash Meinel just use os.path.lexists if it exists | 194 | |
| 1
by mbp at sourcefrog import from baz patch-364 | 195 | |
| 1185.31.47
by John Arbash Meinel Added a fancy footwork rename to osutils, made SftpTransport use it. | 196 | def fancy_rename(old, new, rename_func, unlink_func): | 
| 197 | """A fancy rename, when you don't have atomic rename. | |
| 198 |     
 | |
| 199 |     :param old: The old path, to rename from
 | |
| 200 |     :param new: The new path, to rename to
 | |
| 201 |     :param rename_func: The potentially non-atomic rename function
 | |
| 202 |     :param unlink_func: A way to delete the target file if the full rename succeeds
 | |
| 203 |     """
 | |
| 204 | ||
| 205 |     # sftp rename doesn't allow overwriting, so play tricks:
 | |
| 206 | import random | |
| 207 | base = os.path.basename(new) | |
| 208 | dirname = os.path.dirname(new) | |
| 1553.5.22
by Martin Pool Change fancy_rename to use rand_chars rather than reinvent it. | 209 | tmp_name = u'tmp.%s.%.9f.%d.%s' % (base, time.time(), os.getpid(), rand_chars(10)) | 
| 1185.31.47
by John Arbash Meinel Added a fancy footwork rename to osutils, made SftpTransport use it. | 210 | tmp_name = pathjoin(dirname, tmp_name) | 
| 211 | ||
| 212 |     # Rename the file out of the way, but keep track if it didn't exist
 | |
| 213 |     # We don't want to grab just any exception
 | |
| 214 |     # something like EACCES should prevent us from continuing
 | |
| 215 |     # The downside is that the rename_func has to throw an exception
 | |
| 216 |     # with an errno = ENOENT, or NoSuchFile
 | |
| 217 | file_existed = False | |
| 218 | try: | |
| 219 | rename_func(new, tmp_name) | |
| 1996.3.25
by John Arbash Meinel Make importing errors lazy for osutils | 220 | except (errors.NoSuchFile,), e: | 
| 1185.31.47
by John Arbash Meinel Added a fancy footwork rename to osutils, made SftpTransport use it. | 221 |         pass
 | 
| 1532
by Robert Collins Merge in John Meinels integration branch. | 222 | except IOError, e: | 
| 223 |         # RBC 20060103 abstraction leakage: the paramiko SFTP clients rename
 | |
| 1963.2.6
by Robey Pointer pychecker is on crack; go back to using 'is None'. | 224 |         # function raises an IOError with errno is None when a rename fails.
 | 
| 1532
by Robert Collins Merge in John Meinels integration branch. | 225 |         # This then gets caught here.
 | 
| 1185.50.37
by John Arbash Meinel Fixed exception handling for fancy_rename | 226 | if e.errno not in (None, errno.ENOENT, errno.ENOTDIR): | 
| 1532
by Robert Collins Merge in John Meinels integration branch. | 227 |             raise
 | 
| 1185.31.47
by John Arbash Meinel Added a fancy footwork rename to osutils, made SftpTransport use it. | 228 | except Exception, e: | 
| 1963.2.6
by Robey Pointer pychecker is on crack; go back to using 'is None'. | 229 | if (getattr(e, 'errno', None) is None | 
| 1185.31.47
by John Arbash Meinel Added a fancy footwork rename to osutils, made SftpTransport use it. | 230 | or e.errno not in (errno.ENOENT, errno.ENOTDIR)): | 
| 231 |             raise
 | |
| 232 | else: | |
| 233 | file_existed = True | |
| 234 | ||
| 235 | success = False | |
| 236 | try: | |
| 2978.8.2
by Alexander Belchenko teach fancy_rename to handle change case renames in possible case-insensitive filesystem | 237 | try: | 
| 238 |             # This may throw an exception, in which case success will
 | |
| 239 |             # not be set.
 | |
| 240 | rename_func(old, new) | |
| 241 | success = True | |
| 242 | except (IOError, OSError), e: | |
| 2978.8.3
by Alexander Belchenko Aaron's review | 243 |             # source and target may be aliases of each other (e.g. on a
 | 
| 244 |             # case-insensitive filesystem), so we may have accidentally renamed
 | |
| 245 |             # source by when we tried to rename target
 | |
| 2978.8.4
by Alexander Belchenko fancy_rename: lower() test removed. | 246 | if not (file_existed and e.errno in (None, errno.ENOENT)): | 
| 2978.8.2
by Alexander Belchenko teach fancy_rename to handle change case renames in possible case-insensitive filesystem | 247 |                 raise
 | 
| 1185.31.47
by John Arbash Meinel Added a fancy footwork rename to osutils, made SftpTransport use it. | 248 | finally: | 
| 249 | if file_existed: | |
| 250 |             # If the file used to exist, rename it back into place
 | |
| 251 |             # otherwise just delete it from the tmp location
 | |
| 252 | if success: | |
| 1551.15.4
by Aaron Bentley Revert now-unnecessary changes | 253 | unlink_func(tmp_name) | 
| 1185.31.47
by John Arbash Meinel Added a fancy footwork rename to osutils, made SftpTransport use it. | 254 | else: | 
| 1185.31.49
by John Arbash Meinel Some corrections using the new osutils.rename. **ALL TESTS PASS** | 255 | rename_func(tmp_name, new) | 
| 1185.31.47
by John Arbash Meinel Added a fancy footwork rename to osutils, made SftpTransport use it. | 256 | |
| 1685.1.9
by John Arbash Meinel Updated LocalTransport so that it's base is now a URL rather than a local path. This helps consistency with all other functions. To do so, I added local_abspath() which returns the local path, and local_path_to/from_url | 257 | |
| 1685.1.20
by John Arbash Meinel More changes to get 'bzr branch' and 'bzr pull' to work | 258 | # In Python 2.4.2 and older, os.path.abspath and os.path.realpath
 | 
| 259 | # choke on a Unicode string containing a relative path if
 | |
| 260 | # os.getcwd() returns a non-sys.getdefaultencoding()-encoded
 | |
| 261 | # string.
 | |
| 2093.1.1
by John Arbash Meinel (Bart Teeuwisse) if sys.getfilesystemencoding() is None, use 'utf-8' | 262 | _fs_enc = sys.getfilesystemencoding() or 'utf-8' | 
| 1685.1.20
by John Arbash Meinel More changes to get 'bzr branch' and 'bzr pull' to work | 263 | def _posix_abspath(path): | 
| 1711.4.5
by John Arbash Meinel the _posix_* routines should use posixpath not os.path, so tests pass on win32 | 264 |     # jam 20060426 rather than encoding to fsencoding
 | 
| 265 |     # copy posixpath.abspath, but use os.getcwdu instead
 | |
| 266 | if not posixpath.isabs(path): | |
| 267 | path = posixpath.join(getcwd(), path) | |
| 268 | return posixpath.normpath(path) | |
| 1685.1.20
by John Arbash Meinel More changes to get 'bzr branch' and 'bzr pull' to work | 269 | |
| 270 | ||
| 271 | def _posix_realpath(path): | |
| 1711.4.5
by John Arbash Meinel the _posix_* routines should use posixpath not os.path, so tests pass on win32 | 272 | return posixpath.realpath(path.encode(_fs_enc)).decode(_fs_enc) | 
| 1685.1.20
by John Arbash Meinel More changes to get 'bzr branch' and 'bzr pull' to work | 273 | |
| 274 | ||
| 1711.5.2
by John Arbash Meinel win32 likes to return lowercase drive letters sometimes, and uppercase at other times. normalize this | 275 | def _win32_fixdrive(path): | 
| 276 | """Force drive letters to be consistent. | |
| 277 | ||
| 278 |     win32 is inconsistent whether it returns lower or upper case
 | |
| 279 |     and even if it was consistent the user might type the other
 | |
| 280 |     so we force it to uppercase
 | |
| 281 |     running python.exe under cmd.exe return capital C:\\
 | |
| 282 |     running win32 python inside a cygwin shell returns lowercase c:\\
 | |
| 283 |     """
 | |
| 284 | drive, path = _nt_splitdrive(path) | |
| 285 | return drive.upper() + path | |
| 286 | ||
| 287 | ||
| 1685.1.20
by John Arbash Meinel More changes to get 'bzr branch' and 'bzr pull' to work | 288 | def _win32_abspath(path): | 
| 1711.4.6
by John Arbash Meinel Removing hacks for _win32_abspath, on real win32 abspath handles unicode just fine, it doesn't handle encoding into 'mbcs' | 289 |     # Real _nt_abspath doesn't have a problem with a unicode cwd
 | 
| 1711.5.2
by John Arbash Meinel win32 likes to return lowercase drive letters sometimes, and uppercase at other times. normalize this | 290 | return _win32_fixdrive(_nt_abspath(unicode(path)).replace('\\', '/')) | 
| 1685.1.20
by John Arbash Meinel More changes to get 'bzr branch' and 'bzr pull' to work | 291 | |
| 292 | ||
| 2279.4.1
by Alexander Belchenko Reimplementation of ntpath.abspath in Python for Windows98: unicode safe, UNC path safe | 293 | def _win98_abspath(path): | 
| 294 | """Return the absolute version of a path. | |
| 295 |     Windows 98 safe implementation (python reimplementation
 | |
| 296 |     of Win32 API function GetFullPathNameW)
 | |
| 297 |     """
 | |
| 298 |     # Corner cases:
 | |
| 299 |     #   C:\path     => C:/path
 | |
| 300 |     #   C:/path     => C:/path
 | |
| 301 |     #   \\HOST\path => //HOST/path
 | |
| 302 |     #   //HOST/path => //HOST/path
 | |
| 303 |     #   path        => C:/cwd/path
 | |
| 304 |     #   /path       => C:/path
 | |
| 305 | path = unicode(path) | |
| 306 |     # check for absolute path
 | |
| 307 | drive = _nt_splitdrive(path)[0] | |
| 308 | if drive == '' and path[:2] not in('//','\\\\'): | |
| 309 | cwd = os.getcwdu() | |
| 310 |         # we cannot simply os.path.join cwd and path
 | |
| 311 |         # because os.path.join('C:','/path') produce '/path'
 | |
| 312 |         # and this is incorrect
 | |
| 313 | if path[:1] in ('/','\\'): | |
| 314 | cwd = _nt_splitdrive(cwd)[0] | |
| 2279.4.3
by Alexander Belchenko win98_abspath: support for running in POSIX environment: cwd path has not drive letter | 315 | path = path[1:] | 
| 2279.4.1
by Alexander Belchenko Reimplementation of ntpath.abspath in Python for Windows98: unicode safe, UNC path safe | 316 | path = cwd + '\\' + path | 
| 317 | return _win32_fixdrive(_nt_normpath(path).replace('\\', '/')) | |
| 318 | ||
| 319 | if win32utils.winver == 'Windows 98': | |
| 320 | _win32_abspath = _win98_abspath | |
| 321 | ||
| 322 | ||
| 1685.1.20
by John Arbash Meinel More changes to get 'bzr branch' and 'bzr pull' to work | 323 | def _win32_realpath(path): | 
| 1711.4.6
by John Arbash Meinel Removing hacks for _win32_abspath, on real win32 abspath handles unicode just fine, it doesn't handle encoding into 'mbcs' | 324 |     # Real _nt_realpath doesn't have a problem with a unicode cwd
 | 
| 1711.5.2
by John Arbash Meinel win32 likes to return lowercase drive letters sometimes, and uppercase at other times. normalize this | 325 | return _win32_fixdrive(_nt_realpath(unicode(path)).replace('\\', '/')) | 
| 1685.1.20
by John Arbash Meinel More changes to get 'bzr branch' and 'bzr pull' to work | 326 | |
| 327 | ||
| 328 | def _win32_pathjoin(*args): | |
| 1685.1.31
by John Arbash Meinel Adding tests for the rest of the _win32 functions. | 329 | return _nt_join(*args).replace('\\', '/') | 
| 1685.1.20
by John Arbash Meinel More changes to get 'bzr branch' and 'bzr pull' to work | 330 | |
| 331 | ||
| 332 | def _win32_normpath(path): | |
| 1711.5.2
by John Arbash Meinel win32 likes to return lowercase drive letters sometimes, and uppercase at other times. normalize this | 333 | return _win32_fixdrive(_nt_normpath(unicode(path)).replace('\\', '/')) | 
| 1685.1.20
by John Arbash Meinel More changes to get 'bzr branch' and 'bzr pull' to work | 334 | |
| 335 | ||
| 336 | def _win32_getcwd(): | |
| 1711.5.2
by John Arbash Meinel win32 likes to return lowercase drive letters sometimes, and uppercase at other times. normalize this | 337 | return _win32_fixdrive(os.getcwdu().replace('\\', '/')) | 
| 1685.1.20
by John Arbash Meinel More changes to get 'bzr branch' and 'bzr pull' to work | 338 | |
| 339 | ||
| 340 | def _win32_mkdtemp(*args, **kwargs): | |
| 1711.5.2
by John Arbash Meinel win32 likes to return lowercase drive letters sometimes, and uppercase at other times. normalize this | 341 | return _win32_fixdrive(tempfile.mkdtemp(*args, **kwargs).replace('\\', '/')) | 
| 1685.1.20
by John Arbash Meinel More changes to get 'bzr branch' and 'bzr pull' to work | 342 | |
| 343 | ||
| 344 | def _win32_rename(old, new): | |
| 1711.7.6
by John Arbash Meinel Change _win32_rename() so that it raises ENOENT *before* it tries any renaming. | 345 | """We expect to be able to atomically replace 'new' with old. | 
| 346 | ||
| 1711.7.17
by John Arbash Meinel Delay the extra syscall in _win32_rename until we get a failure. | 347 |     On win32, if new exists, it must be moved out of the way first,
 | 
| 348 |     and then deleted. 
 | |
| 1711.7.6
by John Arbash Meinel Change _win32_rename() so that it raises ENOENT *before* it tries any renaming. | 349 |     """
 | 
| 1711.7.17
by John Arbash Meinel Delay the extra syscall in _win32_rename until we get a failure. | 350 | try: | 
| 351 | fancy_rename(old, new, rename_func=os.rename, unlink_func=os.unlink) | |
| 352 | except OSError, e: | |
| 1830.3.15
by John Arbash Meinel On Mac we get EINVAL when renaming cwd | 353 | if e.errno in (errno.EPERM, errno.EACCES, errno.EBUSY, errno.EINVAL): | 
| 354 |             # If we try to rename a non-existant file onto cwd, we get 
 | |
| 355 |             # EPERM or EACCES instead of ENOENT, this will raise ENOENT 
 | |
| 356 |             # if the old path doesn't exist, sometimes we get EACCES
 | |
| 357 |             # On Linux, we seem to get EBUSY, on Mac we get EINVAL
 | |
| 1711.7.17
by John Arbash Meinel Delay the extra syscall in _win32_rename until we get a failure. | 358 | os.lstat(old) | 
| 359 |         raise
 | |
| 1685.1.20
by John Arbash Meinel More changes to get 'bzr branch' and 'bzr pull' to work | 360 | |
| 361 | ||
| 1830.3.11
by John Arbash Meinel Create a mac version of 'getcwd()' which normalizes the path. | 362 | def _mac_getcwd(): | 
| 3201.1.1
by jameinel Fix bug #185458, switch from NFKC to NFC and add tests for filenames that would be broken under NFKC | 363 | return unicodedata.normalize('NFC', os.getcwdu()) | 
| 1830.3.11
by John Arbash Meinel Create a mac version of 'getcwd()' which normalizes the path. | 364 | |
| 365 | ||
| 1692.7.6
by Martin Pool [patch] force deletion of trees containing readonly files (alexander) | 366 | # Default is to just use the python builtins, but these can be rebound on
 | 
| 367 | # particular platforms.
 | |
| 1685.1.20
by John Arbash Meinel More changes to get 'bzr branch' and 'bzr pull' to work | 368 | abspath = _posix_abspath | 
| 369 | realpath = _posix_realpath | |
| 1185.31.47
by John Arbash Meinel Added a fancy footwork rename to osutils, made SftpTransport use it. | 370 | pathjoin = os.path.join | 
| 371 | normpath = os.path.normpath | |
| 372 | getcwd = os.getcwdu | |
| 373 | rename = os.rename | |
| 374 | dirname = os.path.dirname | |
| 375 | basename = os.path.basename | |
| 2215.4.2
by Alexander Belchenko split and splitext now the part of osutils | 376 | split = os.path.split | 
| 377 | splitext = os.path.splitext | |
| 1996.3.14
by John Arbash Meinel lazy_import osutils and sign_my_commits | 378 | # These were already imported into local scope
 | 
| 379 | # mkdtemp = tempfile.mkdtemp
 | |
| 380 | # rmtree = shutil.rmtree
 | |
| 1185.31.47
by John Arbash Meinel Added a fancy footwork rename to osutils, made SftpTransport use it. | 381 | |
| 1551.2.53
by abentley Strip trailing slashes in a platform-sensible way | 382 | MIN_ABS_PATHLENGTH = 1 | 
| 383 | ||
| 1685.1.9
by John Arbash Meinel Updated LocalTransport so that it's base is now a URL rather than a local path. This helps consistency with all other functions. To do so, I added local_abspath() which returns the local path, and local_path_to/from_url | 384 | |
| 1185.31.47
by John Arbash Meinel Added a fancy footwork rename to osutils, made SftpTransport use it. | 385 | if sys.platform == 'win32': | 
| 1685.1.20
by John Arbash Meinel More changes to get 'bzr branch' and 'bzr pull' to work | 386 | abspath = _win32_abspath | 
| 387 | realpath = _win32_realpath | |
| 388 | pathjoin = _win32_pathjoin | |
| 389 | normpath = _win32_normpath | |
| 390 | getcwd = _win32_getcwd | |
| 391 | mkdtemp = _win32_mkdtemp | |
| 392 | rename = _win32_rename | |
| 393 | ||
| 1551.2.53
by abentley Strip trailing slashes in a platform-sensible way | 394 | MIN_ABS_PATHLENGTH = 3 | 
| 1532
by Robert Collins Merge in John Meinels integration branch. | 395 | |
| 1692.7.6
by Martin Pool [patch] force deletion of trees containing readonly files (alexander) | 396 | def _win32_delete_readonly(function, path, excinfo): | 
| 397 | """Error handler for shutil.rmtree function [for win32] | |
| 398 |         Helps to remove files and dirs marked as read-only.
 | |
| 399 |         """
 | |
| 2116.5.1
by Henri Wiechers Fixes osutils.rmtree on Windows with Python 2.5 | 400 | exception = excinfo[1] | 
| 1692.7.6
by Martin Pool [patch] force deletion of trees containing readonly files (alexander) | 401 | if function in (os.remove, os.rmdir) \ | 
| 2116.5.1
by Henri Wiechers Fixes osutils.rmtree on Windows with Python 2.5 | 402 | and isinstance(exception, OSError) \ | 
| 403 | and exception.errno == errno.EACCES: | |
| 1996.3.14
by John Arbash Meinel lazy_import osutils and sign_my_commits | 404 | make_writable(path) | 
| 1692.7.6
by Martin Pool [patch] force deletion of trees containing readonly files (alexander) | 405 | function(path) | 
| 406 | else: | |
| 407 |             raise
 | |
| 408 | ||
| 409 | def rmtree(path, ignore_errors=False, onerror=_win32_delete_readonly): | |
| 410 | """Replacer for shutil.rmtree: could remove readonly dirs/files""" | |
| 411 | return shutil.rmtree(path, ignore_errors, onerror) | |
| 1830.3.11
by John Arbash Meinel Create a mac version of 'getcwd()' which normalizes the path. | 412 | elif sys.platform == 'darwin': | 
| 413 | getcwd = _mac_getcwd | |
| 1692.7.6
by Martin Pool [patch] force deletion of trees containing readonly files (alexander) | 414 | |
| 1685.1.31
by John Arbash Meinel Adding tests for the rest of the _win32 functions. | 415 | |
| 1711.4.10
by John Arbash Meinel Pull out sys.stdout.encoding handling into a separate function so it can be tested, and used elsewhere. | 416 | def get_terminal_encoding(): | 
| 417 | """Find the best encoding for printing to the screen. | |
| 418 | ||
| 419 |     This attempts to check both sys.stdout and sys.stdin to see
 | |
| 420 |     what encoding they are in, and if that fails it falls back to
 | |
| 421 |     bzrlib.user_encoding.
 | |
| 422 |     The problem is that on Windows, locale.getpreferredencoding()
 | |
| 423 |     is not the same encoding as that used by the console:
 | |
| 424 |     http://mail.python.org/pipermail/python-list/2003-May/162357.html
 | |
| 425 | ||
| 426 |     On my standard US Windows XP, the preferred encoding is
 | |
| 427 |     cp1252, but the console is cp437
 | |
| 428 |     """
 | |
| 429 | output_encoding = getattr(sys.stdout, 'encoding', None) | |
| 430 | if not output_encoding: | |
| 431 | input_encoding = getattr(sys.stdin, 'encoding', None) | |
| 432 | if not input_encoding: | |
| 433 | output_encoding = bzrlib.user_encoding | |
| 434 | mutter('encoding stdout as bzrlib.user_encoding %r', output_encoding) | |
| 435 | else: | |
| 436 | output_encoding = input_encoding | |
| 437 | mutter('encoding stdout as sys.stdin encoding %r', output_encoding) | |
| 438 | else: | |
| 439 | mutter('encoding stdout as sys.stdout encoding %r', output_encoding) | |
| 2127.4.1
by Alexander Belchenko (jam, bialix) Workaround for cp0 console encoding on Windows | 440 | if output_encoding == 'cp0': | 
| 441 |         # invalid encoding (cp0 means 'no codepage' on Windows)
 | |
| 442 | output_encoding = bzrlib.user_encoding | |
| 443 | mutter('cp0 is invalid encoding.' | |
| 444 | ' encoding stdout as bzrlib.user_encoding %r', output_encoding) | |
| 2192.1.1
by Alexander Belchenko Before actually using encoding need to check that Python has corresponding codec | 445 |     # check encoding
 | 
| 446 | try: | |
| 447 | codecs.lookup(output_encoding) | |
| 448 | except LookupError: | |
| 449 | sys.stderr.write('bzr: warning:' | |
| 2192.1.9
by Alexander Belchenko final fix suggested by John Meinel | 450 | ' unknown terminal encoding %s.\n' | 
| 2192.1.1
by Alexander Belchenko Before actually using encoding need to check that Python has corresponding codec | 451 | ' Using encoding %s instead.\n' | 
| 452 | % (output_encoding, bzrlib.user_encoding) | |
| 453 |                         )
 | |
| 454 | output_encoding = bzrlib.user_encoding | |
| 455 | ||
| 1711.4.10
by John Arbash Meinel Pull out sys.stdout.encoding handling into a separate function so it can be tested, and used elsewhere. | 456 | return output_encoding | 
| 457 | ||
| 458 | ||
| 1185.31.32
by John Arbash Meinel Updated the bzr sourcecode to use bzrlib.osutils.pathjoin rather than os.path.join to enforce internal use of / instead of \ | 459 | def normalizepath(f): | 
| 3287.18.2
by Matt McClure Reverts to 3290. | 460 | if getattr(os.path, 'realpath', None) is not None: | 
| 1185.31.32
by John Arbash Meinel Updated the bzr sourcecode to use bzrlib.osutils.pathjoin rather than os.path.join to enforce internal use of / instead of \ | 461 | F = realpath | 
| 462 | else: | |
| 463 | F = abspath | |
| 464 | [p,e] = os.path.split(f) | |
| 465 | if e == "" or e == "." or e == "..": | |
| 466 | return F(f) | |
| 467 | else: | |
| 468 | return pathjoin(F(p), e) | |
| 469 | ||
| 1
by mbp at sourcefrog import from baz patch-364 | 470 | |
| 471 | def isdir(f): | |
| 472 | """True if f is an accessible directory.""" | |
| 473 | try: | |
| 474 | return S_ISDIR(os.lstat(f)[ST_MODE]) | |
| 475 | except OSError: | |
| 476 | return False | |
| 477 | ||
| 478 | ||
| 479 | def isfile(f): | |
| 480 | """True if f is a regular file.""" | |
| 481 | try: | |
| 482 | return S_ISREG(os.lstat(f)[ST_MODE]) | |
| 483 | except OSError: | |
| 484 | return False | |
| 485 | ||
| 1092.2.6
by Robert Collins symlink support updated to work | 486 | def islink(f): | 
| 487 | """True if f is a symlink.""" | |
| 488 | try: | |
| 489 | return S_ISLNK(os.lstat(f)[ST_MODE]) | |
| 490 | except OSError: | |
| 491 | return False | |
| 1
by mbp at sourcefrog import from baz patch-364 | 492 | |
| 485
by Martin Pool - move commit code into its own module | 493 | def is_inside(dir, fname): | 
| 494 | """True if fname is inside dir. | |
| 969
by Martin Pool - Add less-sucky is_within_any | 495 |     
 | 
| 1185.31.38
by John Arbash Meinel Changing os.path.normpath to osutils.normpath | 496 |     The parameters should typically be passed to osutils.normpath first, so
 | 
| 969
by Martin Pool - Add less-sucky is_within_any | 497 |     that . and .. and repeated slashes are eliminated, and the separators
 | 
| 498 |     are canonical for the platform.
 | |
| 499 |     
 | |
| 974.1.26
by aaron.bentley at utoronto merged mbp@sourcefrog.net-20050817233101-0939da1cf91f2472 | 500 |     The empty string as a dir name is taken as top-of-tree and matches 
 | 
| 501 |     everything.
 | |
| 485
by Martin Pool - move commit code into its own module | 502 |     """
 | 
| 969
by Martin Pool - Add less-sucky is_within_any | 503 |     # XXX: Most callers of this can actually do something smarter by 
 | 
| 504 |     # looking at the inventory
 | |
| 972
by Martin Pool - less dodgy is_inside function | 505 | if dir == fname: | 
| 506 | return True | |
| 507 | ||
| 974.1.26
by aaron.bentley at utoronto merged mbp@sourcefrog.net-20050817233101-0939da1cf91f2472 | 508 | if dir == '': | 
| 509 | return True | |
| 1185.1.41
by Robert Collins massive patch from Alexander Belchenko - many PEP8 fixes, removes unused function uuid | 510 | |
| 1185.31.34
by John Arbash Meinel Removing instances of os.sep | 511 | if dir[-1] != '/': | 
| 512 | dir += '/' | |
| 1185.1.41
by Robert Collins massive patch from Alexander Belchenko - many PEP8 fixes, removes unused function uuid | 513 | |
| 972
by Martin Pool - less dodgy is_inside function | 514 | return fname.startswith(dir) | 
| 515 | ||
| 485
by Martin Pool - move commit code into its own module | 516 | |
| 517 | def is_inside_any(dir_list, fname): | |
| 518 | """True if fname is inside any of given dirs.""" | |
| 519 | for dirname in dir_list: | |
| 520 | if is_inside(dirname, fname): | |
| 521 | return True | |
| 2324.2.3
by Dmitry Vasiliev Fixed is_inside_* methods implementation | 522 | return False | 
| 485
by Martin Pool - move commit code into its own module | 523 | |
| 524 | ||
| 1740.3.4
by Jelmer Vernooij Move inventory to commit builder. | 525 | def is_inside_or_parent_of_any(dir_list, fname): | 
| 526 | """True if fname is a child or a parent of any of the given files.""" | |
| 527 | for dirname in dir_list: | |
| 528 | if is_inside(dirname, fname) or is_inside(fname, dirname): | |
| 529 | return True | |
| 2324.2.3
by Dmitry Vasiliev Fixed is_inside_* methods implementation | 530 | return False | 
| 1740.3.4
by Jelmer Vernooij Move inventory to commit builder. | 531 | |
| 532 | ||
| 3408.6.1
by Eric Holmberg Fix for Bug #215426 in which bzr can cause a MemoryError in socket.recv while | 533 | def pumpfile(from_file, to_file, read_length=-1, buff_size=32768): | 
| 2745.5.2
by Robert Collins * ``bzrlib.transport.Transport.put_file`` now returns the number of bytes | 534 | """Copy contents of one file to another. | 
| 3408.6.1
by Eric Holmberg Fix for Bug #215426 in which bzr can cause a MemoryError in socket.recv while | 535 | |
| 536 |     The read_length can either be -1 to read to end-of-file (EOF) or
 | |
| 537 |     it can specify the maximum number of bytes to read.
 | |
| 538 | ||
| 539 |     The buff_size represents the maximum size for each read operation
 | |
| 540 |     performed on from_file.
 | |
| 541 | ||
| 2745.5.2
by Robert Collins * ``bzrlib.transport.Transport.put_file`` now returns the number of bytes | 542 |     :return: The number of bytes copied.
 | 
| 543 |     """
 | |
| 544 | length = 0 | |
| 3408.6.1
by Eric Holmberg Fix for Bug #215426 in which bzr can cause a MemoryError in socket.recv while | 545 | if read_length >= 0: | 
| 546 |         # read specified number of bytes
 | |
| 547 | ||
| 548 | while read_length > 0: | |
| 549 | num_bytes_to_read = min(read_length, buff_size) | |
| 550 | ||
| 551 | block = from_file.read(num_bytes_to_read) | |
| 552 | if not block: | |
| 553 |                 # EOF reached
 | |
| 554 |                 break
 | |
| 555 | to_file.write(block) | |
| 556 | ||
| 557 | actual_bytes_read = len(block) | |
| 558 | read_length -= actual_bytes_read | |
| 559 | length += actual_bytes_read | |
| 560 | else: | |
| 561 |         # read to EOF
 | |
| 562 | while True: | |
| 563 | block = from_file.read(buff_size) | |
| 564 | if not block: | |
| 565 |                 # EOF reached
 | |
| 566 |                 break
 | |
| 567 | to_file.write(block) | |
| 568 | length += len(block) | |
| 2745.5.2
by Robert Collins * ``bzrlib.transport.Transport.put_file`` now returns the number of bytes | 569 | return length | 
| 1
by mbp at sourcefrog import from baz patch-364 | 570 | |
| 571 | ||
| 1185.67.7
by Aaron Bentley Refactored a bit | 572 | def file_iterator(input_file, readsize=32768): | 
| 573 | while True: | |
| 574 | b = input_file.read(readsize) | |
| 575 | if len(b) == 0: | |
| 576 |             break
 | |
| 577 | yield b | |
| 578 | ||
| 579 | ||
| 1
by mbp at sourcefrog import from baz patch-364 | 580 | def sha_file(f): | 
| 3376.2.4
by Martin Pool Remove every assert statement from bzrlib! | 581 | """Calculate the hexdigest of an open file. | 
| 582 | ||
| 583 |     The file cursor should be already at the start.
 | |
| 584 |     """
 | |
| 1
by mbp at sourcefrog import from baz patch-364 | 585 | s = sha.new() | 
| 320
by Martin Pool - Compute SHA-1 of files in chunks | 586 | BUFSIZE = 128<<10 | 
| 587 | while True: | |
| 588 | b = f.read(BUFSIZE) | |
| 589 | if not b: | |
| 590 |             break
 | |
| 591 | s.update(b) | |
| 1
by mbp at sourcefrog import from baz patch-364 | 592 | return s.hexdigest() | 
| 593 | ||
| 594 | ||
| 2872.3.1
by Martin Pool Add -Dhashcache option; clean up dirstate sha1 code | 595 | def sha_file_by_name(fname): | 
| 596 | """Calculate the SHA1 of a file by reading the full text""" | |
| 2872.3.2
by Martin Pool Do sha_file_by_name using raw os files rather than file objects; makes this routine about 12osutils.py faster | 597 | s = sha.new() | 
| 2922.1.1
by John Arbash Meinel Fix bug #153493, use O_BINARY when reading files. | 598 | f = os.open(fname, os.O_RDONLY | O_BINARY) | 
| 2872.3.1
by Martin Pool Add -Dhashcache option; clean up dirstate sha1 code | 599 | try: | 
| 2872.3.2
by Martin Pool Do sha_file_by_name using raw os files rather than file objects; makes this routine about 12osutils.py faster | 600 | while True: | 
| 601 | b = os.read(f, 1<<16) | |
| 602 | if not b: | |
| 603 | return s.hexdigest() | |
| 604 | s.update(b) | |
| 2872.3.1
by Martin Pool Add -Dhashcache option; clean up dirstate sha1 code | 605 | finally: | 
| 2872.3.2
by Martin Pool Do sha_file_by_name using raw os files rather than file objects; makes this routine about 12osutils.py faster | 606 | os.close(f) | 
| 2872.3.1
by Martin Pool Add -Dhashcache option; clean up dirstate sha1 code | 607 | |
| 608 | ||
| 2825.2.1
by Robert Collins Micro-tweaks to sha routines. | 609 | def sha_strings(strings, _factory=sha.new): | 
| 1235
by Martin Pool - split sha_strings into osutils | 610 | """Return the sha-1 of concatenation of strings""" | 
| 2825.2.1
by Robert Collins Micro-tweaks to sha routines. | 611 | s = _factory() | 
| 1235
by Martin Pool - split sha_strings into osutils | 612 | map(s.update, strings) | 
| 613 | return s.hexdigest() | |
| 614 | ||
| 615 | ||
| 2825.2.1
by Robert Collins Micro-tweaks to sha routines. | 616 | def sha_string(f, _factory=sha.new): | 
| 617 | return _factory(f).hexdigest() | |
| 1
by mbp at sourcefrog import from baz patch-364 | 618 | |
| 619 | ||
| 124
by mbp at sourcefrog - check file text for past revisions is correct | 620 | def fingerprint_file(f): | 
| 126
by mbp at sourcefrog Use just one big read to fingerprint files | 621 | b = f.read() | 
| 2825.2.1
by Robert Collins Micro-tweaks to sha routines. | 622 | return {'size': len(b), | 
| 623 | 'sha1': sha.new(b).hexdigest()} | |
| 124
by mbp at sourcefrog - check file text for past revisions is correct | 624 | |
| 625 | ||
| 1
by mbp at sourcefrog import from baz patch-364 | 626 | def compare_files(a, b): | 
| 627 | """Returns true if equal in contents""" | |
| 74
by mbp at sourcefrog compare_files: read in one page at a time rather than | 628 | BUFSIZE = 4096 | 
| 629 | while True: | |
| 630 | ai = a.read(BUFSIZE) | |
| 631 | bi = b.read(BUFSIZE) | |
| 632 | if ai != bi: | |
| 633 | return False | |
| 634 | if ai == '': | |
| 635 | return True | |
| 1
by mbp at sourcefrog import from baz patch-364 | 636 | |
| 637 | ||
| 49
by mbp at sourcefrog fix local-time-offset calculation | 638 | def local_time_offset(t=None): | 
| 639 | """Return offset of local zone from GMT, either at present or at time t.""" | |
| 1963.2.6
by Robey Pointer pychecker is on crack; go back to using 'is None'. | 640 | if t is None: | 
| 73
by mbp at sourcefrog fix time.localtime call for python 2.3 | 641 | t = time.time() | 
| 2215.6.1
by James Henstridge Don't rely on time.timezone and time.altzone in local_time_offset(), | 642 | offset = datetime.fromtimestamp(t) - datetime.utcfromtimestamp(t) | 
| 643 | return offset.days * 86400 + offset.seconds | |
| 8
by mbp at sourcefrog store committer's timezone in revision and show | 644 | |
| 3512.3.1
by Martin von Gagern Hand-selected minimalistic set of changes from my setlocale branch. | 645 | weekdays = ['Mon', 'Tue', 'Wed', 'Thu', 'Fri', 'Sat', 'Sun'] | 
| 8
by mbp at sourcefrog store committer's timezone in revision and show | 646 | |
| 2425.6.2
by Martin Pool Make timestamps use existing format_date; document that function more | 647 | def format_date(t, offset=0, timezone='original', date_fmt=None, | 
| 1185.12.24
by Aaron Bentley Made format_date more flexible | 648 | show_offset=True): | 
| 2425.6.2
by Martin Pool Make timestamps use existing format_date; document that function more | 649 | """Return a formatted date string. | 
| 650 | ||
| 651 |     :param t: Seconds since the epoch.
 | |
| 652 |     :param offset: Timezone offset in seconds east of utc.
 | |
| 653 |     :param timezone: How to display the time: 'utc', 'original' for the
 | |
| 654 |          timezone specified by offset, or 'local' for the process's current
 | |
| 655 |          timezone.
 | |
| 656 |     :param show_offset: Whether to append the timezone.
 | |
| 657 |     :param date_fmt: strftime format.
 | |
| 658 |     """
 | |
| 8
by mbp at sourcefrog store committer's timezone in revision and show | 659 | if timezone == 'utc': | 
| 1
by mbp at sourcefrog import from baz patch-364 | 660 | tt = time.gmtime(t) | 
| 661 | offset = 0 | |
| 8
by mbp at sourcefrog store committer's timezone in revision and show | 662 | elif timezone == 'original': | 
| 1963.2.6
by Robey Pointer pychecker is on crack; go back to using 'is None'. | 663 | if offset is None: | 
| 23
by mbp at sourcefrog format_date: handle revisions with no timezone offset | 664 | offset = 0 | 
| 16
by mbp at sourcefrog fix inverted calculation for original timezone -> utc | 665 | tt = time.gmtime(t + offset) | 
| 12
by mbp at sourcefrog new --timezone option for bzr log | 666 | elif timezone == 'local': | 
| 1
by mbp at sourcefrog import from baz patch-364 | 667 | tt = time.localtime(t) | 
| 49
by mbp at sourcefrog fix local-time-offset calculation | 668 | offset = local_time_offset(t) | 
| 12
by mbp at sourcefrog new --timezone option for bzr log | 669 | else: | 
| 3144.1.1
by Lukáš Lalinský Fixed error reporting of unsupported timezone format. | 670 | raise errors.UnsupportedTimezoneFormat(timezone) | 
| 1185.12.24
by Aaron Bentley Made format_date more flexible | 671 | if date_fmt is None: | 
| 672 | date_fmt = "%a %Y-%m-%d %H:%M:%S" | |
| 673 | if show_offset: | |
| 674 | offset_str = ' %+03d%02d' % (offset / 3600, (offset / 60) % 60) | |
| 675 | else: | |
| 676 | offset_str = '' | |
| 3512.3.1
by Martin von Gagern Hand-selected minimalistic set of changes from my setlocale branch. | 677 |     # day of week depends on locale, so we do this ourself
 | 
| 678 | date_fmt = date_fmt.replace('%a', weekdays[tt[6]]) | |
| 1185.12.24
by Aaron Bentley Made format_date more flexible | 679 | return (time.strftime(date_fmt, tt) + offset_str) | 
| 1
by mbp at sourcefrog import from baz patch-364 | 680 | |
| 681 | ||
| 682 | def compact_date(when): | |
| 683 | return time.strftime('%Y%m%d%H%M%S', time.gmtime(when)) | |
| 684 | ||
| 685 | ||
| 1957.1.4
by John Arbash Meinel create a helper for formatting a time delta | 686 | def format_delta(delta): | 
| 687 | """Get a nice looking string for a time delta. | |
| 688 | ||
| 689 |     :param delta: The time difference in seconds, can be positive or negative.
 | |
| 690 |         positive indicates time in the past, negative indicates time in the
 | |
| 691 |         future. (usually time.time() - stored_time)
 | |
| 692 |     :return: String formatted to show approximate resolution
 | |
| 693 |     """
 | |
| 694 | delta = int(delta) | |
| 695 | if delta >= 0: | |
| 696 | direction = 'ago' | |
| 697 | else: | |
| 698 | direction = 'in the future' | |
| 699 | delta = -delta | |
| 700 | ||
| 701 | seconds = delta | |
| 702 | if seconds < 90: # print seconds up to 90 seconds | |
| 703 | if seconds == 1: | |
| 704 | return '%d second %s' % (seconds, direction,) | |
| 705 | else: | |
| 706 | return '%d seconds %s' % (seconds, direction) | |
| 707 | ||
| 708 | minutes = int(seconds / 60) | |
| 709 | seconds -= 60 * minutes | |
| 710 | if seconds == 1: | |
| 711 | plural_seconds = '' | |
| 712 | else: | |
| 713 | plural_seconds = 's' | |
| 714 | if minutes < 90: # print minutes, seconds up to 90 minutes | |
| 715 | if minutes == 1: | |
| 716 | return '%d minute, %d second%s %s' % ( | |
| 717 | minutes, seconds, plural_seconds, direction) | |
| 718 | else: | |
| 719 | return '%d minutes, %d second%s %s' % ( | |
| 720 | minutes, seconds, plural_seconds, direction) | |
| 721 | ||
| 722 | hours = int(minutes / 60) | |
| 723 | minutes -= 60 * hours | |
| 724 | if minutes == 1: | |
| 725 | plural_minutes = '' | |
| 726 | else: | |
| 727 | plural_minutes = 's' | |
| 728 | ||
| 729 | if hours == 1: | |
| 730 | return '%d hour, %d minute%s %s' % (hours, minutes, | |
| 731 | plural_minutes, direction) | |
| 732 | return '%d hours, %d minute%s %s' % (hours, minutes, | |
| 733 | plural_minutes, direction) | |
| 1
by mbp at sourcefrog import from baz patch-364 | 734 | |
| 735 | def filesize(f): | |
| 736 | """Return size of given open file.""" | |
| 737 | return os.fstat(f.fileno())[ST_SIZE] | |
| 738 | ||
| 1553.5.5
by Martin Pool New utility routine rand_chars | 739 | |
| 1185.1.7
by Robert Collins Nathaniel McCallums patch for urandom friendliness on aix. | 740 | # Define rand_bytes based on platform.
 | 
| 741 | try: | |
| 742 |     # Python 2.4 and later have os.urandom,
 | |
| 743 |     # but it doesn't work on some arches
 | |
| 744 | os.urandom(1) | |
| 1
by mbp at sourcefrog import from baz patch-364 | 745 | rand_bytes = os.urandom | 
| 1185.1.7
by Robert Collins Nathaniel McCallums patch for urandom friendliness on aix. | 746 | except (NotImplementedError, AttributeError): | 
| 747 |     # If python doesn't have os.urandom, or it doesn't work,
 | |
| 748 |     # then try to first pull random data from /dev/urandom
 | |
| 2067.1.1
by John Arbash Meinel Catch an exception while opening /dev/urandom rather than using os.path.exists() | 749 | try: | 
| 1185.1.7
by Robert Collins Nathaniel McCallums patch for urandom friendliness on aix. | 750 | rand_bytes = file('/dev/urandom', 'rb').read | 
| 751 |     # Otherwise, use this hack as a last resort
 | |
| 2067.1.1
by John Arbash Meinel Catch an exception while opening /dev/urandom rather than using os.path.exists() | 752 | except (IOError, OSError): | 
| 1185.1.7
by Robert Collins Nathaniel McCallums patch for urandom friendliness on aix. | 753 |         # not well seeded, but better than nothing
 | 
| 754 | def rand_bytes(n): | |
| 755 | import random | |
| 756 | s = '' | |
| 757 | while n: | |
| 758 | s += chr(random.randint(0, 255)) | |
| 759 | n -= 1 | |
| 760 | return s | |
| 1
by mbp at sourcefrog import from baz patch-364 | 761 | |
| 1553.5.5
by Martin Pool New utility routine rand_chars | 762 | |
| 763 | ALNUM = '0123456789abcdefghijklmnopqrstuvwxyz' | |
| 764 | def rand_chars(num): | |
| 765 | """Return a random string of num alphanumeric characters | |
| 766 |     
 | |
| 767 |     The result only contains lowercase chars because it may be used on 
 | |
| 768 |     case-insensitive filesystems.
 | |
| 769 |     """
 | |
| 770 | s = '' | |
| 771 | for raw_byte in rand_bytes(num): | |
| 772 | s += ALNUM[ord(raw_byte) % 36] | |
| 773 | return s | |
| 774 | ||
| 775 | ||
| 1
by mbp at sourcefrog import from baz patch-364 | 776 | ## TODO: We could later have path objects that remember their list
 | 
| 1759.2.2
by Jelmer Vernooij Revert some of my spelling fixes and fix some typos after review by Aaron. | 777 | ## decomposition (might be too tricksy though.)
 | 
| 1
by mbp at sourcefrog import from baz patch-364 | 778 | |
| 779 | def splitpath(p): | |
| 1996.3.14
by John Arbash Meinel lazy_import osutils and sign_my_commits | 780 | """Turn string into list of parts.""" | 
| 271
by Martin Pool - Windows path fixes | 781 |     # split on either delimiter because people might use either on
 | 
| 782 |     # Windows
 | |
| 783 | ps = re.split(r'[\\/]', p) | |
| 784 | ||
| 785 | rps = [] | |
| 1
by mbp at sourcefrog import from baz patch-364 | 786 | for f in ps: | 
| 787 | if f == '..': | |
| 1996.3.25
by John Arbash Meinel Make importing errors lazy for osutils | 788 | raise errors.BzrError("sorry, %r not allowed in path" % f) | 
| 271
by Martin Pool - Windows path fixes | 789 | elif (f == '.') or (f == ''): | 
| 790 |             pass
 | |
| 791 | else: | |
| 792 | rps.append(f) | |
| 793 | return rps | |
| 1
by mbp at sourcefrog import from baz patch-364 | 794 | |
| 795 | def joinpath(p): | |
| 796 | for f in p: | |
| 1963.2.6
by Robey Pointer pychecker is on crack; go back to using 'is None'. | 797 | if (f == '..') or (f is None) or (f == ''): | 
| 1996.3.25
by John Arbash Meinel Make importing errors lazy for osutils | 798 | raise errors.BzrError("sorry, %r not allowed in path" % f) | 
| 1185.31.32
by John Arbash Meinel Updated the bzr sourcecode to use bzrlib.osutils.pathjoin rather than os.path.join to enforce internal use of / instead of \ | 799 | return pathjoin(*p) | 
| 1
by mbp at sourcefrog import from baz patch-364 | 800 | |
| 801 | ||
| 1231
by Martin Pool - more progress on fetch on top of weaves | 802 | def split_lines(s): | 
| 803 | """Split s into lines, but without removing the newline characters.""" | |
| 1666.1.6
by Robert Collins Make knit the default format. | 804 | lines = s.split('\n') | 
| 805 | result = [line + '\n' for line in lines[:-1]] | |
| 806 | if lines[-1]: | |
| 807 | result.append(lines[-1]) | |
| 808 | return result | |
| 1391
by Robert Collins merge from integration | 809 | |
| 810 | ||
| 1185.10.4
by Aaron Bentley Disabled hardlinks on cygwin, mac OS | 811 | def hardlinks_good(): | 
| 1185.10.5
by Aaron Bentley Fixed hardlinks_good test | 812 | return sys.platform not in ('win32', 'cygwin', 'darwin') | 
| 1185.10.4
by Aaron Bentley Disabled hardlinks on cygwin, mac OS | 813 | |
| 1185.1.46
by Robert Collins Aarons branch --basis patch | 814 | |
| 1185.10.3
by Aaron Bentley Made copy_multi_immutable create hardlinks opportunistically | 815 | def link_or_copy(src, dest): | 
| 816 | """Hardlink a file, or copy it if it can't be hardlinked.""" | |
| 1185.10.4
by Aaron Bentley Disabled hardlinks on cygwin, mac OS | 817 | if not hardlinks_good(): | 
| 1996.3.14
by John Arbash Meinel lazy_import osutils and sign_my_commits | 818 | shutil.copyfile(src, dest) | 
| 1185.10.3
by Aaron Bentley Made copy_multi_immutable create hardlinks opportunistically | 819 |         return
 | 
| 820 | try: | |
| 821 | os.link(src, dest) | |
| 822 | except (OSError, IOError), e: | |
| 823 | if e.errno != errno.EXDEV: | |
| 824 |             raise
 | |
| 1996.3.14
by John Arbash Meinel lazy_import osutils and sign_my_commits | 825 | shutil.copyfile(src, dest) | 
| 1399.1.4
by Robert Collins move diff and symlink conditionals into inventory.py from diff.py | 826 | |
| 2831.5.2
by Vincent Ladeuil Review feedback. | 827 | |
| 828 | # Look Before You Leap (LBYL) is appropriate here instead of Easier to Ask for
 | |
| 829 | # Forgiveness than Permission (EAFP) because:
 | |
| 830 | # - root can damage a solaris file system by using unlink,
 | |
| 831 | # - unlink raises different exceptions on different OSes (linux: EISDIR, win32:
 | |
| 832 | #   EACCES, OSX: EPERM) when invoked on a directory.
 | |
| 833 | def delete_any(path): | |
| 1558.12.9
by Aaron Bentley Handle resolving conflicts with directories properly | 834 | """Delete a file or directory.""" | 
| 2831.5.2
by Vincent Ladeuil Review feedback. | 835 | if isdir(path): # Takes care of symlinks | 
| 836 | os.rmdir(path) | |
| 837 | else: | |
| 838 | os.unlink(path) | |
| 1558.12.9
by Aaron Bentley Handle resolving conflicts with directories properly | 839 | |
| 1399.1.4
by Robert Collins move diff and symlink conditionals into inventory.py from diff.py | 840 | |
| 841 | def has_symlinks(): | |
| 1963.2.6
by Robey Pointer pychecker is on crack; go back to using 'is None'. | 842 | if getattr(os, 'symlink', None) is not None: | 
| 1399.1.4
by Robert Collins move diff and symlink conditionals into inventory.py from diff.py | 843 | return True | 
| 844 | else: | |
| 845 | return False | |
| 2831.5.2
by Vincent Ladeuil Review feedback. | 846 | |
| 1185.16.38
by Martin Pool - move contains_whitespace and contains_linebreaks to osutils | 847 | |
| 3136.1.1
by Aaron Bentley Add support for hardlinks to TreeTransform | 848 | def has_hardlinks(): | 
| 849 | if getattr(os, 'link', None) is not None: | |
| 850 | return True | |
| 851 | else: | |
| 852 | return False | |
| 853 | ||
| 854 | ||
| 3287.18.14
by Matt McClure Extracted a host_os_dereferences_symlinks method. | 855 | def host_os_dereferences_symlinks(): | 
| 856 | return (has_symlinks() | |
| 3287.18.19
by Matt McClure Changed tested sys.platform value from 'windows' (mistaken) to 'win32' | 857 | and sys.platform not in ('cygwin', 'win32')) | 
| 3287.18.14
by Matt McClure Extracted a host_os_dereferences_symlinks method. | 858 | |
| 859 | ||
| 1185.16.38
by Martin Pool - move contains_whitespace and contains_linebreaks to osutils | 860 | def contains_whitespace(s): | 
| 861 | """True if there are any whitespace characters in s.""" | |
| 2249.2.1
by John Arbash Meinel (John Arbash Meinel) hard-code the whitespace chars to avoid problems in some locales. | 862 |     # string.whitespace can include '\xa0' in certain locales, because it is
 | 
| 863 |     # considered "non-breaking-space" as part of ISO-8859-1. But it
 | |
| 864 |     # 1) Isn't a breaking whitespace
 | |
| 865 |     # 2) Isn't one of ' \t\r\n' which are characters we sometimes use as
 | |
| 866 |     #    separators
 | |
| 867 |     # 3) '\xa0' isn't unicode safe since it is >128.
 | |
| 2249.5.16
by John Arbash Meinel [merge] bzr.dev 2283 | 868 | |
| 869 |     # This should *not* be a unicode set of characters in case the source
 | |
| 870 |     # string is not a Unicode string. We can auto-up-cast the characters since
 | |
| 871 |     # they are ascii, but we don't want to auto-up-cast the string in case it
 | |
| 872 |     # is utf-8
 | |
| 873 | for ch in ' \t\n\r\v\f': | |
| 1185.16.38
by Martin Pool - move contains_whitespace and contains_linebreaks to osutils | 874 | if ch in s: | 
| 875 | return True | |
| 876 | else: | |
| 877 | return False | |
| 878 | ||
| 879 | ||
| 880 | def contains_linebreaks(s): | |
| 881 | """True if there is any vertical whitespace in s.""" | |
| 882 | for ch in '\f\n\r': | |
| 883 | if ch in s: | |
| 884 | return True | |
| 885 | else: | |
| 886 | return False | |
| 1457.1.2
by Robert Collins move branch._relpath into osutils as relpath | 887 | |
| 888 | ||
| 889 | def relpath(base, path): | |
| 890 | """Return path relative to base, or raise exception. | |
| 891 | ||
| 892 |     The path may be either an absolute path or a path relative to the
 | |
| 893 |     current working directory.
 | |
| 894 | ||
| 895 |     os.path.commonprefix (python2.4) has a bad bug that it works just
 | |
| 896 |     on string prefixes, assuming that '/u' is a prefix of '/u2'.  This
 | |
| 1636.1.1
by Robert Collins Fix calling relpath() and abspath() on transports at their root. | 897 |     avoids that problem.
 | 
| 898 |     """
 | |
| 1685.1.12
by John Arbash Meinel Some more work to get LocalTransport to only support URLs | 899 | |
| 3376.2.4
by Martin Pool Remove every assert statement from bzrlib! | 900 | if len(base) < MIN_ABS_PATHLENGTH: | 
| 901 |         # must have space for e.g. a drive letter
 | |
| 902 | raise ValueError('%r is too short to calculate a relative path' | |
| 903 | % (base,)) | |
| 1685.1.9
by John Arbash Meinel Updated LocalTransport so that it's base is now a URL rather than a local path. This helps consistency with all other functions. To do so, I added local_abspath() which returns the local path, and local_path_to/from_url | 904 | |
| 1685.1.12
by John Arbash Meinel Some more work to get LocalTransport to only support URLs | 905 | rp = abspath(path) | 
| 1457.1.2
by Robert Collins move branch._relpath into osutils as relpath | 906 | |
| 907 | s = [] | |
| 1685.1.12
by John Arbash Meinel Some more work to get LocalTransport to only support URLs | 908 | head = rp | 
| 1457.1.2
by Robert Collins move branch._relpath into osutils as relpath | 909 | while len(head) >= len(base): | 
| 910 | if head == base: | |
| 911 |             break
 | |
| 912 | head, tail = os.path.split(head) | |
| 913 | if tail: | |
| 914 | s.insert(0, tail) | |
| 915 | else: | |
| 1996.3.25
by John Arbash Meinel Make importing errors lazy for osutils | 916 | raise errors.PathNotChild(rp, base) | 
| 1457.1.2
by Robert Collins move branch._relpath into osutils as relpath | 917 | |
| 1185.31.35
by John Arbash Meinel Couple small fixes, all tests pass on cygwin. | 918 | if s: | 
| 919 | return pathjoin(*s) | |
| 920 | else: | |
| 921 | return '' | |
| 1185.33.60
by Martin Pool Use full terminal width for verbose test output. | 922 | |
| 923 | ||
| 1534.3.1
by Robert Collins * bzrlib.osutils.safe_unicode now exists to provide parameter coercion | 924 | def safe_unicode(unicode_or_utf8_string): | 
| 925 | """Coerce unicode_or_utf8_string into unicode. | |
| 926 | ||
| 927 |     If it is unicode, it is returned.
 | |
| 928 |     Otherwise it is decoded from utf-8. If a decoding error
 | |
| 929 |     occurs, it is wrapped as a If the decoding fails, the exception is wrapped 
 | |
| 930 |     as a BzrBadParameter exception.
 | |
| 931 |     """
 | |
| 932 | if isinstance(unicode_or_utf8_string, unicode): | |
| 933 | return unicode_or_utf8_string | |
| 934 | try: | |
| 935 | return unicode_or_utf8_string.decode('utf8') | |
| 936 | except UnicodeDecodeError: | |
| 1996.3.25
by John Arbash Meinel Make importing errors lazy for osutils | 937 | raise errors.BzrBadParameterNotUnicode(unicode_or_utf8_string) | 
| 1534.3.1
by Robert Collins * bzrlib.osutils.safe_unicode now exists to provide parameter coercion | 938 | |
| 939 | ||
| 2249.5.8
by John Arbash Meinel Add osutils.safe_utf8 and safe_revision_id for the new revision_id work. | 940 | def safe_utf8(unicode_or_utf8_string): | 
| 941 | """Coerce unicode_or_utf8_string to a utf8 string. | |
| 942 | ||
| 943 |     If it is a str, it is returned.
 | |
| 944 |     If it is Unicode, it is encoded into a utf-8 string.
 | |
| 945 |     """
 | |
| 946 | if isinstance(unicode_or_utf8_string, str): | |
| 947 |         # TODO: jam 20070209 This is overkill, and probably has an impact on
 | |
| 948 |         #       performance if we are dealing with lots of apis that want a
 | |
| 949 |         #       utf-8 revision id
 | |
| 950 | try: | |
| 951 |             # Make sure it is a valid utf-8 string
 | |
| 952 | unicode_or_utf8_string.decode('utf-8') | |
| 953 | except UnicodeDecodeError: | |
| 954 | raise errors.BzrBadParameterNotUnicode(unicode_or_utf8_string) | |
| 955 | return unicode_or_utf8_string | |
| 956 | return unicode_or_utf8_string.encode('utf-8') | |
| 957 | ||
| 958 | ||
| 2309.4.4
by John Arbash Meinel Change what warnings are raised, and add tests that they are used. | 959 | _revision_id_warning = ('Unicode revision ids were deprecated in bzr 0.15.' | 
| 960 |                         ' Revision id generators should be creating utf8'
 | |
| 961 | ' revision ids.') | |
| 962 | ||
| 963 | ||
| 964 | def safe_revision_id(unicode_or_utf8_string, warn=True): | |
| 2249.5.8
by John Arbash Meinel Add osutils.safe_utf8 and safe_revision_id for the new revision_id work. | 965 | """Revision ids should now be utf8, but at one point they were unicode. | 
| 966 | ||
| 2309.4.4
by John Arbash Meinel Change what warnings are raised, and add tests that they are used. | 967 |     :param unicode_or_utf8_string: A possibly Unicode revision_id. (can also be
 | 
| 968 |         utf8 or None).
 | |
| 969 |     :param warn: Functions that are sanitizing user data can set warn=False
 | |
| 970 |     :return: None or a utf8 revision id.
 | |
| 2249.5.8
by John Arbash Meinel Add osutils.safe_utf8 and safe_revision_id for the new revision_id work. | 971 |     """
 | 
| 2309.4.3
by John Arbash Meinel (broken) change safe_*_id to emit a warning. | 972 | if (unicode_or_utf8_string is None | 
| 973 | or unicode_or_utf8_string.__class__ == str): | |
| 974 | return unicode_or_utf8_string | |
| 2309.4.4
by John Arbash Meinel Change what warnings are raised, and add tests that they are used. | 975 | if warn: | 
| 976 | symbol_versioning.warn(_revision_id_warning, DeprecationWarning, | |
| 977 | stacklevel=2) | |
| 2309.4.3
by John Arbash Meinel (broken) change safe_*_id to emit a warning. | 978 | return cache_utf8.encode(unicode_or_utf8_string) | 
| 979 | ||
| 980 | ||
| 2309.4.4
by John Arbash Meinel Change what warnings are raised, and add tests that they are used. | 981 | _file_id_warning = ('Unicode file ids were deprecated in bzr 0.15. File id' | 
| 982 | ' generators should be creating utf8 file ids.') | |
| 983 | ||
| 984 | ||
| 985 | def safe_file_id(unicode_or_utf8_string, warn=True): | |
| 2309.4.3
by John Arbash Meinel (broken) change safe_*_id to emit a warning. | 986 | """File ids should now be utf8, but at one point they were unicode. | 
| 987 | ||
| 988 |     This is the same as safe_utf8, except it uses the cached encode functions
 | |
| 989 |     to save a little bit of performance.
 | |
| 2309.4.4
by John Arbash Meinel Change what warnings are raised, and add tests that they are used. | 990 | |
| 991 |     :param unicode_or_utf8_string: A possibly Unicode file_id. (can also be
 | |
| 992 |         utf8 or None).
 | |
| 993 |     :param warn: Functions that are sanitizing user data can set warn=False
 | |
| 994 |     :return: None or a utf8 file id.
 | |
| 2309.4.3
by John Arbash Meinel (broken) change safe_*_id to emit a warning. | 995 |     """
 | 
| 996 | if (unicode_or_utf8_string is None | |
| 997 | or unicode_or_utf8_string.__class__ == str): | |
| 998 | return unicode_or_utf8_string | |
| 2309.4.4
by John Arbash Meinel Change what warnings are raised, and add tests that they are used. | 999 | if warn: | 
| 1000 | symbol_versioning.warn(_file_id_warning, DeprecationWarning, | |
| 1001 | stacklevel=2) | |
| 2309.4.3
by John Arbash Meinel (broken) change safe_*_id to emit a warning. | 1002 | return cache_utf8.encode(unicode_or_utf8_string) | 
| 2294.1.4
by John Arbash Meinel Add safe_file_id as a helper in osutils. | 1003 | |
| 1004 | ||
| 1185.85.75
by John Arbash Meinel Adding bzrlib.osutils.unicode_filename to handle unicode normalization for file paths. | 1005 | _platform_normalizes_filenames = False | 
| 1006 | if sys.platform == 'darwin': | |
| 1007 | _platform_normalizes_filenames = True | |
| 1008 | ||
| 1009 | ||
| 1010 | def normalizes_filenames(): | |
| 1011 | """Return True if this platform normalizes unicode filenames. | |
| 1012 | ||
| 1013 |     Mac OSX does, Windows/Linux do not.
 | |
| 1014 |     """
 | |
| 1015 | return _platform_normalizes_filenames | |
| 1016 | ||
| 1017 | ||
| 1830.3.2
by John Arbash Meinel normalized_filename is a much better name | 1018 | def _accessible_normalized_filename(path): | 
| 1830.3.1
by John Arbash Meinel Change the return value of unicode_filename, and make it testable on all platforms | 1019 | """Get the unicode normalized path, and if you can access the file. | 
| 1020 | ||
| 1021 |     On platforms where the system normalizes filenames (Mac OSX),
 | |
| 1022 |     you can access a file by any path which will normalize correctly.
 | |
| 1023 |     On platforms where the system does not normalize filenames 
 | |
| 1024 |     (Windows, Linux), you have to access a file by its exact path.
 | |
| 1025 | ||
| 3201.1.1
by jameinel Fix bug #185458, switch from NFKC to NFC and add tests for filenames that would be broken under NFKC | 1026 |     Internally, bzr only supports NFC normalization, since that is 
 | 
| 1830.3.1
by John Arbash Meinel Change the return value of unicode_filename, and make it testable on all platforms | 1027 |     the standard for XML documents.
 | 
| 1028 | ||
| 1029 |     So return the normalized path, and a flag indicating if the file
 | |
| 1030 |     can be accessed by that path.
 | |
| 1031 |     """
 | |
| 1032 | ||
| 3201.1.1
by jameinel Fix bug #185458, switch from NFKC to NFC and add tests for filenames that would be broken under NFKC | 1033 | return unicodedata.normalize('NFC', unicode(path)), True | 
| 1830.3.1
by John Arbash Meinel Change the return value of unicode_filename, and make it testable on all platforms | 1034 | |
| 1035 | ||
| 1830.3.2
by John Arbash Meinel normalized_filename is a much better name | 1036 | def _inaccessible_normalized_filename(path): | 
| 1037 | __doc__ = _accessible_normalized_filename.__doc__ | |
| 1830.3.1
by John Arbash Meinel Change the return value of unicode_filename, and make it testable on all platforms | 1038 | |
| 3201.1.1
by jameinel Fix bug #185458, switch from NFKC to NFC and add tests for filenames that would be broken under NFKC | 1039 | normalized = unicodedata.normalize('NFC', unicode(path)) | 
| 1830.3.1
by John Arbash Meinel Change the return value of unicode_filename, and make it testable on all platforms | 1040 | return normalized, normalized == path | 
| 1041 | ||
| 1042 | ||
| 1185.85.75
by John Arbash Meinel Adding bzrlib.osutils.unicode_filename to handle unicode normalization for file paths. | 1043 | if _platform_normalizes_filenames: | 
| 1830.3.2
by John Arbash Meinel normalized_filename is a much better name | 1044 | normalized_filename = _accessible_normalized_filename | 
| 1185.85.75
by John Arbash Meinel Adding bzrlib.osutils.unicode_filename to handle unicode normalization for file paths. | 1045 | else: | 
| 1830.3.2
by John Arbash Meinel normalized_filename is a much better name | 1046 | normalized_filename = _inaccessible_normalized_filename | 
| 1185.85.75
by John Arbash Meinel Adding bzrlib.osutils.unicode_filename to handle unicode normalization for file paths. | 1047 | |
| 1048 | ||
| 1185.33.60
by Martin Pool Use full terminal width for verbose test output. | 1049 | def terminal_width(): | 
| 1050 | """Return estimated terminal width.""" | |
| 1704.2.3
by Martin Pool (win32) Detect terminal width using GetConsoleScreenBufferInfo (Alexander) | 1051 | if sys.platform == 'win32': | 
| 2245.4.6
by Alexander Belchenko osutils.py: terminal_width() now use win32utils.get_console_size() | 1052 | return win32utils.get_console_size()[0] | 
| 1704.2.2
by Martin Pool Detect terminal width using ioctl | 1053 | width = 0 | 
| 1185.33.60
by Martin Pool Use full terminal width for verbose test output. | 1054 | try: | 
| 1704.2.2
by Martin Pool Detect terminal width using ioctl | 1055 | import struct, fcntl, termios | 
| 1056 | s = struct.pack('HHHH', 0, 0, 0, 0) | |
| 1057 | x = fcntl.ioctl(1, termios.TIOCGWINSZ, s) | |
| 1058 | width = struct.unpack('HHHH', x)[1] | |
| 1059 | except IOError: | |
| 1060 |         pass
 | |
| 1061 | if width <= 0: | |
| 1062 | try: | |
| 1063 | width = int(os.environ['COLUMNS']) | |
| 1064 | except: | |
| 1065 |             pass
 | |
| 1066 | if width <= 0: | |
| 1067 | width = 80 | |
| 1068 | ||
| 1069 | return width | |
| 1534.7.25
by Aaron Bentley Added set_executability | 1070 | |
| 1963.1.5
by John Arbash Meinel Create an osutils helper function for modifying the environment | 1071 | |
| 1534.7.25
by Aaron Bentley Added set_executability | 1072 | def supports_executable(): | 
| 1534.7.160
by Aaron Bentley Changed implementation of supports_executable | 1073 | return sys.platform != "win32" | 
| 1551.2.53
by abentley Strip trailing slashes in a platform-sensible way | 1074 | |
| 1075 | ||
| 1551.10.4
by Aaron Bentley Update to skip on win32 | 1076 | def supports_posix_readonly(): | 
| 1077 | """Return True if 'readonly' has POSIX semantics, False otherwise. | |
| 1078 | ||
| 1079 |     Notably, a win32 readonly file cannot be deleted, unlike POSIX where the
 | |
| 1080 |     directory controls creation/deletion, etc.
 | |
| 1081 | ||
| 1082 |     And under win32, readonly means that the directory itself cannot be
 | |
| 1083 |     deleted.  The contents of a readonly directory can be changed, unlike POSIX
 | |
| 1084 |     where files in readonly directories cannot be added, deleted or renamed.
 | |
| 1085 |     """
 | |
| 1086 | return sys.platform != "win32" | |
| 1087 | ||
| 1088 | ||
| 1963.1.5
by John Arbash Meinel Create an osutils helper function for modifying the environment | 1089 | def set_or_unset_env(env_variable, value): | 
| 1090 | """Modify the environment, setting or removing the env_variable. | |
| 1091 | ||
| 1092 |     :param env_variable: The environment variable in question
 | |
| 1093 |     :param value: The value to set the environment to. If None, then
 | |
| 1094 |         the variable will be removed.
 | |
| 1095 |     :return: The original value of the environment variable.
 | |
| 1096 |     """
 | |
| 1097 | orig_val = os.environ.get(env_variable) | |
| 1098 | if value is None: | |
| 1099 | if orig_val is not None: | |
| 1100 | del os.environ[env_variable] | |
| 1101 | else: | |
| 1102 | if isinstance(value, unicode): | |
| 1103 | value = value.encode(bzrlib.user_encoding) | |
| 1104 | os.environ[env_variable] = value | |
| 1105 | return orig_val | |
| 1106 | ||
| 1107 | ||
| 1551.2.56
by Aaron Bentley Better illegal pathname check for Windows | 1108 | _validWin32PathRE = re.compile(r'^([A-Za-z]:[/\\])?[^:<>*"?\|]*$') | 
| 1109 | ||
| 1110 | ||
| 1111 | def check_legal_path(path): | |
| 1112 | """Check whether the supplied path is legal. | |
| 1113 |     This is only required on Windows, so we don't test on other platforms
 | |
| 1114 |     right now.
 | |
| 1115 |     """
 | |
| 1116 | if sys.platform != "win32": | |
| 1117 |         return
 | |
| 1118 | if _validWin32PathRE.match(path) is None: | |
| 1996.3.25
by John Arbash Meinel Make importing errors lazy for osutils | 1119 | raise errors.IllegalPath(path) | 
| 1753.1.1
by Robert Collins (rbc, jam, mbp)Add bzrlib.osutils.walkdirs, an optimised walk-and-stat routine. | 1120 | |
| 1121 | ||
| 3596.2.2
by John Arbash Meinel Factor out the common exception handling looking for ENOTDIR and use it | 1122 | _WIN32_ERROR_DIRECTORY = 267 # Similar to errno.ENOTDIR | 
| 1123 | ||
| 1124 | def _is_error_enotdir(e): | |
| 1125 | """Check if this exception represents ENOTDIR. | |
| 1126 | ||
| 1127 |     Unfortunately, python is very inconsistent about the exception
 | |
| 1128 |     here. The cases are:
 | |
| 1129 |       1) Linux, Mac OSX all versions seem to set errno == ENOTDIR
 | |
| 1130 |       2) Windows, Python2.4, uses errno == ERROR_DIRECTORY (267)
 | |
| 1131 |          which is the windows error code.
 | |
| 1132 |       3) Windows, Python2.5 uses errno == EINVAL and
 | |
| 1133 |          winerror == ERROR_DIRECTORY
 | |
| 1134 | ||
| 1135 |     :param e: An Exception object (expected to be OSError with an errno
 | |
| 1136 |         attribute, but we should be able to cope with anything)
 | |
| 1137 |     :return: True if this represents an ENOTDIR error. False otherwise.
 | |
| 1138 |     """
 | |
| 1139 | en = getattr(e, 'errno', None) | |
| 1140 | if (en == errno.ENOTDIR | |
| 1141 | or (sys.platform == 'win32' | |
| 1142 | and (en == _WIN32_ERROR_DIRECTORY | |
| 1143 | or (en == errno.EINVAL | |
| 1144 | and getattr(e, 'winerror', None) == _WIN32_ERROR_DIRECTORY) | |
| 1145 |         ))):
 | |
| 1146 | return True | |
| 1147 | return False | |
| 1148 | ||
| 1149 | ||
| 1757.2.8
by Robert Collins Teach walkdirs to walk a subdir of a tree. | 1150 | def walkdirs(top, prefix=""): | 
| 1753.1.1
by Robert Collins (rbc, jam, mbp)Add bzrlib.osutils.walkdirs, an optimised walk-and-stat routine. | 1151 | """Yield data about all the directories in a tree. | 
| 1152 |     
 | |
| 1153 |     This yields all the data about the contents of a directory at a time.
 | |
| 1154 |     After each directory has been yielded, if the caller has mutated the list
 | |
| 1155 |     to exclude some directories, they are then not descended into.
 | |
| 1156 |     
 | |
| 1157 |     The data yielded is of the form:
 | |
| 1897.1.2
by Robert Collins cleanup osutils.walkdirs changes after review. | 1158 |     ((directory-relpath, directory-path-from-top),
 | 
| 2694.4.1
by Alexander Belchenko trivial fix for docstring of osutils.walkdirs() | 1159 |     [(relpath, basename, kind, lstat, path-from-top), ...]),
 | 
| 1897.1.2
by Robert Collins cleanup osutils.walkdirs changes after review. | 1160 |      - directory-relpath is the relative path of the directory being returned
 | 
| 1161 |        with respect to top. prefix is prepended to this.
 | |
| 1162 |      - directory-path-from-root is the path including top for this directory. 
 | |
| 1163 |        It is suitable for use with os functions.
 | |
| 1897.1.1
by Robert Collins Add some useful summary data to osutils.walkdirs output. | 1164 |      - relpath is the relative path within the subtree being walked.
 | 
| 1165 |      - basename is the basename of the path
 | |
| 1897.1.2
by Robert Collins cleanup osutils.walkdirs changes after review. | 1166 |      - kind is the kind of the file now. If unknown then the file is not
 | 
| 1897.1.1
by Robert Collins Add some useful summary data to osutils.walkdirs output. | 1167 |        present within the tree - but it may be recorded as versioned. See
 | 
| 1168 |        versioned_kind.
 | |
| 1169 |      - lstat is the stat data *if* the file was statted.
 | |
| 1170 |      - planned, not implemented: 
 | |
| 1171 |        path_from_tree_root is the path from the root of the tree.
 | |
| 1753.1.1
by Robert Collins (rbc, jam, mbp)Add bzrlib.osutils.walkdirs, an optimised walk-and-stat routine. | 1172 | |
| 1757.2.16
by Robert Collins Review comments. | 1173 |     :param prefix: Prefix the relpaths that are yielded with 'prefix'. This 
 | 
| 1174 |         allows one to walk a subtree but get paths that are relative to a tree
 | |
| 1175 |         rooted higher up.
 | |
| 1753.1.1
by Robert Collins (rbc, jam, mbp)Add bzrlib.osutils.walkdirs, an optimised walk-and-stat routine. | 1176 |     :return: an iterator over the dirs.
 | 
| 1177 |     """
 | |
| 1897.1.1
by Robert Collins Add some useful summary data to osutils.walkdirs output. | 1178 |     #TODO there is a bit of a smell where the results of the directory-
 | 
| 1179 |     # summary in this, and the path from the root, may not agree 
 | |
| 1180 |     # depending on top and prefix - i.e. ./foo and foo as a pair leads to
 | |
| 1181 |     # potentially confusing output. We should make this more robust - but
 | |
| 1897.1.2
by Robert Collins cleanup osutils.walkdirs changes after review. | 1182 |     # not at a speed cost. RBC 20060731
 | 
| 2255.7.33
by John Arbash Meinel More inner loop tuning of walkdirs, can save as much as 5% | 1183 | _lstat = os.lstat | 
| 1753.1.1
by Robert Collins (rbc, jam, mbp)Add bzrlib.osutils.walkdirs, an optimised walk-and-stat routine. | 1184 | _directory = _directory_kind | 
| 1996.3.14
by John Arbash Meinel lazy_import osutils and sign_my_commits | 1185 | _listdir = os.listdir | 
| 2255.7.33
by John Arbash Meinel More inner loop tuning of walkdirs, can save as much as 5% | 1186 | _kind_from_mode = _formats.get | 
| 2255.7.32
by John Arbash Meinel Add tests that the walkdirs variants work on unicode paths. | 1187 | pending = [(safe_unicode(prefix), "", _directory, None, safe_unicode(top))] | 
| 1753.1.1
by Robert Collins (rbc, jam, mbp)Add bzrlib.osutils.walkdirs, an optimised walk-and-stat routine. | 1188 | while pending: | 
| 1189 |         # 0 - relpath, 1- basename, 2- kind, 3- stat, 4-toppath
 | |
| 2255.7.33
by John Arbash Meinel More inner loop tuning of walkdirs, can save as much as 5% | 1190 | relroot, _, _, _, top = pending.pop() | 
| 2255.7.32
by John Arbash Meinel Add tests that the walkdirs variants work on unicode paths. | 1191 | if relroot: | 
| 1192 | relprefix = relroot + u'/' | |
| 1753.1.1
by Robert Collins (rbc, jam, mbp)Add bzrlib.osutils.walkdirs, an optimised walk-and-stat routine. | 1193 | else: | 
| 2255.7.33
by John Arbash Meinel More inner loop tuning of walkdirs, can save as much as 5% | 1194 | relprefix = '' | 
| 2255.7.32
by John Arbash Meinel Add tests that the walkdirs variants work on unicode paths. | 1195 | top_slash = top + u'/' | 
| 2255.7.33
by John Arbash Meinel More inner loop tuning of walkdirs, can save as much as 5% | 1196 | |
| 1197 | dirblock = [] | |
| 1198 | append = dirblock.append | |
| 3585.2.4
by Robert Collins * Deleting directories by hand before running ``bzr rm`` will not | 1199 | try: | 
| 1200 | names = sorted(_listdir(top)) | |
| 3596.2.2
by John Arbash Meinel Factor out the common exception handling looking for ENOTDIR and use it | 1201 | except OSError, e: | 
| 1202 | if not _is_error_enotdir(e): | |
| 3585.2.4
by Robert Collins * Deleting directories by hand before running ``bzr rm`` will not | 1203 |                 raise
 | 
| 1204 | else: | |
| 1205 | for name in names: | |
| 1206 | abspath = top_slash + name | |
| 1207 | statvalue = _lstat(abspath) | |
| 1208 | kind = _kind_from_mode(statvalue.st_mode & 0170000, 'unknown') | |
| 1209 | append((relprefix + name, name, kind, statvalue, abspath)) | |
| 2255.7.32
by John Arbash Meinel Add tests that the walkdirs variants work on unicode paths. | 1210 | yield (relroot, top), dirblock | 
| 2255.7.33
by John Arbash Meinel More inner loop tuning of walkdirs, can save as much as 5% | 1211 | |
| 1753.1.1
by Robert Collins (rbc, jam, mbp)Add bzrlib.osutils.walkdirs, an optimised walk-and-stat routine. | 1212 |         # push the user specified dirs from dirblock
 | 
| 2255.7.32
by John Arbash Meinel Add tests that the walkdirs variants work on unicode paths. | 1213 | pending.extend(d for d in reversed(dirblock) if d[2] == _directory) | 
| 1773.3.1
by Robert Collins Add path_prefix_key and compare_paths_prefix_order utility functions. | 1214 | |
| 1215 | ||
| 3557.2.3
by John Arbash Meinel Change the logic for selecting a real _walkdirs_utf8 implementation, | 1216 | _real_walkdirs_utf8 = None | 
| 1217 | ||
| 2255.7.27
by John Arbash Meinel Add a _walkdirs_utf8 which returns utf8 paths instead of Unicode. Approx 20% faster in walking utf8 filesystems | 1218 | def _walkdirs_utf8(top, prefix=""): | 
| 1219 | """Yield data about all the directories in a tree. | |
| 1220 | ||
| 1221 |     This yields the same information as walkdirs() only each entry is yielded
 | |
| 1222 |     in utf-8. On platforms which have a filesystem encoding of utf8 the paths
 | |
| 1223 |     are returned as exact byte-strings.
 | |
| 2255.7.32
by John Arbash Meinel Add tests that the walkdirs variants work on unicode paths. | 1224 | |
| 1225 |     :return: yields a tuple of (dir_info, [file_info])
 | |
| 1226 |         dir_info is (utf8_relpath, path-from-top)
 | |
| 1227 |         file_info is (utf8_relpath, utf8_name, kind, lstat, path-from-top)
 | |
| 1228 |         if top is an absolute path, path-from-top is also an absolute path.
 | |
| 1229 |         path-from-top might be unicode or utf8, but it is the correct path to
 | |
| 1230 |         pass to os functions to affect the file in question. (such as os.lstat)
 | |
| 1231 |     """
 | |
| 3557.2.3
by John Arbash Meinel Change the logic for selecting a real _walkdirs_utf8 implementation, | 1232 | global _real_walkdirs_utf8 | 
| 1233 | if _real_walkdirs_utf8 is None: | |
| 1234 | fs_encoding = _fs_enc.upper() | |
| 3557.2.6
by John Arbash Meinel Switch from os.name to bzrlib.win32utils.winver. | 1235 | if win32utils.winver == 'Windows NT': | 
| 3557.2.4
by John Arbash Meinel Cleanup the tests a bit, and add a test that we downgrade if os.name isn't 'nt' | 1236 |             # Win98 doesn't have unicode apis like FindFirstFileW
 | 
| 1237 |             # TODO: We possibly could support Win98 by falling back to the
 | |
| 1238 |             #       original FindFirstFile, and using TCHAR instead of WCHAR,
 | |
| 1239 |             #       but that gets a bit tricky, and requires custom compiling
 | |
| 1240 |             #       for win98 anyway.
 | |
| 3557.2.3
by John Arbash Meinel Change the logic for selecting a real _walkdirs_utf8 implementation, | 1241 | try: | 
| 1242 | from bzrlib._walkdirs_win32 import _walkdirs_utf8_win32_find_file | |
| 1243 | except ImportError: | |
| 1244 | _real_walkdirs_utf8 = _walkdirs_unicode_to_utf8 | |
| 1245 | else: | |
| 1246 | _real_walkdirs_utf8 = _walkdirs_utf8_win32_find_file | |
| 1247 | elif fs_encoding not in ('UTF-8', 'US-ASCII', 'ANSI_X3.4-1968'): | |
| 1248 |             # ANSI_X3.4-1968 is a form of ASCII
 | |
| 1249 | _real_walkdirs_utf8 = _walkdirs_unicode_to_utf8 | |
| 3504.4.5
by John Arbash Meinel Add tests to ensure that you can skip subdirs, start exposing the function. | 1250 | else: | 
| 3557.2.3
by John Arbash Meinel Change the logic for selecting a real _walkdirs_utf8 implementation, | 1251 | _real_walkdirs_utf8 = _walkdirs_fs_utf8 | 
| 1252 | return _real_walkdirs_utf8(top, prefix=prefix) | |
| 2255.7.32
by John Arbash Meinel Add tests that the walkdirs variants work on unicode paths. | 1253 | |
| 1254 | ||
| 1255 | def _walkdirs_fs_utf8(top, prefix=""): | |
| 1256 | """See _walkdirs_utf8. | |
| 1257 | ||
| 1258 |     This sub-function is called when we know the filesystem is already in utf8
 | |
| 1259 |     encoding. So we don't need to transcode filenames.
 | |
| 2255.7.27
by John Arbash Meinel Add a _walkdirs_utf8 which returns utf8 paths instead of Unicode. Approx 20% faster in walking utf8 filesystems | 1260 |     """
 | 
| 1261 | _lstat = os.lstat | |
| 1262 | _directory = _directory_kind | |
| 1263 | _listdir = os.listdir | |
| 2255.7.33
by John Arbash Meinel More inner loop tuning of walkdirs, can save as much as 5% | 1264 | _kind_from_mode = _formats.get | 
| 2255.7.27
by John Arbash Meinel Add a _walkdirs_utf8 which returns utf8 paths instead of Unicode. Approx 20% faster in walking utf8 filesystems | 1265 | |
| 2255.7.33
by John Arbash Meinel More inner loop tuning of walkdirs, can save as much as 5% | 1266 |     # 0 - relpath, 1- basename, 2- kind, 3- stat, 4-toppath
 | 
| 1267 |     # But we don't actually uses 1-3 in pending, so set them to None
 | |
| 1268 | pending = [(safe_utf8(prefix), None, None, None, safe_utf8(top))] | |
| 2255.7.27
by John Arbash Meinel Add a _walkdirs_utf8 which returns utf8 paths instead of Unicode. Approx 20% faster in walking utf8 filesystems | 1269 | while pending: | 
| 2255.7.33
by John Arbash Meinel More inner loop tuning of walkdirs, can save as much as 5% | 1270 | relroot, _, _, _, top = pending.pop() | 
| 1271 | if relroot: | |
| 1272 | relprefix = relroot + '/' | |
| 2255.7.27
by John Arbash Meinel Add a _walkdirs_utf8 which returns utf8 paths instead of Unicode. Approx 20% faster in walking utf8 filesystems | 1273 | else: | 
| 2255.7.33
by John Arbash Meinel More inner loop tuning of walkdirs, can save as much as 5% | 1274 | relprefix = '' | 
| 2255.7.27
by John Arbash Meinel Add a _walkdirs_utf8 which returns utf8 paths instead of Unicode. Approx 20% faster in walking utf8 filesystems | 1275 | top_slash = top + '/' | 
| 2255.7.33
by John Arbash Meinel More inner loop tuning of walkdirs, can save as much as 5% | 1276 | |
| 2255.7.27
by John Arbash Meinel Add a _walkdirs_utf8 which returns utf8 paths instead of Unicode. Approx 20% faster in walking utf8 filesystems | 1277 | dirblock = [] | 
| 2255.7.33
by John Arbash Meinel More inner loop tuning of walkdirs, can save as much as 5% | 1278 | append = dirblock.append | 
| 2255.7.27
by John Arbash Meinel Add a _walkdirs_utf8 which returns utf8 paths instead of Unicode. Approx 20% faster in walking utf8 filesystems | 1279 | for name in sorted(_listdir(top)): | 
| 1280 | abspath = top_slash + name | |
| 1281 | statvalue = _lstat(abspath) | |
| 2255.7.33
by John Arbash Meinel More inner loop tuning of walkdirs, can save as much as 5% | 1282 | kind = _kind_from_mode(statvalue.st_mode & 0170000, 'unknown') | 
| 1283 | append((relprefix + name, name, kind, statvalue, abspath)) | |
| 2255.7.32
by John Arbash Meinel Add tests that the walkdirs variants work on unicode paths. | 1284 | yield (relroot, top), dirblock | 
| 2255.7.33
by John Arbash Meinel More inner loop tuning of walkdirs, can save as much as 5% | 1285 | |
| 2255.7.32
by John Arbash Meinel Add tests that the walkdirs variants work on unicode paths. | 1286 |         # push the user specified dirs from dirblock
 | 
| 2255.7.33
by John Arbash Meinel More inner loop tuning of walkdirs, can save as much as 5% | 1287 | pending.extend(d for d in reversed(dirblock) if d[2] == _directory) | 
| 2255.7.32
by John Arbash Meinel Add tests that the walkdirs variants work on unicode paths. | 1288 | |
| 1289 | ||
| 1290 | def _walkdirs_unicode_to_utf8(top, prefix=""): | |
| 1291 | """See _walkdirs_utf8 | |
| 1292 | ||
| 1293 |     Because Win32 has a Unicode api, all of the 'path-from-top' entries will be
 | |
| 1294 |     Unicode paths.
 | |
| 1295 |     This is currently the fallback code path when the filesystem encoding is
 | |
| 1296 |     not UTF-8. It may be better to implement an alternative so that we can
 | |
| 1297 |     safely handle paths that are not properly decodable in the current
 | |
| 1298 |     encoding.
 | |
| 1299 |     """
 | |
| 1300 | _utf8_encode = codecs.getencoder('utf8') | |
| 1301 | _lstat = os.lstat | |
| 1302 | _directory = _directory_kind | |
| 1303 | _listdir = os.listdir | |
| 2255.7.33
by John Arbash Meinel More inner loop tuning of walkdirs, can save as much as 5% | 1304 | _kind_from_mode = _formats.get | 
| 2255.7.32
by John Arbash Meinel Add tests that the walkdirs variants work on unicode paths. | 1305 | |
| 2255.7.33
by John Arbash Meinel More inner loop tuning of walkdirs, can save as much as 5% | 1306 | pending = [(safe_utf8(prefix), None, None, None, safe_unicode(top))] | 
| 2255.7.32
by John Arbash Meinel Add tests that the walkdirs variants work on unicode paths. | 1307 | while pending: | 
| 2255.7.33
by John Arbash Meinel More inner loop tuning of walkdirs, can save as much as 5% | 1308 | relroot, _, _, _, top = pending.pop() | 
| 1309 | if relroot: | |
| 1310 | relprefix = relroot + '/' | |
| 2255.7.32
by John Arbash Meinel Add tests that the walkdirs variants work on unicode paths. | 1311 | else: | 
| 2255.7.33
by John Arbash Meinel More inner loop tuning of walkdirs, can save as much as 5% | 1312 | relprefix = '' | 
| 2255.7.32
by John Arbash Meinel Add tests that the walkdirs variants work on unicode paths. | 1313 | top_slash = top + u'/' | 
| 2255.7.33
by John Arbash Meinel More inner loop tuning of walkdirs, can save as much as 5% | 1314 | |
| 2255.7.32
by John Arbash Meinel Add tests that the walkdirs variants work on unicode paths. | 1315 | dirblock = [] | 
| 2255.7.33
by John Arbash Meinel More inner loop tuning of walkdirs, can save as much as 5% | 1316 | append = dirblock.append | 
| 2255.7.32
by John Arbash Meinel Add tests that the walkdirs variants work on unicode paths. | 1317 | for name in sorted(_listdir(top)): | 
| 1318 | name_utf8 = _utf8_encode(name)[0] | |
| 1319 | abspath = top_slash + name | |
| 1320 | statvalue = _lstat(abspath) | |
| 2255.7.33
by John Arbash Meinel More inner loop tuning of walkdirs, can save as much as 5% | 1321 | kind = _kind_from_mode(statvalue.st_mode & 0170000, 'unknown') | 
| 1322 | append((relprefix + name_utf8, name_utf8, kind, statvalue, abspath)) | |
| 2255.7.27
by John Arbash Meinel Add a _walkdirs_utf8 which returns utf8 paths instead of Unicode. Approx 20% faster in walking utf8 filesystems | 1323 | yield (relroot, top), dirblock | 
| 2255.7.33
by John Arbash Meinel More inner loop tuning of walkdirs, can save as much as 5% | 1324 | |
| 2255.7.27
by John Arbash Meinel Add a _walkdirs_utf8 which returns utf8 paths instead of Unicode. Approx 20% faster in walking utf8 filesystems | 1325 |         # push the user specified dirs from dirblock
 | 
| 2255.7.33
by John Arbash Meinel More inner loop tuning of walkdirs, can save as much as 5% | 1326 | pending.extend(d for d in reversed(dirblock) if d[2] == _directory) | 
| 2255.7.27
by John Arbash Meinel Add a _walkdirs_utf8 which returns utf8 paths instead of Unicode. Approx 20% faster in walking utf8 filesystems | 1327 | |
| 1328 | ||
| 1907.3.2
by John Arbash Meinel Updated the copy_tree function to allow overriding functionality. | 1329 | def copy_tree(from_path, to_path, handlers={}): | 
| 1907.3.1
by John Arbash Meinel create a copy_tree wrapper around walkdirs() | 1330 | """Copy all of the entries in from_path into to_path. | 
| 1331 | ||
| 1332 |     :param from_path: The base directory to copy. 
 | |
| 1333 |     :param to_path: The target directory. If it does not exist, it will
 | |
| 1334 |         be created.
 | |
| 1907.3.2
by John Arbash Meinel Updated the copy_tree function to allow overriding functionality. | 1335 |     :param handlers: A dictionary of functions, which takes a source and
 | 
| 1336 |         destinations for files, directories, etc.
 | |
| 1337 |         It is keyed on the file kind, such as 'directory', 'symlink', or 'file'
 | |
| 1338 |         'file', 'directory', and 'symlink' should always exist.
 | |
| 1339 |         If they are missing, they will be replaced with 'os.mkdir()',
 | |
| 1340 |         'os.readlink() + os.symlink()', and 'shutil.copy2()', respectively.
 | |
| 1907.3.1
by John Arbash Meinel create a copy_tree wrapper around walkdirs() | 1341 |     """
 | 
| 1342 |     # Now, just copy the existing cached tree to the new location
 | |
| 1343 |     # We use a cheap trick here.
 | |
| 1344 |     # Absolute paths are prefixed with the first parameter
 | |
| 1345 |     # relative paths are prefixed with the second.
 | |
| 1346 |     # So we can get both the source and target returned
 | |
| 1347 |     # without any extra work.
 | |
| 1348 | ||
| 1907.3.2
by John Arbash Meinel Updated the copy_tree function to allow overriding functionality. | 1349 | def copy_dir(source, dest): | 
| 1350 | os.mkdir(dest) | |
| 1351 | ||
| 1352 | def copy_link(source, dest): | |
| 1353 | """Copy the contents of a symlink""" | |
| 1354 | link_to = os.readlink(source) | |
| 1355 | os.symlink(link_to, dest) | |
| 1356 | ||
| 1357 | real_handlers = {'file':shutil.copy2, | |
| 1358 | 'symlink':copy_link, | |
| 1359 | 'directory':copy_dir, | |
| 1360 |                     }
 | |
| 1361 | real_handlers.update(handlers) | |
| 1362 | ||
| 1907.3.1
by John Arbash Meinel create a copy_tree wrapper around walkdirs() | 1363 | if not os.path.exists(to_path): | 
| 1907.3.2
by John Arbash Meinel Updated the copy_tree function to allow overriding functionality. | 1364 | real_handlers['directory'](from_path, to_path) | 
| 1907.3.1
by John Arbash Meinel create a copy_tree wrapper around walkdirs() | 1365 | |
| 1366 | for dir_info, entries in walkdirs(from_path, prefix=to_path): | |
| 1367 | for relpath, name, kind, st, abspath in entries: | |
| 1907.3.2
by John Arbash Meinel Updated the copy_tree function to allow overriding functionality. | 1368 | real_handlers[kind](abspath, relpath) | 
| 1907.3.1
by John Arbash Meinel create a copy_tree wrapper around walkdirs() | 1369 | |
| 1370 | ||
| 1773.3.1
by Robert Collins Add path_prefix_key and compare_paths_prefix_order utility functions. | 1371 | def path_prefix_key(path): | 
| 1372 | """Generate a prefix-order path key for path. | |
| 1373 | ||
| 1374 |     This can be used to sort paths in the same way that walkdirs does.
 | |
| 1375 |     """
 | |
| 1773.3.2
by Robert Collins New corner case from John Meinel, showing up the need to check the directory lexographically outside of a single tree's root. Fixed. | 1376 | return (dirname(path) , path) | 
| 1773.3.1
by Robert Collins Add path_prefix_key and compare_paths_prefix_order utility functions. | 1377 | |
| 1378 | ||
| 1379 | def compare_paths_prefix_order(path_a, path_b): | |
| 1380 | """Compare path_a and path_b to generate the same order walkdirs uses.""" | |
| 1381 | key_a = path_prefix_key(path_a) | |
| 1382 | key_b = path_prefix_key(path_b) | |
| 1383 | return cmp(key_a, key_b) | |
| 1955.2.2
by John Arbash Meinel Change the name of the test classes (test_lang => test_locale), move the function into osutils.py | 1384 | |
| 1385 | ||
| 1386 | _cached_user_encoding = None | |
| 1387 | ||
| 1388 | ||
| 2192.1.3
by Alexander Belchenko Tests for osutils.get_user_encoding | 1389 | def get_user_encoding(use_cache=True): | 
| 1955.2.2
by John Arbash Meinel Change the name of the test classes (test_lang => test_locale), move the function into osutils.py | 1390 | """Find out what the preferred user encoding is. | 
| 1391 | ||
| 1392 |     This is generally the encoding that is used for command line parameters
 | |
| 1393 |     and file contents. This may be different from the terminal encoding
 | |
| 1394 |     or the filesystem encoding.
 | |
| 1395 | ||
| 2192.1.3
by Alexander Belchenko Tests for osutils.get_user_encoding | 1396 |     :param  use_cache:  Enable cache for detected encoding.
 | 
| 1397 |                         (This parameter is turned on by default,
 | |
| 1398 |                         and required only for selftesting)
 | |
| 1399 | ||
| 1955.2.2
by John Arbash Meinel Change the name of the test classes (test_lang => test_locale), move the function into osutils.py | 1400 |     :return: A string defining the preferred user encoding
 | 
| 1401 |     """
 | |
| 1402 | global _cached_user_encoding | |
| 2192.1.3
by Alexander Belchenko Tests for osutils.get_user_encoding | 1403 | if _cached_user_encoding is not None and use_cache: | 
| 1955.2.2
by John Arbash Meinel Change the name of the test classes (test_lang => test_locale), move the function into osutils.py | 1404 | return _cached_user_encoding | 
| 1405 | ||
| 1406 | if sys.platform == 'darwin': | |
| 1407 |         # work around egregious python 2.4 bug
 | |
| 1408 | sys.platform = 'posix' | |
| 1409 | try: | |
| 1410 | import locale | |
| 1411 | finally: | |
| 1412 | sys.platform = 'darwin' | |
| 1413 | else: | |
| 1414 | import locale | |
| 1415 | ||
| 1416 | try: | |
| 2192.1.3
by Alexander Belchenko Tests for osutils.get_user_encoding | 1417 | user_encoding = locale.getpreferredencoding() | 
| 1955.2.2
by John Arbash Meinel Change the name of the test classes (test_lang => test_locale), move the function into osutils.py | 1418 | except locale.Error, e: | 
| 1955.2.3
by John Arbash Meinel Change error message text | 1419 | sys.stderr.write('bzr: warning: %s\n' | 
| 2001.2.1
by Jelmer Vernooij Fix typo in encoding warning. | 1420 | ' Could not determine what text encoding to use.\n' | 
| 1955.2.3
by John Arbash Meinel Change error message text | 1421 | ' This error usually means your Python interpreter\n' | 
| 1422 | ' doesn\'t support the locale set by $LANG (%s)\n' | |
| 1423 | " Continuing with ascii encoding.\n" | |
| 1955.2.2
by John Arbash Meinel Change the name of the test classes (test_lang => test_locale), move the function into osutils.py | 1424 | % (e, os.environ.get('LANG'))) | 
| 2192.1.7
by Alexander Belchenko get_user_encoding: if locale.Error raised we need to set user_encoding to 'ascii' as warning says | 1425 | user_encoding = 'ascii' | 
| 1955.2.2
by John Arbash Meinel Change the name of the test classes (test_lang => test_locale), move the function into osutils.py | 1426 | |
| 2127.4.1
by Alexander Belchenko (jam, bialix) Workaround for cp0 console encoding on Windows | 1427 |     # Windows returns 'cp0' to indicate there is no code page. So we'll just
 | 
| 1428 |     # treat that as ASCII, and not support printing unicode characters to the
 | |
| 1429 |     # console.
 | |
| 3405.3.1
by Neil Martinsen-Burrell accept for an encoding to mean ascii | 1430 |     #
 | 
| 1431 |     # For python scripts run under vim, we get '', so also treat that as ASCII
 | |
| 1432 | if user_encoding in (None, 'cp0', ''): | |
| 2192.1.3
by Alexander Belchenko Tests for osutils.get_user_encoding | 1433 | user_encoding = 'ascii' | 
| 2192.1.1
by Alexander Belchenko Before actually using encoding need to check that Python has corresponding codec | 1434 | else: | 
| 1435 |         # check encoding
 | |
| 1436 | try: | |
| 2192.1.3
by Alexander Belchenko Tests for osutils.get_user_encoding | 1437 | codecs.lookup(user_encoding) | 
| 2192.1.1
by Alexander Belchenko Before actually using encoding need to check that Python has corresponding codec | 1438 | except LookupError: | 
| 1439 | sys.stderr.write('bzr: warning:' | |
| 1440 | ' unknown encoding %s.' | |
| 1441 | ' Continuing with ascii encoding.\n' | |
| 2192.1.3
by Alexander Belchenko Tests for osutils.get_user_encoding | 1442 | % user_encoding | 
| 2192.1.1
by Alexander Belchenko Before actually using encoding need to check that Python has corresponding codec | 1443 |                             )
 | 
| 2192.1.3
by Alexander Belchenko Tests for osutils.get_user_encoding | 1444 | user_encoding = 'ascii' | 
| 1445 | ||
| 1446 | if use_cache: | |
| 1447 | _cached_user_encoding = user_encoding | |
| 1448 | ||
| 1449 | return user_encoding | |
| 2091.1.1
by Martin Pool Avoid MSG_WAITALL as it doesn't work on Windows | 1450 | |
| 1451 | ||
| 1452 | def recv_all(socket, bytes): | |
| 1453 | """Receive an exact number of bytes. | |
| 1454 | ||
| 1455 |     Regular Socket.recv() may return less than the requested number of bytes,
 | |
| 1456 |     dependning on what's in the OS buffer.  MSG_WAITALL is not available
 | |
| 1457 |     on all platforms, but this should work everywhere.  This will return
 | |
| 1458 |     less than the requested amount if the remote end closes.
 | |
| 1459 | ||
| 1460 |     This isn't optimized and is intended mostly for use in testing.
 | |
| 1461 |     """
 | |
| 1462 | b = '' | |
| 1463 | while len(b) < bytes: | |
| 1464 | new = socket.recv(bytes - len(b)) | |
| 1465 | if new == '': | |
| 1466 | break # eof | |
| 1467 | b += new | |
| 1468 | return b | |
| 1469 | ||
| 3118.2.1
by Andrew Bennetts (andrew) Fix #115781 by passing no more than 64k at a time to socket.sendall. | 1470 | |
| 1471 | def send_all(socket, bytes): | |
| 1472 | """Send all bytes on a socket. | |
| 1473 | ||
| 1474 |     Regular socket.sendall() can give socket error 10053 on Windows.  This
 | |
| 1475 |     implementation sends no more than 64k at a time, which avoids this problem.
 | |
| 1476 |     """
 | |
| 1477 | chunk_size = 2**16 | |
| 1478 | for pos in xrange(0, len(bytes), chunk_size): | |
| 1479 | socket.sendall(bytes[pos:pos+chunk_size]) | |
| 1480 | ||
| 1481 | ||
| 2091.3.7
by Aaron Bentley Rename real_parent to dereferenced_path | 1482 | def dereference_path(path): | 
| 1483 | """Determine the real path to a file. | |
| 1484 | ||
| 1485 |     All parent elements are dereferenced.  But the file itself is not
 | |
| 1486 |     dereferenced.
 | |
| 1487 |     :param path: The original path.  May be absolute or relative.
 | |
| 1488 |     :return: the real path *to* the file
 | |
| 1489 |     """
 | |
| 2091.3.5
by Aaron Bentley Move realpath functionality into osutils | 1490 | parent, base = os.path.split(path) | 
| 1491 |     # The pathjoin for '.' is a workaround for Python bug #1213894.
 | |
| 1492 |     # (initial path components aren't dereferenced)
 | |
| 1493 | return pathjoin(realpath(pathjoin('.', parent)), base) | |
| 2681.3.4
by Lukáš Lalinsky - Rename 'windows' to 'mapi' | 1494 | |
| 1495 | ||
| 1496 | def supports_mapi(): | |
| 1497 | """Return True if we can use MAPI to launch a mail client.""" | |
| 1498 | return sys.platform == "win32" | |
| 3089.3.8
by Ian Clatworthy move resource loading into a reusable function | 1499 | |
| 1500 | ||
| 1501 | def resource_string(package, resource_name): | |
| 1502 | """Load a resource from a package and return it as a string. | |
| 1503 | ||
| 1504 |     Note: Only packages that start with bzrlib are currently supported.
 | |
| 1505 | ||
| 1506 |     This is designed to be a lightweight implementation of resource
 | |
| 1507 |     loading in a way which is API compatible with the same API from
 | |
| 1508 |     pkg_resources. See
 | |
| 1509 |     http://peak.telecommunity.com/DevCenter/PkgResources#basic-resource-access.
 | |
| 1510 |     If and when pkg_resources becomes a standard library, this routine
 | |
| 1511 |     can delegate to it.
 | |
| 1512 |     """
 | |
| 1513 |     # Check package name is within bzrlib
 | |
| 1514 | if package == "bzrlib": | |
| 1515 | resource_relpath = resource_name | |
| 1516 | elif package.startswith("bzrlib."): | |
| 1517 | package = package[len("bzrlib."):].replace('.', os.sep) | |
| 1518 | resource_relpath = pathjoin(package, resource_name) | |
| 1519 | else: | |
| 1520 | raise errors.BzrError('resource package %s not in bzrlib' % package) | |
| 1521 | ||
| 1522 |     # Map the resource to a file and read its contents
 | |
| 1523 | base = dirname(bzrlib.__file__) | |
| 1524 | if getattr(sys, 'frozen', None): # bzr.exe | |
| 1525 | base = abspath(pathjoin(base, '..', '..')) | |
| 1526 | filename = pathjoin(base, resource_relpath) | |
| 1527 | return open(filename, 'rU').read() |