/brz/remove-bazaar : revision 3224.5.38

To get this branch, use:

bzr branch
http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar

« back to all changes in this revision

Viewing changes to bzrlib/osutils.py

Committer: Andrew Bennetts
Date: 2008-10-01 05:40:45 UTC
mfrom: (3753 +trunk)
mto: This revision was merged to the branch mainline in revision 3756.
Revision ID: andrew.bennetts@canonical.com-20081001054045-z50qc0d3p9qsc5im

Merge from bzr.dev; resolve osutils.py conflict by reverting my sha import hackery.

files added:
bzrlib/python-compat.h

bzrlib/tests/workingtree_implementations/test_get_file_with_stat.py

doc/developers/lca_tree_merging.txt

files removed:
bzrlib/_walkdirs_win32.h

files renamed:
bzrlib/tests/repository_implementations/ => bzrlib/tests/per_repository/

files modified:
.bzrignore

NEWS

bzr.ico

bzrlib/__init__.py

bzrlib/_btree_serializer_c.pyx

bzrlib/_dirstate_helpers_c.pyx

bzrlib/_dirstate_helpers_py.py

bzrlib/_patiencediff_c.c

bzrlib/_readdir_py.py

bzrlib/_readdir_pyx.pyx

bzrlib/_walkdirs_win32.pyx

bzrlib/annotate.py

bzrlib/branch.py

bzrlib/branchbuilder.py

bzrlib/btree_index.py

bzrlib/builtins.py

bzrlib/bundle/__init__.py

bzrlib/bzrdir.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/directory_service.py

bzrlib/dirstate.py

bzrlib/errors.py

bzrlib/hashcache.py

bzrlib/help_topics/__init__.py

bzrlib/help_topics/en/hooks.txt

bzrlib/hooks.py

bzrlib/index.py

bzrlib/knit.py

bzrlib/lock.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lsprof.py

bzrlib/memorytree.py

bzrlib/merge.py

bzrlib/missing.py

bzrlib/mutabletree.py

bzrlib/osutils.py

bzrlib/remote.py

bzrlib/repofmt/pack_repo.py

bzrlib/repository.py

bzrlib/revisionspec.py

bzrlib/smart/branch.py

bzrlib/smart/client.py

bzrlib/smart/medium.py

bzrlib/smart/message.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/server.py

bzrlib/status.py

bzrlib/testament.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_remove_tree.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_switch.py

bzrlib/tests/branch_implementations/test_break_lock.py

bzrlib/tests/branch_implementations/test_hooks.py

bzrlib/tests/branch_implementations/test_push.py

bzrlib/tests/http_server.py

bzrlib/tests/http_utils.py

bzrlib/tests/intertree_implementations/__init__.py

bzrlib/tests/intertree_implementations/test_compare.py

bzrlib/tests/per_repository/__init__.py

bzrlib/tests/per_repository/helpers.py

bzrlib/tests/per_repository/test__generate_text_key_index.py

bzrlib/tests/per_repository/test_add_fallback_repository.py

bzrlib/tests/per_repository/test_break_lock.py

bzrlib/tests/per_repository/test_check.py

bzrlib/tests/per_repository/test_check_reconcile.py

bzrlib/tests/per_repository/test_commit_builder.py

bzrlib/tests/per_repository/test_fetch.py

bzrlib/tests/per_repository/test_fileid_involved.py

bzrlib/tests/per_repository/test_find_text_key_references.py

bzrlib/tests/per_repository/test_get_parent_map.py

bzrlib/tests/per_repository/test_has_revisions.py

bzrlib/tests/per_repository/test_has_same_location.py

bzrlib/tests/per_repository/test_is_write_locked.py

bzrlib/tests/per_repository/test_iter_reverse_revision_history.py

bzrlib/tests/per_repository/test_pack.py

bzrlib/tests/per_repository/test_reconcile.py

bzrlib/tests/per_repository/test_repository.py

bzrlib/tests/per_repository/test_revision.py

bzrlib/tests/per_repository/test_statistics.py

bzrlib/tests/per_repository/test_write_group.py

bzrlib/tests/per_repository_reference/__init__.py

bzrlib/tests/test__dirstate_helpers.py

bzrlib/tests/test__walkdirs_win32.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_branchbuilder.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_directory_service.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_http.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_memorytree.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_pack_repository.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revisionspec.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_win32utils.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/tree_implementations/__init__.py

bzrlib/tests/tree_implementations/test_inv.py

bzrlib/tests/tree_implementations/test_test_trees.py

bzrlib/tests/tree_implementations/test_tree.py

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_remove.py

bzrlib/tests/workingtree_implementations/test_rename_one.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/trace.py

bzrlib/transform.py

bzrlib/transport/__init__.py

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/wsgi.py

bzrlib/transport/local.py

bzrlib/transport/remote.py

bzrlib/transport/sftp.py

bzrlib/tree.py

bzrlib/tuned_gzip.py

bzrlib/util/configobj/configobj.py

bzrlib/weave.py

bzrlib/win32utils.py

bzrlib/workingtree.py

bzrlib/workingtree_4.py

doc/developers/development-repo.txt

doc/developers/inventory.txt

doc/en/user-guide/http_smart_server.txt

profile_imports.py

setup.py

tools/doc_generate/autodoc_man.py

Show diffs side-by-side

added added

removed removed

bzrlib/osutils.py

splitdrive as _nt_splitdrive,

)

import posixpath

import sha

import shutil

from shutil import (

rmtree,

)

""")

# sha and md5 modules are deprecated in python2.6 but hashlib is available as

# of 2.5

if sys.version_info < (2, 5):

import md5 as _mod_md5

md5 = _mod_md5.new

import sha as _mod_sha

sha = _mod_sha.new

else:

from hashlib import (

md5,

sha1 as sha,

)

import bzrlib

from bzrlib import symbol_versioning

118

130

119

131

_directory_kind = 'directory'

120

132

121

_formats = {

122

stat.S_IFDIR:_directory_kind,

123

stat.S_IFCHR:'chardev',

124

stat.S_IFBLK:'block',

125

stat.S_IFREG:'file',

126

stat.S_IFIFO:'fifo',

127

stat.S_IFLNK:'symlink',

128

stat.S_IFSOCK:'socket',

129

}

130

131

132

def file_kind_from_stat_mode(stat_mode, _formats=_formats, _unknown='unknown'):

133

"""Generate a file kind from a stat mode. This is used in walkdirs.

134

135

Its performance is critical: Do not mutate without careful benchmarking.

136

"""

137

try:

138

return _formats[stat_mode & 0170000]

139

except KeyError:

140

return _unknown

141

142

143

def file_kind(f, _lstat=os.lstat, _mapper=file_kind_from_stat_mode):

144

try:

145

return _mapper(_lstat(f).st_mode)

146

except OSError, e:

147

if getattr(e, 'errno', None) in (errno.ENOENT, errno.ENOTDIR):

148

raise errors.NoSuchFile(f)

149

raise

150

151

152

133

def get_umask():

153

134

"""Return the current umask"""

154

135

# Assume that people aren't messing with the umask while running

597

578

598

579

The file cursor should be already at the start.

599

580

"""

600

s = sha.new()

581

s = sha()

601

582

BUFSIZE = 128<<10

602

583

while True:

603

584

b = f.read(BUFSIZE)

609

590

610

591

def sha_file_by_name(fname):

611

592

"""Calculate the SHA1 of a file by reading the full text"""

612

s = sha.new()

593

s = sha()

613

594

f = os.open(fname, os.O_RDONLY | O_BINARY)

614

595

try:

615

596

while True:

621

602

os.close(f)

622

603

623

604

624

def sha_strings(strings):

605

def sha_strings(strings, _factory=sha):

625

606

"""Return the sha-1 of concatenation of strings"""

626

# Do some hackery here to install an optimised version of this function on

627

# the first invocation of this function. (We don't define it like this

628

# initially so that we can avoid loading the sha module, which takes up to

629

# 2ms, unless we need to.)

630

global sha_strings

631

def _sha_strings(strings, _factory=sha.new):

632

"""Return the sha-1 of concatenation of strings"""

633

s = _factory()

634

map(s.update, strings)

635

return s.hexdigest()

636

sha_strings = _sha_strings

637

# Now that we've installed the real version, call it.

638

return sha_strings(strings)

639

640

641

def sha_string(f):

642

global sha_string

643

def sha_string(f, _factory=sha.new):

644

return _factory(f).hexdigest()

645

return sha_string(f)

646

607

s = _factory()

608

map(s.update, strings)

609

return s.hexdigest()

610

611

612

def sha_string(f, _factory=sha):

613

return _factory(f).hexdigest()

647

614

648

615

649

616

def fingerprint_file(f):

650

617

b = f.read()

651

618

return {'size': len(b),

652

'sha1': sha.new(b).hexdigest()}

619

'sha1': sha(b).hexdigest()}

653

620

654

621

655

622

def compare_files(a, b):

1212

1179

_lstat = os.lstat

1213

1180

_directory = _directory_kind

1214

1181

_listdir = os.listdir

1215

_kind_from_mode = _formats.get

1182

_kind_from_mode = file_kind_from_stat_mode

1216

1183

pending = [(safe_unicode(prefix), "", _directory, None, safe_unicode(top))]

1217

1184

while pending:

1218

1185

# 0 - relpath, 1- basename, 2- kind, 3- stat, 4-toppath

1234

1201

for name in names:

1235

1202

abspath = top_slash + name

1236

1203

statvalue = _lstat(abspath)

1237

kind = _kind_from_mode(statvalue.st_mode & 0170000, 'unknown')

1204

kind = _kind_from_mode(statvalue.st_mode)

1238

1205

append((relprefix + name, name, kind, statvalue, abspath))

1239

1206

yield (relroot, top), dirblock

1240

1207

1242

1209

pending.extend(d for d in reversed(dirblock) if d[2] == _directory)

1243

1210

1244

1211

1245

_real_walkdirs_utf8 = None

1212

class DirReader(object):

1213

"""An interface for reading directories."""

1214

1215

def top_prefix_to_starting_dir(self, top, prefix=""):

1216

"""Converts top and prefix to a starting dir entry

1217

1218

:param top: A utf8 path

1219

:param prefix: An optional utf8 path to prefix output relative paths

1220

with.

1221

:return: A tuple starting with prefix, and ending with the native

1222

encoding of top.

1223

"""

1224

raise NotImplementedError(self.top_prefix_to_starting_dir)

1225

1226

def read_dir(self, prefix, top):

1227

"""Read a specific dir.

1228

1229

:param prefix: A utf8 prefix to be prepended to the path basenames.

1230

:param top: A natively encoded path to read.

1231

:return: A list of the directory's contents. Each item contains:

1232

(utf8_relpath, utf8_name, kind, lstatvalue, native_abspath)

1233

"""

1234

raise NotImplementedError(self.read_dir)

1235

1236

1237

_selected_dir_reader = None

1238

1246

1239

1247

1240

def _walkdirs_utf8(top, prefix=""):

1248

1241

"""Yield data about all the directories in a tree.

1258

1251

path-from-top might be unicode or utf8, but it is the correct path to

1259

1252

pass to os functions to affect the file in question. (such as os.lstat)

1260

1253

"""

1261

global _real_walkdirs_utf8

1262

if _real_walkdirs_utf8 is None:

1254

global _selected_dir_reader

1255

if _selected_dir_reader is None:

1263

1256

fs_encoding = _fs_enc.upper()

1264

1257

if sys.platform == "win32" and win32utils.winver == 'Windows NT':

1265

1258

# Win98 doesn't have unicode apis like FindFirstFileW

1268

1261

# but that gets a bit tricky, and requires custom compiling

1269

1262

# for win98 anyway.

1270

1263

try:

1271

from bzrlib._walkdirs_win32 import _walkdirs_utf8_win32_find_file

1264

from bzrlib._walkdirs_win32 import Win32ReadDir

1272

1265

except ImportError:

1273

_real_walkdirs_utf8 = _walkdirs_unicode_to_utf8

1266

_selected_dir_reader = UnicodeDirReader()

1274

1267

else:

1275

_real_walkdirs_utf8 = _walkdirs_utf8_win32_find_file

1268

_selected_dir_reader = Win32ReadDir()

1276

1269

elif fs_encoding not in ('UTF-8', 'US-ASCII', 'ANSI_X3.4-1968'):

1277

1270

# ANSI_X3.4-1968 is a form of ASCII

1278

_real_walkdirs_utf8 = _walkdirs_unicode_to_utf8

1271

_selected_dir_reader = UnicodeDirReader()

1279

1272

else:

1280

_real_walkdirs_utf8 = _walkdirs_fs_utf8

1281

return _real_walkdirs_utf8(top, prefix=prefix)

1282

1283

1284

def _walkdirs_fs_utf8(top, prefix=""):

1285

"""See _walkdirs_utf8.

1286

1287

This sub-function is called when we know the filesystem is already in utf8

1288

encoding. So we don't need to transcode filenames.

1289

"""

1290

_lstat = os.lstat

1291

_directory = _directory_kind

1292

# Use C accelerated directory listing.

1293

_listdir = _read_dir

1294

_kind_from_mode = _formats.get

1295

1273

try:

1274

from bzrlib._readdir_pyx import UTF8DirReader

1275

except ImportError:

1276

# No optimised code path

1277

_selected_dir_reader = UnicodeDirReader()

1278

else:

1279

_selected_dir_reader = UTF8DirReader()

1296

1280

# 0 - relpath, 1- basename, 2- kind, 3- stat, 4-toppath

1297

1281

# But we don't actually use 1-3 in pending, so set them to None

1298

pending = [(safe_utf8(prefix), None, None, None, safe_utf8(top))]

1282

pending = [[_selected_dir_reader.top_prefix_to_starting_dir(top, prefix)]]

1283

read_dir = _selected_dir_reader.read_dir

1284

_directory = _directory_kind

1299

1285

while pending:

1300

relroot, _, _, _, top = pending.pop()

1301

if relroot:

1302

relprefix = relroot + '/'

1303

else:

1304

relprefix = ''

1305

top_slash = top + '/'

1306

1307

dirblock = []

1308

append = dirblock.append

1309

# read_dir supplies in should-stat order.

1310

for _, name in sorted(_listdir(top)):

1311

abspath = top_slash + name

1312

statvalue = _lstat(abspath)

1313

kind = _kind_from_mode(statvalue.st_mode & 0170000, 'unknown')

1314

append((relprefix + name, name, kind, statvalue, abspath))

1315

dirblock.sort()

1286

relroot, _, _, _, top = pending[-1].pop()

1287

if not pending[-1]:

1288

pending.pop()

1289

dirblock = sorted(read_dir(relroot, top))

1316

1290

yield (relroot, top), dirblock

1317

1318

1291

# push the user specified dirs from dirblock

1319

pending.extend(d for d in reversed(dirblock) if d[2] == _directory)

1320

1321

1322

def _walkdirs_unicode_to_utf8(top, prefix=""):

1323

"""See _walkdirs_utf8

1324

1325

Because Win32 has a Unicode api, all of the 'path-from-top' entries will be

1326

Unicode paths.

1327

This is currently the fallback code path when the filesystem encoding is

1328

not UTF-8. It may be better to implement an alternative so that we can

1329

safely handle paths that are not properly decodable in the current

1330

encoding.

1331

"""

1332

_utf8_encode = codecs.getencoder('utf8')

1333

_lstat = os.lstat

1334

_directory = _directory_kind

1335

_listdir = os.listdir

1336

_kind_from_mode = _formats.get

1337

1338

pending = [(safe_utf8(prefix), None, None, None, safe_unicode(top))]

1339

while pending:

1340

relroot, _, _, _, top = pending.pop()

1341

if relroot:

1342

relprefix = relroot + '/'

1292

next = [d for d in reversed(dirblock) if d[2] == _directory]

1293

if next:

1294

pending.append(next)

1295

1296

1297

class UnicodeDirReader(DirReader):

1298

"""A dir reader for non-utf8 file systems, which transcodes."""

1299

1300

__slots__ = ['_utf8_encode']

1301

1302

def __init__(self):

1303

self._utf8_encode = codecs.getencoder('utf8')

1304

1305

def top_prefix_to_starting_dir(self, top, prefix=""):

1306

"""See DirReader.top_prefix_to_starting_dir."""

1307

return (safe_utf8(prefix), None, None, None, safe_unicode(top))

1308

1309

def read_dir(self, prefix, top):

1310

"""Read a single directory from a non-utf8 file system.

1311

1312

top, and the abspath element in the output are unicode, all other paths

1313

are utf8. Local disk IO is done via unicode calls to listdir etc.

1314

1315

This is currently the fallback code path when the filesystem encoding is

1316

not UTF-8. It may be better to implement an alternative so that we can

1317

safely handle paths that are not properly decodable in the current

1318

encoding.

1319

1320

See DirReader.read_dir for details.

1321

"""

1322

_utf8_encode = self._utf8_encode

1323

_lstat = os.lstat

1324

_listdir = os.listdir

1325

_kind_from_mode = file_kind_from_stat_mode

1326

1327

if prefix:

1328

relprefix = prefix + '/'

1343

1329

else:

1344

1330

relprefix = ''

1345

1331

top_slash = top + u'/'

1347

1333

dirblock = []

1348

1334

append = dirblock.append

1349

1335

for name in sorted(_listdir(top)):

1350

name_utf8 = _utf8_encode(name)[0]

1336

try:

1337

name_utf8 = _utf8_encode(name)[0]

1338

except UnicodeDecodeError:

1339

raise errors.BadFilenameEncoding(

1340

_utf8_encode(relprefix)[0] + name, _fs_enc)

1351

1341

abspath = top_slash + name

1352

1342

statvalue = _lstat(abspath)

1353

kind = _kind_from_mode(statvalue.st_mode & 0170000, 'unknown')

1343

kind = _kind_from_mode(statvalue.st_mode)

1354

1344

append((relprefix + name_utf8, name_utf8, kind, statvalue, abspath))

1355

yield (relroot, top), dirblock

1356

1357

# push the user specified dirs from dirblock

1358

pending.extend(d for d in reversed(dirblock) if d[2] == _directory)

1345

return dirblock

1359

1346

1360

1347

1361

1348

def copy_tree(from_path, to_path, handlers={}):

1436

1423

return _cached_user_encoding

1437

1424

1438

1425

if sys.platform == 'darwin':

1439

# work around egregious python 2.4 bug

1426

# python locale.getpreferredencoding() always returns

1427

# 'mac-roman' on darwin. That's a lie.

1440

1428

sys.platform = 'posix'

1441

1429

try:

1430

if os.environ.get('LANG', None) is None:

1431

# If LANG is not set, we end up with 'ascii', which is bad

1432

# ('mac-roman' is more than ascii), so we set a default which

1433

# will give us UTF-8 (which appears to work in all cases on

1434

# OSX). Users are still free to override LANG of course, as

1435

# long as it gives us something meaningful. This work-around

1436

# *may* not be needed with python 3k and/or OSX 10.5, but will

1437

# work with them too -- vila 20080908

1438

os.environ['LANG'] = 'en_US.UTF-8'

1442

1439

import locale

1443

1440

finally:

1444

1441

sys.platform = 'darwin'

1573

1570

return open(filename, 'rU').read()

1574

1571

1575

1572

1576

try:

1577

from bzrlib._readdir_pyx import read_dir as _read_dir

1578

except ImportError:

1579

from bzrlib._readdir_py import read_dir as _read_dir

1573

def file_kind_from_stat_mode_thunk(mode):

1574

global file_kind_from_stat_mode

1575

if file_kind_from_stat_mode is file_kind_from_stat_mode_thunk:

1576

try:

1577

from bzrlib._readdir_pyx import UTF8DirReader

1578

file_kind_from_stat_mode = UTF8DirReader().kind_from_mode

1579

except ImportError:

1580

from bzrlib._readdir_py import (

1581

_kind_from_mode as file_kind_from_stat_mode

1582

)

1583

return file_kind_from_stat_mode(mode)

1584

file_kind_from_stat_mode = file_kind_from_stat_mode_thunk

1585

1586

1587

def file_kind(f, _lstat=os.lstat):

1588

try:

1589

return file_kind_from_stat_mode(_lstat(f).st_mode)

1590

except OSError, e:

1591

if getattr(e, 'errno', None) in (errno.ENOENT, errno.ENOTDIR):

1592

raise errors.NoSuchFile(f)

1593

raise

1594

1595

Older »