1
# Copyright (C) 2006, 2007, 2009, 2010, 2011 Canonical Ltd
1
# Copyright (C) 2006 Canonical Ltd
3
3
# This program is free software; you can redistribute it and/or modify
4
4
# it under the terms of the GNU General Public License as published by
17
17
"""Common code for generating file or revision ids."""
19
from __future__ import absolute_import
21
from .lazy_import import lazy_import
19
from bzrlib.lazy_import import lazy_import
22
20
lazy_import(globals(), """
35
from .sixish import text_type
37
35
# the regex removes any weird characters; we don't escape them
38
36
# but rather just pull them out
39
_file_id_chars_re = lazy_regex.lazy_compile(b'[^\\w.]')
40
_rev_id_chars_re = lazy_regex.lazy_compile(b'[^-\\w.+@]')
37
_file_id_chars_re = lazy_regex.lazy_compile(r'[^\w.]')
38
_rev_id_chars_re = lazy_regex.lazy_compile(r'[^-\w.+@]')
41
39
_gen_file_id_suffix = None
42
40
_gen_file_id_serial = 0
49
47
give a highly probably globally unique number. Then each call in the same
50
48
process adds 1 to a serial number we append to that unique value.
52
# XXX TODO: change breezy.add.smart_add_tree to call workingtree.add() rather
50
# XXX TODO: change bzrlib.add.smart_add_tree to call workingtree.add() rather
53
51
# than having to move the id randomness out of the inner loop like this.
54
52
# XXX TODO: for the global randomness this uses we should add the thread-id
55
53
# before the serial #.
61
59
global _gen_file_id_suffix, _gen_file_id_serial
62
60
if _gen_file_id_suffix is None:
63
_gen_file_id_suffix = ("-%s-%s-" % (
64
osutils.compact_date(time.time()), osutils.rand_chars(16))
61
_gen_file_id_suffix = "-%s-%s-" % (osutils.compact_date(time.time()),
62
osutils.rand_chars(16))
66
63
_gen_file_id_serial += 1
67
return b"%s%d" % (_gen_file_id_suffix, _gen_file_id_serial)
64
return _gen_file_id_suffix + str(_gen_file_id_serial)
70
67
def gen_file_id(name):
73
70
The uniqueness is supplied from _next_id_suffix.
75
if isinstance(name, text_type):
76
name = name.encode('ascii', 'replace')
77
72
# The real randomness is in the _next_id_suffix, the
78
73
# rest of the identifier is just to be nice.
86
81
# 4) Removing starting '.' characters to prevent the file ids from
87
82
# being considered hidden.
88
ascii_word_only = _file_id_chars_re.sub(b'', name.lower())
89
short_no_dots = ascii_word_only.lstrip(b'.')[:20]
83
ascii_word_only = str(_file_id_chars_re.sub('', name.lower()))
84
short_no_dots = ascii_word_only.lstrip('.')[:20]
90
85
return short_no_dots + _next_id_suffix()
98
93
def gen_revision_id(username, timestamp=None):
99
94
"""Return new revision-id.
101
:param username: The username of the committer, in the format returned by
102
config.username(). This is typically a real name, followed by an
103
email address. If found, we will use just the email address portion.
104
Otherwise we flatten the real name, and use that.
96
:param username: This is the value returned by config.username(), which is
97
typically a real name, followed by an email address. If found, we will
98
use just the email address portion. Otherwise we flatten the real name,
105
100
:return: A new revision id.
108
103
user_or_email = config.extract_email_address(username)
109
except config.NoEmailInUsername:
104
except errors.NoEmailInUsername:
110
105
user_or_email = username
112
107
user_or_email = user_or_email.lower()
113
108
user_or_email = user_or_email.replace(' ', '_')
114
user_or_email = _rev_id_chars_re.sub(b'', user_or_email.encode('utf-8'))
109
user_or_email = _rev_id_chars_re.sub('', user_or_email)
116
111
# This gives 36^16 ~= 2^82.7 ~= 83 bits of entropy
117
unique_chunk = osutils.rand_chars(16).encode('utf-8')
112
unique_chunk = osutils.rand_chars(16)
119
114
if timestamp is None:
120
115
timestamp = time.time()
122
rev_id = b'-'.join((user_or_email,
123
osutils.compact_date(timestamp).encode('utf-8'),
117
rev_id = u'-'.join((user_or_email,
118
osutils.compact_date(timestamp),
120
return rev_id.encode('utf8')