1
# Copyright (C) 2008 Canonical Ltd
3
# This program is free software; you can redistribute it and/or modify
4
# it under the terms of the GNU General Public License as published by
5
# the Free Software Foundation; either version 2 of the License, or
6
# (at your option) any later version.
8
# This program is distributed in the hope that it will be useful,
9
# but WITHOUT ANY WARRANTY; without even the implied warranty of
10
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
11
# GNU General Public License for more details.
13
# You should have received a copy of the GNU General Public License
14
# along with this program; if not, write to the Free Software
15
# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
17
"""Serializer object for CHK based inventory storage."""
19
from cStringIO import (
28
revision as _mod_revision,
33
_decode_utf8 = cache_utf8.decode
36
def _validate_properties(props):
38
# TODO: we really want an 'isascii' check for key
39
unicode_props = dict((key, _decode_utf8(value))
40
for key, value in props.iteritems())
44
def _is_format_10(value):
46
raise ValueError('Format number was not recognized, expected 10 got %d'
51
class BEncodeRevisionSerializer1(object):
52
"""Simple revision serializer based around bencode.
55
# Maps {key:(Revision attribute, bencode_type, validator)}
56
# This tells us what kind we expect bdecode to create, what variable on
57
# Revision we should be using, and a function to call to validate/transform
59
# TODO: add a 'validate_utf8' for things like revision_id and file_id
60
# and a validator for parent-ids
61
_schema = {'format': (None, int, _is_format_10),
62
'committer': ('committer', str, _decode_utf8),
63
'timezone': ('timezone', int, None),
64
'timestamp': ('timestamp', str, float),
65
'revision-id': ('revision_id', str, None),
66
'parent-ids': ('parent_ids', list, tuple),
67
'inventory-sha1': ('inventory_sha1', str, None),
68
'message': ('message', str, _decode_utf8),
69
'properties': ('properties', dict, _validate_properties),
72
def write_revision_to_string(self, rev):
73
encode_utf8 = cache_utf8.encode
74
# Use a list of tuples rather than a dict
75
# This lets us control the ordering, so that we are able to create
79
("committer", encode_utf8(rev.committer)),
81
if rev.timezone is not None:
82
ret.append(("timezone", rev.timezone))
83
# For bzr revisions, the most common property is just 'branch-nick'
84
# which changes infrequently.
86
for key, value in rev.properties.iteritems():
87
revprops[key] = encode_utf8(value)
88
ret.append(('properties', revprops))
90
("timestamp", "%.3f" % rev.timestamp),
91
("revision-id", rev.revision_id),
92
("parent-ids", rev.parent_ids),
93
("inventory-sha1", rev.inventory_sha1),
94
("message", encode_utf8(rev.message)),
96
return bencode.bencode(ret)
98
def write_revision(self, rev, f):
99
f.write(self.write_revision_to_string(rev))
101
def read_revision_from_string(self, text):
102
# TODO: consider writing a Revision decoder, rather than using the
103
# generic bencode decoder
104
decode_utf8 = cache_utf8.decode
105
ret = bencode.bdecode(text)
106
if not isinstance(ret, list):
107
raise ValueError("invalid revision text")
108
schema = dict(self._schema)
110
for key, value in ret:
111
# The entry must be present in allowed keys, but only present a
113
var_name, expected_type, validator = schema.pop(key)
114
if value.__class__ is not expected_type:
115
raise ValueError('key %s did not conform to the expected type'
117
% (key, expected_type, type(value)))
118
if validator is not None:
119
value = validator(value)
120
if var_name is not None:
121
bits[var_name] = value
122
if schema.keys() not in ([], ['timezone']):
123
raise ValueError('Revision text was missing expected keys %s,'
124
' text %r' % (schema.keys(), text))
125
rev = _mod_revision.Revision(**bits)
126
if "timezone" not in bits:
130
def read_revision(self, f):
131
return self.read_revision_from_string(f.read())
134
class CHKSerializerSubtree(BEncodeRevisionSerializer1, xml6.Serializer_v6):
135
"""A CHKInventory based serializer that supports tree references"""
137
supported_kinds = set(['file', 'directory', 'symlink', 'tree-reference'])
139
revision_format_num = None
140
support_altered_by_hack = False
142
def _unpack_entry(self, elt):
144
if not kind in self.supported_kinds:
145
raise AssertionError('unsupported entry kind %s' % kind)
146
if kind == 'tree-reference':
147
file_id = elt.attrib['file_id']
148
name = elt.attrib['name']
149
parent_id = elt.attrib['parent_id']
150
revision = elt.get('revision')
151
reference_revision = elt.get('reference_revision')
152
return inventory.TreeReference(file_id, name, parent_id, revision,
155
return xml6.Serializer_v6._unpack_entry(self, elt)
157
def __init__(self, node_size, search_key_name):
158
self.maximum_size = node_size
159
self.search_key_name = search_key_name
162
class CHKSerializer(xml5.Serializer_v5):
163
"""A CHKInventory based serializer with 'plain' behaviour."""
166
revision_format_num = None
167
support_altered_by_hack = False
169
def __init__(self, node_size, search_key_name):
170
self.maximum_size = node_size
171
self.search_key_name = search_key_name
174
chk_serializer_255_bigpage = CHKSerializer(65536, 'hash-255-way')
177
class CHKBEncodeSerializer(BEncodeRevisionSerializer1, CHKSerializer):
178
"""A CHKInventory and BEncode based serializer with 'plain' behaviour."""
183
chk_bencode_serializer = CHKBEncodeSerializer(65536, 'hash-255-way')