215
218
class TestSerializer(TestCase):
216
219
"""Test XML serialization"""
221
def test_canned_inventory(self):
222
"""Test unpacked a canned inventory v4 file."""
223
inp = StringIO(_working_inventory_v4)
224
inv = serializer_v4.read_inventory(inp)
225
self.assertEqual(len(inv), 4)
226
self.assert_('bar-20050901064931-73b4b1138abc9cd2' in inv)
228
def test_unpack_revision(self):
229
"""Test unpacking a canned revision v4"""
230
inp = StringIO(_revision_v4)
231
rev = serializer_v4.read_revision(inp)
232
eq = self.assertEqual
234
"Martin Pool <mbp@sourcefrog.net>")
236
"mbp@sourcefrog.net-20050905080035-e0439293f8b6b9f9")
237
eq(len(rev.parent_ids), 1)
238
eq(rev.parent_ids[0],
239
"mbp@sourcefrog.net-20050905063503-43948f59fa127d92")
218
241
def test_unpack_revision_5(self):
219
242
"""Test unpacking a canned revision v5"""
220
inp = BytesIO(_revision_v5)
221
rev = breezy.bzr.xml5.serializer_v5.read_revision(inp)
243
inp = StringIO(_revision_v5)
244
rev = bzrlib.xml5.serializer_v5.read_revision(inp)
222
245
eq = self.assertEqual
223
246
eq(rev.committer,
224
247
"Martin Pool <mbp@sourcefrog.net>")
225
248
eq(len(rev.parent_ids), 1)
226
249
eq(rev.timezone, 36000)
227
250
eq(rev.parent_ids[0],
228
b"mbp@sourcefrog.net-20050905063503-43948f59fa127d92")
251
"mbp@sourcefrog.net-20050905063503-43948f59fa127d92")
230
253
def test_unpack_revision_5_utc(self):
231
inp = BytesIO(_revision_v5_utc)
232
rev = breezy.bzr.xml5.serializer_v5.read_revision(inp)
254
inp = StringIO(_revision_v5_utc)
255
rev = bzrlib.xml5.serializer_v5.read_revision(inp)
233
256
eq = self.assertEqual
234
257
eq(rev.committer,
235
258
"Martin Pool <mbp@sourcefrog.net>")
236
259
eq(len(rev.parent_ids), 1)
237
260
eq(rev.timezone, 0)
238
261
eq(rev.parent_ids[0],
239
b"mbp@sourcefrog.net-20050905063503-43948f59fa127d92")
262
"mbp@sourcefrog.net-20050905063503-43948f59fa127d92")
241
264
def test_unpack_inventory_5(self):
242
265
"""Unpack canned new-style inventory"""
243
inp = BytesIO(_committed_inv_v5)
244
inv = breezy.bzr.xml5.serializer_v5.read_inventory(inp)
266
inp = StringIO(_committed_inv_v5)
267
inv = bzrlib.xml5.serializer_v5.read_inventory(inp)
245
268
eq = self.assertEqual
247
ie = inv.get_entry(b'bar-20050824000535-6bc48cfad47ed134')
270
ie = inv['bar-20050824000535-6bc48cfad47ed134']
248
271
eq(ie.kind, 'file')
249
eq(ie.revision, b'mbp@foo-00')
272
eq(ie.revision, 'mbp@foo-00')
250
273
eq(ie.name, 'bar')
251
eq(inv.get_entry(ie.parent_id).kind, 'directory')
274
eq(inv[ie.parent_id].kind, 'directory')
253
276
def test_unpack_basis_inventory_5(self):
254
277
"""Unpack canned new-style inventory"""
255
inv = breezy.bzr.xml5.serializer_v5.read_inventory_from_lines(
256
breezy.osutils.split_lines(_basis_inv_v5))
278
inp = StringIO(_basis_inv_v5)
279
inv = bzrlib.xml5.serializer_v5.read_inventory(inp)
257
280
eq = self.assertEqual
260
b'mbp@sourcefrog.net-20050905063503-43948f59fa127d92')
261
ie = inv.get_entry(b'bar-20050824000535-6bc48cfad47ed134')
282
eq(inv.revision_id, 'mbp@sourcefrog.net-20050905063503-43948f59fa127d92')
283
ie = inv['bar-20050824000535-6bc48cfad47ed134']
262
284
eq(ie.kind, 'file')
263
eq(ie.revision, b'mbp@foo-00')
285
eq(ie.revision, 'mbp@foo-00')
264
286
eq(ie.name, 'bar')
265
eq(inv.get_entry(ie.parent_id).kind, 'directory')
287
eq(inv[ie.parent_id].kind, 'directory')
267
289
def test_unpack_inventory_5a(self):
268
inv = breezy.bzr.xml5.serializer_v5.read_inventory_from_lines(
269
breezy.osutils.split_lines(_inventory_v5a), revision_id=b'test-rev-id')
270
self.assertEqual(b'test-rev-id', inv.root.revision)
290
inv = bzrlib.xml5.serializer_v5.read_inventory_from_string(
291
_inventory_v5a, revision_id='test-rev-id')
292
self.assertEqual('test-rev-id', inv.root.revision)
272
294
def test_unpack_inventory_5a_cache_and_copy(self):
273
295
# Passing an entry_cache should get populated with the objects
274
296
# But the returned objects should be copies if return_from_cache is
276
298
entry_cache = fifo_cache.FIFOCache()
277
inv = breezy.bzr.xml5.serializer_v5.read_inventory_from_lines(
278
breezy.osutils.split_lines(_inventory_v5a), revision_id=b'test-rev-id',
299
inv = bzrlib.xml5.serializer_v5.read_inventory_from_string(
300
_inventory_v5a, revision_id='test-rev-id',
279
301
entry_cache=entry_cache, return_from_cache=False)
280
302
for entry in inv.iter_just_entries():
281
303
key = (entry.file_id, entry.revision)
351
372
def test_pack_revision_5(self):
352
373
"""Pack revision to XML v5"""
353
374
# fixed 20051025, revisions should have final newline
354
rev = breezy.bzr.xml5.serializer_v5.read_revision_from_string(
356
outfile_contents = breezy.bzr.xml5.serializer_v5.write_revision_to_string(rev)
357
self.assertEqual(outfile_contents[-1:], b'\n')
358
self.assertEqualDiff(
360
b''.join(breezy.bzr.xml5.serializer_v5.write_revision_to_lines(rev)))
375
rev = bzrlib.xml5.serializer_v5.read_revision_from_string(_revision_v5)
377
bzrlib.xml5.serializer_v5.write_revision(rev, outp)
378
outfile_contents = outp.getvalue()
379
self.assertEqual(outfile_contents[-1], '\n')
380
self.assertEqualDiff(outfile_contents, bzrlib.xml5.serializer_v5.write_revision_to_string(rev))
361
381
self.assertEqualDiff(outfile_contents, _expected_rev_v5)
363
383
def test_empty_property_value(self):
364
384
"""Create an empty property value check that it serializes correctly"""
365
s_v5 = breezy.bzr.xml5.serializer_v5
385
s_v5 = bzrlib.xml5.serializer_v5
366
386
rev = s_v5.read_revision_from_string(_revision_v5)
367
props = {'empty': '', 'one': 'one'}
388
props = {'empty':'', 'one':'one'}
368
389
rev.properties = props
369
txt = b''.join(s_v5.write_revision_to_lines(rev))
390
txt = s_v5.write_revision_to_string(rev)
370
391
new_rev = s_v5.read_revision_from_string(txt)
371
392
self.assertEqual(props, new_rev.properties)
373
394
def get_sample_inventory(self):
374
inv = Inventory(b'tree-root-321', revision_id=b'rev_outer')
375
inv.add(inventory.InventoryFile(b'file-id', 'file', b'tree-root-321'))
376
inv.add(inventory.InventoryDirectory(b'dir-id', 'dir',
378
inv.add(inventory.InventoryLink(b'link-id', 'link', b'tree-root-321'))
379
inv.get_entry(b'tree-root-321').revision = b'rev_outer'
380
inv.get_entry(b'dir-id').revision = b'rev_outer'
381
inv.get_entry(b'file-id').revision = b'rev_outer'
382
inv.get_entry(b'file-id').text_sha1 = b'A'
383
inv.get_entry(b'file-id').text_size = 1
384
inv.get_entry(b'link-id').revision = b'rev_outer'
385
inv.get_entry(b'link-id').symlink_target = 'a'
395
inv = Inventory('tree-root-321', revision_id='rev_outer')
396
inv.add(inventory.InventoryFile('file-id', 'file', 'tree-root-321'))
397
inv.add(inventory.InventoryDirectory('dir-id', 'dir',
399
inv.add(inventory.InventoryLink('link-id', 'link', 'tree-root-321'))
400
inv['tree-root-321'].revision = 'rev_outer'
401
inv['dir-id'].revision = 'rev_outer'
402
inv['file-id'].revision = 'rev_outer'
403
inv['file-id'].text_sha1 = 'A'
404
inv['file-id'].text_size = 1
405
inv['link-id'].revision = 'rev_outer'
406
inv['link-id'].symlink_target = 'a'
388
409
def test_roundtrip_inventory_v7(self):
389
410
inv = self.get_sample_inventory()
390
inv.add(inventory.TreeReference(b'nested-id', 'nested', b'tree-root-321',
391
b'rev_outer', b'rev_inner'))
411
inv.add(inventory.TreeReference('nested-id', 'nested', 'tree-root-321',
412
'rev_outer', 'rev_inner'))
413
txt = xml7.serializer_v7.write_inventory_to_string(inv)
392
414
lines = xml7.serializer_v7.write_inventory_to_lines(inv)
393
self.assertEqualDiff(_expected_inv_v7, b''.join(lines))
394
inv2 = xml7.serializer_v7.read_inventory_from_lines(lines)
415
self.assertEqual(bzrlib.osutils.split_lines(txt), lines)
416
self.assertEqualDiff(_expected_inv_v7, txt)
417
inv2 = xml7.serializer_v7.read_inventory_from_string(txt)
395
418
self.assertEqual(5, len(inv2))
396
419
for path, ie in inv.iter_entries():
397
self.assertEqual(ie, inv2.get_entry(ie.file_id))
420
self.assertEqual(ie, inv2[ie.file_id])
399
422
def test_roundtrip_inventory_v6(self):
400
423
inv = self.get_sample_inventory()
424
txt = xml6.serializer_v6.write_inventory_to_string(inv)
401
425
lines = xml6.serializer_v6.write_inventory_to_lines(inv)
402
self.assertEqualDiff(_expected_inv_v6, b''.join(lines))
403
inv2 = xml6.serializer_v6.read_inventory_from_lines(lines)
426
self.assertEqual(bzrlib.osutils.split_lines(txt), lines)
427
self.assertEqualDiff(_expected_inv_v6, txt)
428
inv2 = xml6.serializer_v6.read_inventory_from_string(txt)
404
429
self.assertEqual(4, len(inv2))
405
430
for path, ie in inv.iter_entries():
406
self.assertEqual(ie, inv2.get_entry(ie.file_id))
431
self.assertEqual(ie, inv2[ie.file_id])
408
433
def test_wrong_format_v7(self):
409
434
"""Can't accidentally open a file with wrong serializer"""
410
s_v6 = breezy.bzr.xml6.serializer_v6
435
s_v6 = bzrlib.xml6.serializer_v6
411
436
s_v7 = xml7.serializer_v7
412
437
self.assertRaises(errors.UnexpectedInventoryFormat,
413
s_v7.read_inventory_from_lines,
414
breezy.osutils.split_lines(_expected_inv_v5))
438
s_v7.read_inventory_from_string, _expected_inv_v5)
415
439
self.assertRaises(errors.UnexpectedInventoryFormat,
416
s_v6.read_inventory_from_lines,
417
breezy.osutils.split_lines(_expected_inv_v7))
440
s_v6.read_inventory_from_string, _expected_inv_v7)
419
442
def test_tree_reference(self):
420
s_v5 = breezy.bzr.xml5.serializer_v5
421
s_v6 = breezy.bzr.xml6.serializer_v6
443
s_v5 = bzrlib.xml5.serializer_v5
444
s_v6 = bzrlib.xml6.serializer_v6
422
445
s_v7 = xml7.serializer_v7
423
inv = Inventory(b'tree-root-321', revision_id=b'rev-outer')
424
inv.root.revision = b'root-rev'
425
inv.add(inventory.TreeReference(b'nested-id', 'nested', b'tree-root-321',
426
b'rev-outer', b'rev-inner'))
427
self.assertRaises(errors.UnsupportedInventoryKind,
428
s_v5.write_inventory_to_lines, inv)
429
self.assertRaises(errors.UnsupportedInventoryKind,
430
s_v6.write_inventory_to_lines, inv)
431
lines = s_v7.write_inventory_to_chunks(inv)
432
inv2 = s_v7.read_inventory_from_lines(lines)
433
self.assertEqual(b'tree-root-321',
434
inv2.get_entry(b'nested-id').parent_id)
435
self.assertEqual(b'rev-outer', inv2.get_entry(b'nested-id').revision)
437
b'rev-inner', inv2.get_entry(b'nested-id').reference_revision)
446
inv = Inventory('tree-root-321', revision_id='rev-outer')
447
inv.root.revision = 'root-rev'
448
inv.add(inventory.TreeReference('nested-id', 'nested', 'tree-root-321',
449
'rev-outer', 'rev-inner'))
450
self.assertRaises(errors.UnsupportedInventoryKind,
451
s_v5.write_inventory_to_string, inv)
452
self.assertRaises(errors.UnsupportedInventoryKind,
453
s_v6.write_inventory_to_string, inv)
454
txt = s_v7.write_inventory_to_string(inv)
455
lines = s_v7.write_inventory_to_lines(inv)
456
self.assertEqual(bzrlib.osutils.split_lines(txt), lines)
457
inv2 = s_v7.read_inventory_from_string(txt)
458
self.assertEqual('tree-root-321', inv2['nested-id'].parent_id)
459
self.assertEqual('rev-outer', inv2['nested-id'].revision)
460
self.assertEqual('rev-inner', inv2['nested-id'].reference_revision)
461
self.assertRaises(errors.UnsupportedInventoryKind,
462
s_v6.read_inventory_from_string,
463
txt.replace('format="7"', 'format="6"'))
464
self.assertRaises(errors.UnsupportedInventoryKind,
465
s_v5.read_inventory_from_string,
466
txt.replace('format="7"', 'format="5"'))
439
468
def test_roundtrip_inventory_v8(self):
440
469
inv = self.get_sample_inventory()
441
lines = xml8.serializer_v8.write_inventory_to_lines(inv)
442
inv2 = xml8.serializer_v8.read_inventory_from_lines(lines)
470
txt = xml8.serializer_v8.write_inventory_to_string(inv)
471
inv2 = xml8.serializer_v8.read_inventory_from_string(txt)
443
472
self.assertEqual(4, len(inv2))
444
473
for path, ie in inv.iter_entries():
445
self.assertEqual(ie, inv2.get_entry(ie.file_id))
474
self.assertEqual(ie, inv2[ie.file_id])
447
476
def test_inventory_text_v8(self):
448
477
inv = self.get_sample_inventory()
478
txt = xml8.serializer_v8.write_inventory_to_string(inv)
449
479
lines = xml8.serializer_v8.write_inventory_to_lines(inv)
450
self.assertEqualDiff(_expected_inv_v8, b''.join(lines))
480
self.assertEqual(bzrlib.osutils.split_lines(txt), lines)
481
self.assertEqualDiff(_expected_inv_v8, txt)
452
483
def test_revision_text_v6(self):
453
484
"""Pack revision to XML v6"""
454
rev = breezy.bzr.xml6.serializer_v6.read_revision_from_string(
485
rev = bzrlib.xml6.serializer_v6.read_revision_from_string(
455
486
_expected_rev_v5)
456
serialized = breezy.bzr.xml6.serializer_v6.write_revision_to_lines(
458
self.assertEqualDiff(b''.join(serialized), _expected_rev_v5)
487
serialized = bzrlib.xml6.serializer_v6.write_revision_to_string(rev)
488
self.assertEqualDiff(serialized, _expected_rev_v5)
460
490
def test_revision_text_v7(self):
461
491
"""Pack revision to XML v7"""
462
rev = breezy.bzr.xml7.serializer_v7.read_revision_from_string(
492
rev = bzrlib.xml7.serializer_v7.read_revision_from_string(
463
493
_expected_rev_v5)
464
serialized = breezy.bzr.xml7.serializer_v7.write_revision_to_lines(
466
self.assertEqualDiff(b''.join(serialized), _expected_rev_v5)
494
serialized = bzrlib.xml7.serializer_v7.write_revision_to_string(rev)
495
self.assertEqualDiff(serialized, _expected_rev_v5)
468
497
def test_revision_text_v8(self):
469
498
"""Pack revision to XML v8"""
470
rev = breezy.bzr.xml8.serializer_v8.read_revision_from_string(
499
rev = bzrlib.xml8.serializer_v8.read_revision_from_string(
471
500
_expected_rev_v8)
472
serialized = breezy.bzr.xml8.serializer_v8.write_revision_to_lines(
474
self.assertEqualDiff(b''.join(serialized), _expected_rev_v8)
476
def test_revision_text_v8_complex(self):
477
"""Pack revision to XML v8"""
478
rev = breezy.bzr.xml8.serializer_v8.read_revision_from_string(
479
_expected_rev_v8_complex)
480
serialized = breezy.bzr.xml8.serializer_v8.write_revision_to_lines(
482
self.assertEqualDiff(b''.join(serialized), _expected_rev_v8_complex)
501
serialized = bzrlib.xml8.serializer_v8.write_revision_to_string(rev)
502
self.assertEqualDiff(serialized, _expected_rev_v8)
484
504
def test_revision_ids_are_utf8(self):
485
505
"""Parsed revision_ids should all be utf-8 strings, not unicode."""
486
s_v5 = breezy.bzr.xml5.serializer_v5
506
s_v5 = bzrlib.xml5.serializer_v5
487
507
rev = s_v5.read_revision_from_string(_revision_utf8_v5)
488
self.assertEqual(b'erik@b\xc3\xa5gfors-02', rev.revision_id)
489
self.assertIsInstance(rev.revision_id, bytes)
490
self.assertEqual([b'erik@b\xc3\xa5gfors-01'], rev.parent_ids)
508
self.assertEqual('erik@b\xc3\xa5gfors-02', rev.revision_id)
509
self.assertIsInstance(rev.revision_id, str)
510
self.assertEqual(['erik@b\xc3\xa5gfors-01'], rev.parent_ids)
491
511
for parent_id in rev.parent_ids:
492
self.assertIsInstance(parent_id, bytes)
512
self.assertIsInstance(parent_id, str)
493
513
self.assertEqual(u'Include \xb5nicode characters\n', rev.message)
494
self.assertIsInstance(rev.message, text_type)
514
self.assertIsInstance(rev.message, unicode)
496
516
# ie.revision should either be None or a utf-8 revision id
497
inv = s_v5.read_inventory_from_lines(breezy.osutils.split_lines(_inventory_utf8_v5))
517
inv = s_v5.read_inventory_from_string(_inventory_utf8_v5)
498
518
rev_id_1 = u'erik@b\xe5gfors-01'.encode('utf8')
499
519
rev_id_2 = u'erik@b\xe5gfors-02'.encode('utf8')
500
520
fid_root = u'TRE\xe9_ROOT'.encode('utf8')
505
525
(u'b\xe5r', fid_bar1, fid_root, rev_id_1),
506
526
(u's\xb5bdir', fid_sub, fid_root, rev_id_1),
507
527
(u's\xb5bdir/b\xe5r', fid_bar2, fid_sub, rev_id_2),
509
529
self.assertEqual(rev_id_2, inv.revision_id)
510
self.assertIsInstance(inv.revision_id, bytes)
530
self.assertIsInstance(inv.revision_id, str)
512
532
actual = list(inv.iter_entries_by_dir())
513
533
for ((exp_path, exp_file_id, exp_parent_id, exp_rev_id),
514
534
(act_path, act_ie)) in zip(expected, actual):
515
535
self.assertEqual(exp_path, act_path)
516
self.assertIsInstance(act_path, text_type)
536
self.assertIsInstance(act_path, unicode)
517
537
self.assertEqual(exp_file_id, act_ie.file_id)
518
self.assertIsInstance(act_ie.file_id, bytes)
538
self.assertIsInstance(act_ie.file_id, str)
519
539
self.assertEqual(exp_parent_id, act_ie.parent_id)
520
540
if exp_parent_id is not None:
521
self.assertIsInstance(act_ie.parent_id, bytes)
541
self.assertIsInstance(act_ie.parent_id, str)
522
542
self.assertEqual(exp_rev_id, act_ie.revision)
523
543
if exp_rev_id is not None:
524
self.assertIsInstance(act_ie.revision, bytes)
544
self.assertIsInstance(act_ie.revision, str)
526
546
self.assertEqual(len(expected), len(actual))
528
def test_serialization_error(self):
529
s_v5 = breezy.bzr.xml5.serializer_v5
530
e = self.assertRaises(
531
errors.UnexpectedInventoryFormat,
532
s_v5.read_inventory_from_lines, [b"<Notquitexml"])
533
self.assertEqual(str(e), "unclosed token: line 1, column 0")
536
549
class TestEncodeAndEscape(TestCase):
537
550
"""Whitebox testing of the _encode_and_escape function."""
540
super(TestEncodeAndEscape, self).setUp()
541
554
# Keep the cache clear before and after the test
542
breezy.bzr.xml_serializer._clear_cache()
543
self.addCleanup(breezy.bzr.xml_serializer._clear_cache)
555
bzrlib.xml8._ensure_utf8_re()
556
bzrlib.xml8._clear_cache()
557
self.addCleanup(bzrlib.xml8._clear_cache)
545
559
def test_simple_ascii(self):
546
560
# _encode_and_escape always appends a final ", because these parameters
547
561
# are being used in xml attributes, and by returning it now, we have to
548
562
# do fewer string operations later.
549
val = breezy.bzr.xml_serializer.encode_and_escape('foo bar')
550
self.assertEqual(b'foo bar', val)
563
val = bzrlib.xml8._encode_and_escape('foo bar')
564
self.assertEqual('foo bar"', val)
551
565
# The second time should be cached
552
val2 = breezy.bzr.xml_serializer.encode_and_escape('foo bar')
566
val2 = bzrlib.xml8._encode_and_escape('foo bar')
553
567
self.assertIs(val2, val)
555
569
def test_ascii_with_xml(self):
556
self.assertEqual(b'&'"<>',
557
breezy.bzr.xml_serializer.encode_and_escape('&\'"<>'))
570
self.assertEqual('&'"<>"',
571
bzrlib.xml8._encode_and_escape('&\'"<>'))
559
573
def test_utf8_with_xml(self):
560
574
# u'\xb5\xe5&\u062c'
561
utf8_str = b'\xc2\xb5\xc3\xa5&\xd8\xac'
562
self.assertEqual(b'µå&ج',
563
breezy.bzr.xml_serializer.encode_and_escape(utf8_str))
575
utf8_str = '\xc2\xb5\xc3\xa5&\xd8\xac'
576
self.assertEqual('µå&ج"',
577
bzrlib.xml8._encode_and_escape(utf8_str))
565
579
def test_unicode(self):
566
580
uni_str = u'\xb5\xe5&\u062c'
567
self.assertEqual(b'µå&ج',
568
breezy.bzr.xml_serializer.encode_and_escape(uni_str))
571
class TestMisc(TestCase):
573
def test_unescape_xml(self):
574
"""We get some kind of error when malformed entities are passed"""
575
self.assertRaises(KeyError, breezy.bzr.xml8._unescape_xml, b'foo&bar;')
581
self.assertEqual('µå&ج"',
582
bzrlib.xml8._encode_and_escape(uni_str))