"""Tests for git base objects."""
+# TODO: Round-trip parse-serialize-parse and serialize-parse-serialize tests.
+
+import datetime
import os
import stat
import unittest
+from dulwich.errors import (
+ ChecksumMismatch,
+ ObjectFormatException,
+ )
from dulwich.objects import (
Blob,
Tree,
Tag,
format_timezone,
hex_to_sha,
+ sha_to_hex,
+ hex_to_filename,
+ check_hexsha,
+ check_identity,
parse_timezone,
+ parse_tree,
+ _parse_tree_py,
+ )
+from dulwich.tests import (
+ TestSkipped,
)
a_sha = '6f670c0fb53f9463760b7295fbb814e965fb20c8'
tree_sha = '70c190eb48fa8bbb50ddc692a17b44cb781af7f6'
tag_sha = '71033db03a03c6a36721efcf1968dd8f8e0cf023'
+
+try:
+ from itertools import permutations
+except ImportError:
+ # Implementation of permutations from Python 2.6 documentation:
+ # http://docs.python.org/2.6/library/itertools.html#itertools.permutations
+ # Copyright (c) 2001-2010 Python Software Foundation; All Rights Reserved
+ def permutations(iterable, r=None):
+ # Fallback used only when itertools has no permutations. Yields tuples
+ # of length r built from the items of iterable.
+ # permutations('ABCD', 2) --> AB AC AD BA BC BD CA CB CD DA DB DC
+ # permutations(range(3)) --> 012 021 102 120 201 210
+ pool = tuple(iterable)
+ n = len(pool)
+ # r defaults to the size of the pool, i.e. full-length permutations.
+ r = n if r is None else r
+ if r > n:
+ return
+ # Both sequences are modified in place below, so range() has to hand
+ # back a list here.
+ indices = range(n)
+ cycles = range(n, n-r, -1)
+ yield tuple(pool[i] for i in indices[:r])
+ while n:
+ for i in reversed(range(r)):
+ cycles[i] -= 1
+ if cycles[i] == 0:
+ # Move indices[i] to the end of the list and reset its counter.
+ indices[i:] = indices[i+1:] + indices[i:i+1]
+ cycles[i] = n - i
+ else:
+ j = cycles[i]
+ indices[i], indices[-j] = indices[-j], indices[i]
+ yield tuple(pool[i] for i in indices[:r])
+ break
+ else:
+ return
+
+
+class TestHexToSha(unittest.TestCase):
+ # Conversions between a 40-character hex sha and its 20-character
+ # binary string form.
+
+ def test_simple(self):
+ # hex_to_sha turns each pair of hex digits into the matching byte.
+ self.assertEquals("\xab\xcd" * 10, hex_to_sha("abcd" * 10))
+
+ def test_reverse(self):
+ # sha_to_hex performs the opposite conversion.
+ self.assertEquals("abcd" * 10, sha_to_hex("\xab\xcd" * 10))
+
+
class BlobReadTests(unittest.TestCase):
"""Test decompression of blobs"""
-
- def get_sha_file(self, obj, base, sha):
- return obj.from_file(os.path.join(os.path.dirname(__file__),
- 'data', base, sha))
-
+
+ def get_sha_file(self, cls, base, sha):
+ # Load the object named sha from the 'data/<base>' directory next to
+ # this module, via cls.from_path on the path hex_to_filename returns.
+ dir = os.path.join(os.path.dirname(__file__), 'data', base)
+ return cls.from_path(hex_to_filename(dir, sha))
+
def get_blob(self, sha):
"""Return the blob named sha from the test data dir"""
return self.get_sha_file(Blob, 'blobs', sha)
b = Blob.from_string(string)
self.assertEqual(b.data, string)
self.assertEqual(b.sha().hexdigest(), b_sha)
+
+ def test_chunks(self):
+ # A blob built from one string exposes that string as its only chunk.
+ string = 'test 5\n'
+ b = Blob.from_string(string)
+ self.assertEqual([string], b.chunked)
+
+ def test_set_chunks(self):
+ # Assigning to chunked must be visible through both data and
+ # as_raw_string(), each returning the chunks joined together.
+ b = Blob()
+ b.chunked = ['te', 'st', ' 5\n']
+ self.assertEqual('test 5\n', b.data)
+ b.chunked = ['te', 'st', ' 6\n']
+ self.assertEqual('test 6\n', b.as_raw_string())
def test_parse_legacy_blob(self):
string = 'test 3\n'
self.assertEqual(c.commit_timezone, 0)
self.assertEqual(c.author_timezone, 0)
self.assertEqual(c.message, 'Merge ../b\n')
-
+
+ def test_check_id(self):
+ # The fixture is looked up under a name made of forty '1' characters;
+ # the final assertion shows this is not the sha the object ends up with.
+ wrong_sha = '1' * 40
+ b = self.get_blob(wrong_sha)
+ # Before check() runs, the id is the name the object was loaded under.
+ self.assertEqual(wrong_sha, b.id)
+ self.assertRaises(ChecksumMismatch, b.check)
+ # After the failed check the id reports a different sha (presumably
+ # the one computed from the content -- confirm against Blob.check).
+ self.assertEqual('742b386350576589175e374a5706505cbd17680c', b.id)
+
+
+class ShaFileCheckTests(unittest.TestCase):
+ # Base class offering assertion helpers around cls().check() for test
+ # cases that feed raw object data to an object class.
+
+ def assertCheckFails(self, cls, data):
+ # Passes when loading data into a fresh cls() and checking it raises
+ # ObjectFormatException.
+ obj = cls()
+ def do_check():
+ # set_raw_string is called inside the wrapper too, so an
+ # ObjectFormatException raised while loading also counts.
+ obj.set_raw_string(data)
+ obj.check()
+ self.assertRaises(ObjectFormatException, do_check)
+
+ def assertCheckSucceeds(self, cls, data):
+ # Passes when check() on a fresh cls() loaded with data returns None;
+ # any exception propagates and fails the test.
+ obj = cls()
+ obj.set_raw_string(data)
+ self.assertEqual(None, obj.check())
class CommitSerializationTests(unittest.TestCase):
c1.set_raw_string(c.as_raw_string())
self.assertEquals(30, c1.commit_time)
+ def test_raw_length(self):
+ # raw_length() must agree with the length of the serialized commit.
+ c = self.make_base()
+ self.assertEquals(len(c.as_raw_string()), c.raw_length())
+
def test_simple(self):
c = self.make_base()
self.assertEquals(c.id, '5dac377bdded4c9aeb8dff595f0faeebcc8498cc')
self.assertTrue(" -0100\n" in c.as_raw_string())
-class CommitDeserializationTests(unittest.TestCase):
+default_committer = 'James Westby <jw+debian@jameswestby.net> 1174773719 +0000'
+
+class CommitParseTests(ShaFileCheckTests):
+
+ def make_commit_lines(self,
+ tree='d80c186a03f423a81b39df39dc87fd269736ca86',
+ parents=['ab64bbdcc51b170d21588e5c5d391ee5c0c96dfd',
+ '4cffe90e0a41ad3f5190079d7c8f036bde29cbe6'],
+ author=default_committer,
+ committer=default_committer,
+ encoding=None,
+ message='Merge ../b\n',
+ extra=None):
+ # Build the list of lines making up a raw commit. Passing None for an
+ # argument leaves the corresponding line(s) out. Headers are emitted in
+ # the order tree, parent(s), author, committer, encoding, then the
+ # extra fields, followed by an empty line and the message.
+ # NOTE: the default parents list is shared between calls; it is only
+ # iterated here, never modified.
+ lines = []
+ if tree is not None:
+ lines.append('tree %s' % tree)
+ if parents is not None:
+ lines.extend('parent %s' % p for p in parents)
+ if author is not None:
+ lines.append('author %s' % author)
+ if committer is not None:
+ lines.append('committer %s' % committer)
+ if encoding is not None:
+ lines.append('encoding %s' % encoding)
+ if extra is not None:
+ # Sorted so the output does not depend on dict iteration order.
+ for name, value in sorted(extra.iteritems()):
+ lines.append('%s %s' % (name, value))
+ # Empty line separating the headers from the message.
+ lines.append('')
+ if message is not None:
+ lines.append(message)
+ return lines
+
+ def make_commit_text(self, **kwargs):
+ # Same arguments as make_commit_lines; returns the lines joined with
+ # newlines as a single string.
+ return '\n'.join(self.make_commit_lines(**kwargs))
def test_simple(self):
- c = Commit.from_string(
- 'tree d80c186a03f423a81b39df39dc87fd269736ca86\n'
- 'parent ab64bbdcc51b170d21588e5c5d391ee5c0c96dfd\n'
- 'parent 4cffe90e0a41ad3f5190079d7c8f036bde29cbe6\n'
- 'author James Westby <jw+debian@jameswestby.net> 1174773719 +0000\n'
- 'committer James Westby <jw+debian@jameswestby.net> 1174773719 +0000\n'
- '\n'
- 'Merge ../b\n')
+ c = Commit.from_string(self.make_commit_text())
self.assertEquals('Merge ../b\n', c.message)
+ self.assertEquals('James Westby <jw+debian@jameswestby.net>', c.author)
self.assertEquals('James Westby <jw+debian@jameswestby.net>',
- c.author)
- self.assertEquals('James Westby <jw+debian@jameswestby.net>',
- c.committer)
- self.assertEquals('d80c186a03f423a81b39df39dc87fd269736ca86',
- c.tree)
+ c.committer)
+ self.assertEquals('d80c186a03f423a81b39df39dc87fd269736ca86', c.tree)
self.assertEquals(['ab64bbdcc51b170d21588e5c5d391ee5c0c96dfd',
- '4cffe90e0a41ad3f5190079d7c8f036bde29cbe6'],
- c.parents)
+ '4cffe90e0a41ad3f5190079d7c8f036bde29cbe6'],
+ c.parents)
+ expected_time = datetime.datetime(2007, 3, 24, 22, 1, 59)
+ self.assertEquals(expected_time,
+ datetime.datetime.utcfromtimestamp(c.commit_time))
+ self.assertEquals(0, c.commit_timezone)
+ self.assertEquals(expected_time,
+ datetime.datetime.utcfromtimestamp(c.author_time))
+ self.assertEquals(0, c.author_timezone)
+ self.assertEquals(None, c.encoding)
def test_custom(self):
- c = Commit.from_string(
- 'tree d80c186a03f423a81b39df39dc87fd269736ca86\n'
- 'parent ab64bbdcc51b170d21588e5c5d391ee5c0c96dfd\n'
- 'parent 4cffe90e0a41ad3f5190079d7c8f036bde29cbe6\n'
- 'author James Westby <jw+debian@jameswestby.net> 1174773719 +0000\n'
- 'committer James Westby <jw+debian@jameswestby.net> 1174773719 +0000\n'
- 'extra-field data\n'
- '\n'
- 'Merge ../b\n')
+ c = Commit.from_string(self.make_commit_text(
+ extra={'extra-field': 'data'}))
self.assertEquals([('extra-field', 'data')], c.extra)
-
-class TreeSerializationTests(unittest.TestCase):
+ def test_encoding(self):
+ # An 'encoding' header must be exposed through Commit.encoding.
+ c = Commit.from_string(self.make_commit_text(encoding='UTF-8'))
+ self.assertEquals('UTF-8', c.encoding)
+
+ def test_check(self):
+ # Commit.check() accepts the default commit text, a commit without
+ # parents and a commit with an encoding header ...
+ self.assertCheckSucceeds(Commit, self.make_commit_text())
+ self.assertCheckSucceeds(Commit, self.make_commit_text(parents=None))
+ self.assertCheckSucceeds(Commit,
+ self.make_commit_text(encoding='UTF-8'))
+
+ # ... and rejects a malformed tree or parent sha, an identity without
+ # an email address, and a missing author and/or committer.
+ self.assertCheckFails(Commit, self.make_commit_text(tree='xxx'))
+ self.assertCheckFails(Commit, self.make_commit_text(
+ parents=[a_sha, 'xxx']))
+ bad_committer = "some guy without an email address 1174773719 +0000"
+ self.assertCheckFails(Commit,
+ self.make_commit_text(committer=bad_committer))
+ self.assertCheckFails(Commit,
+ self.make_commit_text(author=bad_committer))
+ self.assertCheckFails(Commit, self.make_commit_text(author=None))
+ self.assertCheckFails(Commit, self.make_commit_text(committer=None))
+ self.assertCheckFails(Commit, self.make_commit_text(
+ author=None, committer=None))
+
+ def test_check_duplicates(self):
+ # duplicate each of the header fields
+ # With a single parent and an encoding there are exactly five header
+ # lines (tree, parent, author, committer, encoding), hence xrange(5).
+ for i in xrange(5):
+ lines = self.make_commit_lines(parents=[a_sha], encoding='UTF-8')
+ # Insert a copy of header i right next to the original.
+ lines.insert(i, lines[i])
+ text = '\n'.join(lines)
+ if lines[i].startswith('parent'):
+ # duplicate parents are ok for now
+ self.assertCheckSucceeds(Commit, text)
+ else:
+ self.assertCheckFails(Commit, text)
+
+ def test_check_order(self):
+ # Header lines must appear in the order make_commit_lines emits them.
+ lines = self.make_commit_lines(parents=[a_sha], encoding='UTF-8')
+ # First five lines are the headers; the rest is the empty separator
+ # line and the message.
+ headers = lines[:5]
+ rest = lines[5:]
+ # of all possible permutations, ensure only the original succeeds
+ for perm in permutations(headers):
+ # permutations yields tuples; convert so it compares equal to the
+ # headers list and can be concatenated with rest.
+ perm = list(perm)
+ text = '\n'.join(perm + rest)
+ if perm == headers:
+ self.assertCheckSucceeds(Commit, text)
+ else:
+ self.assertCheckFails(Commit, text)
+
+
+class TreeTests(ShaFileCheckTests):
def test_simple(self):
myhexsha = "d80c186a03f423a81b39df39dc87fd269736ca86"
x["a/c"] = (stat.S_IFDIR, "d80c186a03f423a81b39df39dc87fd269736ca86")
self.assertEquals(["a.c", "a", "a/c"], [p[0] for p in x.iteritems()])
+ def _do_test_parse_tree(self, parse_tree):
+ # Shared body for the parse_tree tests. The parse_tree parameter is the
+ # implementation under test and shadows the module-level import of the
+ # same name inside this method.
+ dir = os.path.join(os.path.dirname(__file__), 'data', 'trees')
+ o = Tree.from_path(hex_to_filename(dir, tree_sha))
+ o._parse_file()
+ # Entries are expected as (name, mode, hex sha) tuples.
+ self.assertEquals([('a', 0100644, a_sha), ('b', 0100644, b_sha)],
+ list(parse_tree(o.as_raw_string())))
+
+ def test_parse_tree(self):
+ # Exercise the _parse_tree_py implementation directly.
+ self._do_test_parse_tree(_parse_tree_py)
+
+ def test_parse_tree_extension(self):
+ # When the imported parse_tree is the very same object as
+ # _parse_tree_py there is nothing extra to test, so skip.
+ if parse_tree is _parse_tree_py:
+ raise TestSkipped('parse_tree extension not found')
+ self._do_test_parse_tree(parse_tree)
+
+ def test_check(self):
+ # Run Tree.check() against hand-written raw tree data, grouped by what
+ # is being varied: entry name, mode, sha bytes and entry order.
+ t = Tree
+ # Raw entries carry the sha in binary form, so convert the hex sha.
+ sha = hex_to_sha(a_sha)
+
+ # filenames
+ self.assertCheckSucceeds(t, '100644 .a\0%s' % sha)
+ self.assertCheckFails(t, '100644 \0%s' % sha)
+ self.assertCheckFails(t, '100644 .\0%s' % sha)
+ self.assertCheckFails(t, '100644 a/a\0%s' % sha)
+ self.assertCheckFails(t, '100644 ..\0%s' % sha)
+
+ # modes
+ self.assertCheckSucceeds(t, '100644 a\0%s' % sha)
+ self.assertCheckSucceeds(t, '100755 a\0%s' % sha)
+ self.assertCheckSucceeds(t, '160000 a\0%s' % sha)
+ # TODO more whitelisted modes
+ self.assertCheckFails(t, '123456 a\0%s' % sha)
+ self.assertCheckFails(t, '123abc a\0%s' % sha)
+
+ # shas
+ self.assertCheckFails(t, '100644 a\0%s' % ('x' * 5))
+ self.assertCheckFails(t, '100644 a\0%s' % ('x' * 18 + '\0'))
+ self.assertCheckFails(t, '100644 a\0%s\n100644 b\0%s' % ('x' * 21, sha))
+
+ # ordering
+ sha2 = hex_to_sha(b_sha)
+ self.assertCheckSucceeds(t, '100644 a\0%s\n100644 b\0%s' % (sha, sha))
+ self.assertCheckSucceeds(t, '100644 a\0%s\n100644 b\0%s' % (sha, sha2))
+ # Same name twice, or names out of order, must be rejected.
+ self.assertCheckFails(t, '100644 a\0%s\n100755 a\0%s' % (sha, sha2))
+ self.assertCheckFails(t, '100644 b\0%s\n100644 a\0%s' % (sha2, sha))
+
+ def test_iter(self):
+ # Iterating a Tree yields its entry names.
+ t = Tree()
+ t["foo"] = (0100644, a_sha)
+ self.assertEquals(set(["foo"]), set(t))
+
class TagSerializeTests(unittest.TestCase):
x.tagger = "Jelmer Vernooij <jelmer@samba.org>"
x.name = "0.1"
x.message = "Tag 0.1"
- x.object = (3, "d80c186a03f423a81b39df39dc87fd269736ca86")
+ x.object = (Blob, "d80c186a03f423a81b39df39dc87fd269736ca86")
x.tag_time = 423423423
x.tag_timezone = 0
self.assertEquals("""object d80c186a03f423a81b39df39dc87fd269736ca86
Tag 0.1""", x.as_raw_string())
-class TagParseTests(unittest.TestCase):
-
- def test_parse_ctime(self):
- x = Tag()
- x.set_raw_string("""object a38d6181ff27824c79fc7df825164a212eff6a3f
-type commit
-tag v2.6.22-rc7
-tagger Linus Torvalds <torvalds@woody.linux-foundation.org> Sun Jul 1 12:54:34 2007 -0700
-
-Linux 2.6.22-rc7
+default_tagger = ('Linus Torvalds <torvalds@woody.linux-foundation.org> '
+ '1183319674 -0700')
+default_message = """Linux 2.6.22-rc7
-----BEGIN PGP SIGNATURE-----
Version: GnuPG v1.4.7 (GNU/Linux)
OK2XeQOiEeXtT76rV4t2WR4=
=ivrA
-----END PGP SIGNATURE-----
-""")
- self.assertEquals("Linus Torvalds <torvalds@woody.linux-foundation.org>", x.tagger)
+"""
+
+
+class TagParseTests(ShaFileCheckTests):
+ def make_tag_lines(self,
+ object_sha="a38d6181ff27824c79fc7df825164a212eff6a3f",
+ object_type_name="commit",
+ name="v2.6.22-rc7",
+ tagger=default_tagger,
+ message=default_message):
+ # Build the list of lines making up a raw tag. Passing None for an
+ # argument leaves the corresponding line out. Headers are emitted in
+ # the order object, type, tag, tagger, followed by an empty line and
+ # the message.
+ lines = []
+ if object_sha is not None:
+ lines.append("object %s" % object_sha)
+ if object_type_name is not None:
+ lines.append("type %s" % object_type_name)
+ if name is not None:
+ lines.append("tag %s" % name)
+ if tagger is not None:
+ lines.append("tagger %s" % tagger)
+ # Empty line separating the headers from the message.
+ lines.append("")
+ if message is not None:
+ lines.append(message)
+ return lines
+
+ def make_tag_text(self, **kwargs):
+ # Same arguments as make_tag_lines; returns the lines joined with
+ # newlines as a single string.
+ return "\n".join(self.make_tag_lines(**kwargs))
+
+ def test_parse(self):
+ # Parse the default tag text and verify every parsed field.
+ x = Tag()
+ x.set_raw_string(self.make_tag_text())
+ # The tagger attribute holds the identity only, without time/timezone.
+ self.assertEquals(
+ "Linus Torvalds <torvalds@woody.linux-foundation.org>", x.tagger)
self.assertEquals("v2.6.22-rc7", x.name)
+ # x.object is a (type, sha) pair; the type is the Commit class rather
+ # than the "commit" string from the header.
+ object_type, object_sha = x.object
+ self.assertEquals("a38d6181ff27824c79fc7df825164a212eff6a3f",
+ object_sha)
+ self.assertEquals(Commit, object_type)
+ self.assertEquals(datetime.datetime.utcfromtimestamp(x.tag_time),
+ datetime.datetime(2007, 7, 1, 19, 54, 34))
+ # "-0700" expressed in seconds: -7 * 3600.
+ self.assertEquals(-25200, x.tag_timezone)
def test_parse_no_tagger(self):
x = Tag()
- x.set_raw_string("""object a38d6181ff27824c79fc7df825164a212eff6a3f
-type commit
-tag v2.6.22-rc7
-
-Linux 2.6.22-rc7
------BEGIN PGP SIGNATURE-----
-Version: GnuPG v1.4.7 (GNU/Linux)
-
-iD8DBQBGiAaAF3YsRnbiHLsRAitMAKCiLboJkQECM/jpYsY3WPfvUgLXkACgg3ql
-OK2XeQOiEeXtT76rV4t2WR4=
-=ivrA
------END PGP SIGNATURE-----
-""")
+ x.set_raw_string(self.make_tag_text(tagger=None))
self.assertEquals(None, x.tagger)
self.assertEquals("v2.6.22-rc7", x.name)
+ def test_check(self):
+ # Tag.check() accepts the default tag text and rejects tags with a
+ # missing object, type or name, an empty name, an unknown type name,
+ # a tagger without an email address, a tagger whose time is not a
+ # plain timestamp, or a malformed object sha.
+ self.assertCheckSucceeds(Tag, self.make_tag_text())
+ self.assertCheckFails(Tag, self.make_tag_text(object_sha=None))
+ self.assertCheckFails(Tag, self.make_tag_text(object_type_name=None))
+ self.assertCheckFails(Tag, self.make_tag_text(name=None))
+ self.assertCheckFails(Tag, self.make_tag_text(name=''))
+ self.assertCheckFails(Tag, self.make_tag_text(
+ object_type_name="foobar"))
+ self.assertCheckFails(Tag, self.make_tag_text(
+ tagger="some guy without an email address 1183319674 -0700"))
+ self.assertCheckFails(Tag, self.make_tag_text(
+ tagger=("Linus Torvalds <torvalds@woody.linux-foundation.org> "
+ "Sun 7 Jul 2007 12:54:34 +0700")))
+ self.assertCheckFails(Tag, self.make_tag_text(object_sha="xxx"))
+
+ def test_check_duplicates(self):
+ # duplicate each of the header fields
+ # The default tag has four header lines (object, type, tag, tagger),
+ # hence xrange(4); every duplicated header must fail the check.
+ for i in xrange(4):
+ lines = self.make_tag_lines()
+ lines.insert(i, lines[i])
+ self.assertCheckFails(Tag, '\n'.join(lines))
+
+ def test_check_order(self):
+ # Header lines must appear in the order make_tag_lines emits them.
+ lines = self.make_tag_lines()
+ # First four lines are the headers; the rest is the empty separator
+ # line and the message.
+ headers = lines[:4]
+ rest = lines[4:]
+ # of all possible permutations, ensure only the original succeeds
+ for perm in permutations(headers):
+ # permutations yields tuples; convert so it compares equal to the
+ # headers list and can be concatenated with rest.
+ perm = list(perm)
+ text = '\n'.join(perm + rest)
+ if perm == headers:
+ self.assertCheckSucceeds(Tag, text)
+ else:
+ self.assertCheckFails(Tag, text)
+
+
+class CheckTests(unittest.TestCase):
+ # Tests for the module-level check_hexsha and check_identity helpers.
+ # In each call the second argument is a descriptive string (presumably
+ # used as the error message -- confirm against dulwich.objects).
+
+ def test_check_hexsha(self):
+ # A valid sha must not raise; the call itself is the assertion.
+ check_hexsha(a_sha, "failed to check good sha")
+ self.assertRaises(ObjectFormatException, check_hexsha, '1' * 39,
+ 'sha too short')
+ self.assertRaises(ObjectFormatException, check_hexsha, '1' * 41,
+ 'sha too long')
+ self.assertRaises(ObjectFormatException, check_hexsha, 'x' * 40,
+ 'invalid characters')
+
+ def test_check_identity(self):
+ # Valid identities must not raise; a bare "<email>" without a name is
+ # accepted as well.
+ check_identity("Dave Borowitz <dborowitz@google.com>",
+ "failed to check good identity")
+ check_identity("<dborowitz@google.com>",
+ "failed to check good identity")
+ self.assertRaises(ObjectFormatException, check_identity,
+ "Dave Borowitz", "no email")
+ self.assertRaises(ObjectFormatException, check_identity,
+ "Dave Borowitz <dborowitz", "incomplete email")
+ self.assertRaises(ObjectFormatException, check_identity,
+ "dborowitz@google.com>", "incomplete email")
+ self.assertRaises(ObjectFormatException, check_identity,
+ "Dave Borowitz <<dborowitz@google.com>", "typo")
+ self.assertRaises(ObjectFormatException, check_identity,
+ "Dave Borowitz <dborowitz@google.com>>", "typo")
+ self.assertRaises(ObjectFormatException, check_identity,
+ "Dave Borowitz <dborowitz@google.com>xxx",
+ "trailing characters")
+
class TimezoneTests(unittest.TestCase):
def test_parse_timezone_utc(self):
- self.assertEquals(0, parse_timezone("+0000"))
+ self.assertEquals((0, False), parse_timezone("+0000"))
+
+ def test_parse_timezone_utc_negative(self):
+ # "-0000" parses to a zero offset with the second tuple element set to
+ # True, which distinguishes it from "+0000".
+ self.assertEquals((0, True), parse_timezone("-0000"))
def test_generate_timezone_utc(self):
self.assertEquals("+0000", format_timezone(0))
+ def test_generate_timezone_utc_negative(self):
+ # Passing True as the second argument makes a zero offset format as
+ # "-0000" instead of "+0000".
+ self.assertEquals("-0000", format_timezone(0, True))
+
def test_parse_timezone_cet(self):
- self.assertEquals(60 * 60, parse_timezone("+0100"))
+ self.assertEquals((60 * 60, False), parse_timezone("+0100"))
def test_format_timezone_cet(self):
self.assertEquals("+0100", format_timezone(60 * 60))
self.assertEquals("-0400", format_timezone(-4 * 60 * 60))
def test_parse_timezone_pdt(self):
- self.assertEquals(-4 * 60 * 60, parse_timezone("-0400"))
+ self.assertEquals((-4 * 60 * 60, False), parse_timezone("-0400"))
def test_format_timezone_pdt_half(self):
- self.assertEquals("-0440", format_timezone(int(((-4 * 60) - 40) * 60)))
+ self.assertEquals("-0440",
+ format_timezone(int(((-4 * 60) - 40) * 60)))
def test_parse_timezone_pdt_half(self):
- self.assertEquals(((-4 * 60) - 40) * 60, parse_timezone("-0440"))
+ self.assertEquals((((-4 * 60) - 40) * 60, False),
+ parse_timezone("-0440"))