diff options
author | Sebastian Thiel <byronimo@gmail.com> | 2010-10-15 12:34:43 +0200 |
---|---|---|
committer | Sebastian Thiel <byronimo@gmail.com> | 2010-10-15 12:40:39 +0200 |
commit | 0019d7dc8c72839d238065473a62b137c3c350f5 (patch) | |
tree | 75c5fcd85fe9e655e035bd3cbec10e49071562f1 /test/git/test_commit.py | |
parent | 0f88fb96869b6ac3ed4dac7d23310a9327d3c89c (diff) | |
download | gitpython-0019d7dc8c72839d238065473a62b137c3c350f5.tar.gz |
Added unicode handling for author names. They will now be properly encoded into the byte stream, as well as decoded from it.
Diffstat (limited to 'test/git/test_commit.py')
-rw-r--r-- | test/git/test_commit.py | 29 |
1 files changed, 29 insertions, 0 deletions
```diff
diff --git a/test/git/test_commit.py b/test/git/test_commit.py
index a9ea7f98..2692938f 100644
--- a/test/git/test_commit.py
+++ b/test/git/test_commit.py
@@ -242,3 +242,32 @@ class TestCommit(TestBase):
         # create all commits of our repo
         assert_commit_serialization(rwrepo, '0.1.6')
 
+    def test_serialization_unicode_support(self):
+        assert Commit.default_encoding.lower() == 'utf-8'
+
+        # create a commit with unicode in the message, and the author's name
+        # Verify its serialization and deserialization
+        cmt = self.rorepo.commit('0.1.6')
+        assert isinstance(cmt.message, unicode)  # it automatically decodes it as such
+        assert isinstance(cmt.author.name, unicode)  # same here
+
+        cmt.message = "üäêèß".decode("utf-8")
+        assert len(cmt.message) == 5
+
+        cmt.author.name = "äüß".decode("utf-8")
+        assert len(cmt.author.name) == 3
+
+        cstream = StringIO()
+        cmt._serialize(cstream)
+        cstream.seek(0)
+        assert len(cstream.getvalue())
+
+        ncmt = Commit(self.rorepo, cmt.binsha)
+        ncmt._deserialize(cstream)
+
+        assert cmt.author.name == ncmt.author.name
+        assert cmt.message == ncmt.message
+        # actually, it can't be printed in a shell as repr wants to have ascii only
+        # it appears
+        cmt.author.__repr__()
+
```