diff options
| author | Vincent Driessen <me@nvie.com> | 2016-06-14 22:44:11 +0200 | 
|---|---|---|
| committer | Vincent Driessen <me@nvie.com> | 2016-06-14 23:09:22 +0200 | 
| commit | 3ee291c469fc7ea6065ed22f344ed3f2792aa2ca (patch) | |
| tree | 2b0b2e213c34fb61a0eb91f358685bb40101b1b0 /git/test/test_diff.py | |
| parent | 105a8c0fb3fe61b77956c8ebd3216738c78a3dff (diff) | |
| download | gitpython-3ee291c469fc7ea6065ed22f344ed3f2792aa2ca.tar.gz | |
Store raw path bytes in Diff instanceskeep-raw-bytes-on-diffs
Previously, the following fields on Diff instances were assumed to be
passed in as unicode strings:
  - `a_path`
  - `b_path`
  - `rename_from`
  - `rename_to`
However, since Git natively records paths as bytes, these may
potentially not have a valid unicode representation.
This patch changes the Diff instance to instead take the following
equivalent fields that should be raw bytes instead:
  - `a_rawpath`
  - `b_rawpath`
  - `raw_rename_from`
  - `raw_rename_to`
NOTE ON BACKWARD COMPATIBILITY:
The original `a_path`, `b_path`, etc. fields are still available as
properties (rather than slots).  These properties now dynamically decode
the raw bytes into a unicode string (performing the potentially
destructive operation of replacing invalid unicode chars by "�"'s).
This means that all code using Diffs should remain backward compatible.
The only exception is when people would manually construct Diff
instances by calling the constructor directly, in which case they should
now pass in bytes rather than unicode strings.
See also the discussion on
https://github.com/gitpython-developers/GitPython/pull/467
Diffstat (limited to 'git/test/test_diff.py')
| -rw-r--r-- | git/test/test_diff.py | 6 | 
1 files changed, 5 insertions, 1 deletions
| diff --git a/git/test/test_diff.py b/git/test/test_diff.py index 8d189b12..ba0d2d13 100644 --- a/git/test/test_diff.py +++ b/git/test/test_diff.py @@ -90,6 +90,8 @@ class TestDiff(TestBase):          assert_true(diff.renamed)          assert_equal(diff.rename_from, u'Jérôme')          assert_equal(diff.rename_to, u'müller') +        assert_equal(diff.raw_rename_from, b'J\xc3\xa9r\xc3\xb4me') +        assert_equal(diff.raw_rename_to, b'm\xc3\xbcller')          assert isinstance(str(diff), str)          output = StringProcessAdapter(fixture('diff_rename_raw')) @@ -129,7 +131,7 @@ class TestDiff(TestBase):          output = StringProcessAdapter(fixture('diff_index_raw'))          res = Diff._index_from_raw_format(None, output.stdout)          assert res[0].deleted_file -        assert res[0].b_path == '' +        assert res[0].b_path is None      def test_diff_initial_commit(self):          initial_commit = self.rorepo.commit('33ebe7acec14b25c5f84f35a664803fcab2f7781') @@ -162,7 +164,9 @@ class TestDiff(TestBase):          self.assertEqual(res[7].b_path, u'path/with-question-mark?')          self.assertEqual(res[8].b_path, u'path/¯\\_(ツ)_|¯')          self.assertEqual(res[9].b_path, u'path/💩.txt') +        self.assertEqual(res[9].b_rawpath, b'path/\xf0\x9f\x92\xa9.txt')          self.assertEqual(res[10].b_path, u'path/�-invalid-unicode-path.txt') +        self.assertEqual(res[10].b_rawpath, b'path/\x80-invalid-unicode-path.txt')          # The "Moves"          # NOTE: The path prefixes a/ and b/ here are legit!  We're actually | 
