commit.create_from_tree now uses a pure Python implementation; fixed message parsing, which truncated newlines although that was illegitimate. It's up to the reader to truncate these; nowhere in the git code could I find anyone adding newlines to commits where it is written

Added performance tests for serialization, it does about 5k commits per second if writing to tmpfs
author: Sebastian Thiel <byronimo@gmail.com> 2010-06-03 23:20:34 +0200
committer: Sebastian Thiel <byronimo@gmail.com> 2010-06-03 23:20:34 +0200
commit: 1e2b46138ba58033738a24dadccc265748fce2ca (patch)
tree: 0f2a625a371c16cc95e53e024e007d8b89d87c92 /test/git/performance/test_commit.py
parent: 4b4a514e51fbc7dc6ddcb27c188159d57b5d1fa9 (diff)
download: gitpython-1e2b46138ba58033738a24dadccc265748fce2ca.tar.gz
1 files changed, 33 insertions, 3 deletions
diff --git a/test/git/performance/test_commit.py b/test/git/performance/test_commit.py
index b4a9d868..2398c93d 100644
--- a/test/git/performance/test_commit.py
+++ b/test/git/performance/test_commit.py
@@ -6,10 +6,12 @@
 
 from lib import *
 from git import *
+from test.git.test_commit import assert_commit_serialization
+from cStringIO import StringIO
 from time import time
 import sys
 
-class TestPerformance(TestBigRepoReadOnly):
+class TestPerformance(TestBigRepoRW):
 
 	# ref with about 100 commits in its history
 	ref_100 = '0.1.6'
@@ -48,7 +50,7 @@ class TestPerformance(TestBigRepoReadOnly):
 		# bound to cat-file parsing performance
 		nc = 0
 		st = time()
-		for c in self.gitrepo.commit(self.head_sha_2k).traverse(branch_first=False):
+		for c in self.gitrorepo.commit(self.head_sha_2k).traverse(branch_first=False):
 			nc += 1
 			self._query_commit_info(c)
 		# END for each traversed commit
@@ -59,10 +61,38 @@ class TestPerformance(TestBigRepoReadOnly):
 		# bound to stream parsing performance
 		nc = 0
 		st = time()
-		for c in Commit.iter_items(self.gitrepo, self.head_sha_2k):
+		for c in Commit.iter_items(self.gitrorepo, self.head_sha_2k):
 			nc += 1
 			self._query_commit_info(c)
 		# END for each traversed commit
 		elapsed_time = time() - st
 		print >> sys.stderr, "Iterated %i Commits in %s [s] ( %f commits/s )" % (nc, elapsed_time, nc/elapsed_time)
 		
+	def test_commit_serialization(self):
+		assert_commit_serialization(self.gitrwrepo, self.head_sha_2k, True)
+		
+		rwrepo = self.gitrwrepo
+		make_object = rwrepo.odb.to_object
+		# direct serialization - deserialization can be tested afterwards
+		# serialization is probably limited on IO
+		hc = rwrepo.commit(self.head_sha_2k)
+		
+		commits = list()
+		nc = 5000
+		st = time()
+		for i in xrange(nc):
+			cm = Commit(	rwrepo, Commit.NULL_HEX_SHA, hc.tree, 
+							hc.author, hc.authored_date, hc.author_tz_offset, 
+							hc.committer, hc.committed_date, hc.committer_tz_offset, 
+							str(i), parents=hc.parents, encoding=hc.encoding)
+			
+			stream = StringIO()
+			cm._serialize(stream)
+			slen = stream.tell()
+			stream.seek(0)
+			
+			cm.sha = make_object(Commit.type, slen, stream)
+		# END commit creation
+		elapsed = time() - st
+		
+		print >> sys.stderr, "Serialized %i commits to loose objects in %f s ( %f commits / s )" % (nc, elapsed, nc / elapsed)
author	Sebastian Thiel <byronimo@gmail.com>	2010-06-03 23:20:34 +0200
committer	Sebastian Thiel <byronimo@gmail.com>	2010-06-03 23:20:34 +0200
commit	1e2b46138ba58033738a24dadccc265748fce2ca (patch)
tree	0f2a625a371c16cc95e53e024e007d8b89d87c92 /test/git/performance/test_commit.py
parent	4b4a514e51fbc7dc6ddcb27c188159d57b5d1fa9 (diff)
download	gitpython-1e2b46138ba58033738a24dadccc265748fce2ca.tar.gz