commit.create_from_tree now uses pure python implementation, fixed message parsing which truncated newlines although it was ilegitimate. Its up to the reader to truncate therse, nowhere in the git code I could find anyone adding newlines to commits where it is written

Added performance tests for serialization, it does about 5k commits per second if writing to tmpfs
author: Sebastian Thiel <byronimo@gmail.com> 2010-06-03 23:20:34 +0200
committer: Sebastian Thiel <byronimo@gmail.com> 2010-06-03 23:20:34 +0200
commit: 1e2b46138ba58033738a24dadccc265748fce2ca (patch)
tree: 0f2a625a371c16cc95e53e024e007d8b89d87c92 /lib/git/odb/utils.py
parent: 4b4a514e51fbc7dc6ddcb27c188159d57b5d1fa9 (diff)
download: gitpython-1e2b46138ba58033738a24dadccc265748fce2ca.tar.gz
1 files changed, 18 insertions, 14 deletions
diff --git a/lib/git/odb/utils.py b/lib/git/odb/utils.py
index 94d1cea8..fd340962 100644
--- a/lib/git/odb/utils.py
+++ b/lib/git/odb/utils.py
@@ -137,7 +137,7 @@ class DecompressMemMapReader(object):
 		# END handle size
 		
 		# read header
-		maxb = 8192
+		maxb = 512				# should really be enough, cgit uses 8192 I believe
 		self._s = maxb
 		hdr = self.read(maxb)
 		hdrend = hdr.find("\0")
@@ -172,20 +172,24 @@ class DecompressMemMapReader(object):
 		# Our performance now depends on StringIO. This way we don't need two large
 		# buffers in peak times, but only one large one in the end which is 
 		# the return buffer
-		if size > self.max_read_size:
-			sio = StringIO()
-			while size:
-				read_size = min(self.max_read_size, size)
-				data = self.read(read_size)
-				sio.write(data)
-				size -= len(data)
-				if len(data) < read_size:
-					break
-			# END data loop
-			sio.seek(0)
-			return sio.getvalue()
-		# END handle maxread
+		# NO: We don't do it - if the user thinks its best, he is right. If he 
+		# has trouble, he will start reading in chunks. According to our tests
+		# its still faster if we read 10 Mb at once instead of chunking it.
 		
+		# if size > self.max_read_size:
+			# sio = StringIO()
+			# while size:
+				# read_size = min(self.max_read_size, size)
+				# data = self.read(read_size)
+				# sio.write(data)
+				# size -= len(data)
+				# if len(data) < read_size:
+					# break
+			# # END data loop
+			# sio.seek(0)
+			# return sio.getvalue()
+		# # END handle maxread
+		# 
 		# deplete the buffer, then just continue using the decompress object 
 		# which has an own buffer. We just need this to transparently parse the 
 		# header from the zlib stream
author	Sebastian Thiel <byronimo@gmail.com>	2010-06-03 23:20:34 +0200
committer	Sebastian Thiel <byronimo@gmail.com>	2010-06-03 23:20:34 +0200
commit	1e2b46138ba58033738a24dadccc265748fce2ca (patch)
tree	0f2a625a371c16cc95e53e024e007d8b89d87c92 /lib/git/odb/utils.py
parent	4b4a514e51fbc7dc6ddcb27c188159d57b5d1fa9 (diff)
download	gitpython-1e2b46138ba58033738a24dadccc265748fce2ca.tar.gz