dulwich-users team mailing list archive
-
dulwich-users team
-
Mailing list archive
-
Message #00586
[PATCH 25/33] pack: Fix a buffering issue with PackStreamReader; add tests.
From: Dave Borowitz <dborowitz@xxxxxxxxxx>
Change-Id: I2695ce332114e213239efaa00bd46b423a670d5c
---
NEWS | 3 ++
dulwich/pack.py | 7 ++++++
dulwich/tests/test_pack.py | 48 ++++++++++++++++++++++++++++++++++++++++++++
3 files changed, 58 insertions(+), 0 deletions(-)
diff --git a/NEWS b/NEWS
index c229e15..02745fb 100644
--- a/NEWS
+++ b/NEWS
@@ -24,6 +24,9 @@
* Fix short-circuit behavior for no-op fetches in the server. (Dave Borowitz)
+ * Fix a bug in reading the pack checksum when there are fewer than 20 bytes
+ left in the buffer. (Dave Borowitz)
+
API CHANGES
* write_pack no longer takes the num_objects argument and requires an object
diff --git a/dulwich/pack.py b/dulwich/pack.py
index 3e0b9fb..da83f7e 100644
--- a/dulwich/pack.py
+++ b/dulwich/pack.py
@@ -747,6 +747,13 @@ class PackStreamReader(object):
buf.seek(0)
self._rbuf = buf
+ if self._buf_len() < 20:
+ # If the read buffer is full, then the last read() got the whole
+ # trailer off the wire. If not, it means there is still some of the
+ # trailer to read. We need to read() all 20 bytes; N come from the
+ # read buffer and (20 - N) come from the wire.
+ self.read(20)
+
pack_sha = ''.join(self._trailer)
if pack_sha != self.sha.digest():
raise ChecksumMismatch(sha_to_hex(pack_sha), self.sha.hexdigest())
diff --git a/dulwich/tests/test_pack.py b/dulwich/tests/test_pack.py
index 860822f..1be2e01 100644
--- a/dulwich/tests/test_pack.py
+++ b/dulwich/tests/test_pack.py
@@ -49,6 +49,7 @@ from dulwich.objects import (
from dulwich.pack import (
OFS_DELTA,
REF_DELTA,
+ DELTA_TYPES,
MemoryPackIndex,
Pack,
PackData,
@@ -66,6 +67,7 @@ from dulwich.pack import (
write_pack,
unpack_object,
compute_file_sha,
+ PackStreamReader,
DeltaChainIterator,
)
from dulwich.tests import (
@@ -655,6 +657,52 @@ class DeltifyTests(TestCase):
list(deltify_pack_objects([(b1, ""), (b2, "")])))
+class TestPackStreamReader(TestCase):
+
+ def test_read_objects_emtpy(self):
+ f = StringIO()
+ build_pack(f, [])
+ reader = PackStreamReader(f.read)
+ self.assertEqual(0, len(list(reader.read_objects())))
+
+ def test_read_objects(self):
+ f = StringIO()
+ entries = build_pack(f, [
+ (Blob.type_num, 'blob'),
+ (OFS_DELTA, (0, 'blob1')),
+ ])
+ reader = PackStreamReader(f.read)
+ objects = list(reader.read_objects(compute_crc32=True))
+ self.assertEqual(2, len(objects))
+
+ blob, delta = objects
+ bofs, btype, buncomp, blen, bcrc = blob
+ dofs, dtype, duncomp, dlen, dcrc = delta
+
+ self.assertEqual(entries[0][0], bofs)
+ self.assertEqual(Blob.type_num, btype)
+ self.assertEqual('blob', ''.join(buncomp))
+ self.assertEqual(dofs - bofs, blen)
+ self.assertEqual(entries[0][4], bcrc)
+
+ self.assertEqual(entries[1][0], dofs)
+ self.assertEqual(OFS_DELTA, dtype)
+ delta_ofs, delta_chunks = duncomp
+ self.assertEqual(dofs - bofs, delta_ofs)
+ self.assertEqual(create_delta('blob', 'blob1'), ''.join(delta_chunks))
+ self.assertEqual(len(f.getvalue()) - 20 - dofs, dlen)
+ self.assertEqual(entries[1][4], dcrc)
+
+ def test_read_objects_buffered(self):
+ f = StringIO()
+ build_pack(f, [
+ (Blob.type_num, 'blob'),
+ (OFS_DELTA, (0, 'blob1')),
+ ])
+ reader = PackStreamReader(f.read, zlib_bufsize=4)
+ self.assertEqual(2, len(list(reader.read_objects())))
+
+
class TestPackIterator(DeltaChainIterator):
_compute_crc32 = True
--
1.7.3.1
References