
pack: Create an UnpackedObject for better encapsulation.

Previous code was passing around lots of 4- and 5-tuples. This object
replaces almost all such tuples by storing the superset of all their
fields. It is designed to be created and incrementally populated, which
is why it isn't a namedtuple.
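
A minimal usage sketch (an illustration only, not part of this commit): unpack_object now returns an UnpackedObject plus any unused read data, and callers read named attributes instead of unpacking a tuple. The pack file name and the 12-byte header skip below are assumptions made for the example.

    from dulwich.pack import unpack_object

    f = open('pack-example.pack', 'rb')  # hypothetical pack file name
    f.seek(12)  # skip the 12-byte pack header (signature, version, object count)

    # Before this change: type_num, uncomp, comp_len, crc32, unused = unpack_object(...)
    unpacked, unused = unpack_object(f.read, compute_crc32=True)

    print unpacked.pack_type_num             # type as stored in the pack (may be a delta type)
    print ''.join(unpacked.decomp_chunks)    # decompressed data for this entry
    print unpacked.comp_len, unpacked.crc32  # entry size in the pack and CRC32 of the compressed bytes
    f.close()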

Change-Id: Idadc1d88d1f10abadb162f409763975f3acc1ff5
Dave Borowitz, 13 years ago
commit 76989d693c
3 changed files with 270 additions and 150 deletions
  1. NEWS (+5 -2)
  2. dulwich/pack.py (+201 -99)
  3. dulwich/tests/test_pack.py (+64 -49)

+ 5 - 2
NEWS

@@ -37,8 +37,7 @@
 
   * take_msb_bytes, read_zlib_chunks, unpack_objects, and
     PackStreamReader.read_objects now take an additional argument indicating a
-    crc32 to compute, and each return an additional crc32 element in their
-    return values. (Dave Borowitz)
+    crc32 to compute. (Dave Borowitz)
 
   * PackObjectIterator was removed; its functionality is still exposed by
     PackData.iterobjects. (Dave Borowitz)
@@ -60,6 +59,10 @@
 
   * Custom buffer size in read_zlib_chunks. (Dave Borowitz)
 
+  * New UnpackedObject data class that replaces ad-hoc tuples in the return
+    value of unpack_object and various DeltaChainIterator methods.
+    (Dave Borowitz)
+
 TEST CHANGES
 
   * If setuptools is installed, "python setup.py test" will now run the testsuite.

+ 201 - 99
dulwich/pack.py

@@ -76,6 +76,7 @@ from dulwich._compat import (
     make_sha,
     SEEK_CUR,
     SEEK_END,
+    namedtuple,
     )
 from dulwich.objects import (
     ShaFile,
@@ -108,58 +109,139 @@ def take_msb_bytes(read, crc32=None):
     return ret, crc32
 
 
+class UnpackedObject(object):
+    """Class encapsulating an object unpacked from a pack file.
+
+    These objects should only be created from within unpack_object. Most
+    members start out as empty and are filled in at various points by
+    read_zlib_chunks, unpack_object, DeltaChainIterator, etc.
+
+    End users of this object should take care that the function they're getting
+    this object from is guaranteed to set the members they need.
+    """
+
+    __slots__ = [
+      'offset',         # Offset in its pack.
+      'obj_type_num',   # Type of this object.
+      'obj_chunks',     # Decompressed and delta-resolved chunks.
+      'pack_type_num',  # Type of this object in the pack (may be a delta).
+      'delta_base',     # Delta base offset or SHA.
+      'comp_len',       # Compressed length of this object.
+      'decomp_chunks',  # Decompressed object chunks.
+      'decomp_len',     # Decompressed length of this object.
+      'crc32',          # CRC32.
+      ]
+
+    # TODO(dborowitz): read_zlib_chunks and unpack_object could very well be
+    # methods of this object.
+    def __init__(self, pack_type_num, delta_base, decomp_len, crc32):
+        self.offset = None
+        self.pack_type_num = pack_type_num
+        self.delta_base = delta_base
+        self.comp_len = None
+        self.decomp_chunks = []
+        self.decomp_len = decomp_len
+        self.crc32 = crc32
+
+        if pack_type_num in DELTA_TYPES:
+            self.obj_type_num = None
+            self.obj_chunks = None
+        else:
+            self.obj_type_num = pack_type_num
+            self.obj_chunks = self.decomp_chunks
+            self.delta_base = delta_base
+
+    def sha(self):
+        """Return the binary SHA of this object."""
+        return obj_sha(self.obj_type_num, self.obj_chunks)
+
+    def sha_file(self):
+        """Return a ShaFile from this object."""
+        return ShaFile.from_raw_chunks(self.obj_type_num, self.obj_chunks)
+
+    # Only provided for backwards compatibility with code that expects either
+    # chunks or a delta tuple.
+    def _obj(self):
+        """Return the decompressed chunks, or (delta base, delta chunks)."""
+        if self.pack_type_num in DELTA_TYPES:
+            return (self.delta_base, self.decomp_chunks)
+        else:
+            return self.decomp_chunks
+
+    def __eq__(self, other):
+        if not isinstance(other, UnpackedObject):
+            return False
+        for slot in self.__slots__:
+            if getattr(self, slot) != getattr(other, slot):
+                return False
+        return True
+
+    def __ne__(self, other):
+        return not (self == other)
+
+    def __repr__(self):
+        data = ['%s=%r' % (s, getattr(self, s)) for s in self.__slots__]
+        return '%s(%s)' % (self.__class__.__name__, ', '.join(data))
+
+
 _ZLIB_BUFSIZE = 4096
 
 
-def read_zlib_chunks(read_some, dec_size, buffer_size=_ZLIB_BUFSIZE,
-                     crc32=None):
+def read_zlib_chunks(read_some, unpacked, buffer_size=_ZLIB_BUFSIZE):
     """Read zlib data from a buffer.
 
     This function requires that the buffer have additional data following the
     compressed data, which is guaranteed to be the case for git pack files.
 
     :param read_some: Read function that returns at least one byte, but may
-        return less than the requested size
-    :param dec_size: Expected size of the decompressed buffer
-    :param buffer_size: Size of the read buffer
-    :param crc32: If not None, the CRC32 of the compressed bytes will be
-        computed using this starting CRC32. If False, CRC32 computations will
-        not be done, and the returned CRC32 will be None.
-    :return: Tuple of (
-        list of uncompressed chunks,
-        length of compressed data,
-        crc32 of compressed data,
-        unused read data,
-        ).
+        return less than the requested size.
+    :param unpacked: An UnpackedObject to write result data to. If its crc32
+        attr is not None, the CRC32 of the compressed bytes will be computed
+        using this starting CRC32.
+        After this function, will have the following attrs set:
+            comp_len
+            decomp_chunks
+            decomp_len
+            crc32
+    :param buffer_size: Size of the read buffer.
+    :return: Leftover unused data from the decompression.
     :raise zlib.error: if a decompression error occurred.
     """
-    if dec_size <= -1:
+    if unpacked.decomp_len <= -1:
         raise ValueError('non-negative zlib data stream size expected')
-    obj = zlib.decompressobj()
-    ret = []
-    size = 0
-    comp_size = 0
+    decomp_obj = zlib.decompressobj()
+
+    decomp_chunks = unpacked.decomp_chunks
+    decomp_len = 0
+    comp_len = 0
+    crc32 = unpacked.crc32
+
     while True:
         add = read_some(buffer_size)
         if not add:
             raise zlib.error('EOF before end of zlib stream')
-        comp_size += len(add)
-        decomp = obj.decompress(add)
-        size += len(decomp)
-        ret.append(decomp)
-        unused = obj.unused_data
+        comp_len += len(add)
+        decomp = decomp_obj.decompress(add)
+        decomp_len += len(decomp)
+        decomp_chunks.append(decomp)
+        unused = decomp_obj.unused_data
         if unused:
             left = len(unused)
-            comp_size -= left
+            comp_len -= left
             if crc32 is not None:
                 crc32 = binascii.crc32(add[:-left], crc32)
             break
         elif crc32 is not None:
             crc32 = binascii.crc32(add, crc32)
+    if crc32 is not None:
+        crc32 &= 0xffffffff
 
-    if size != dec_size:
+    if decomp_len != unpacked.decomp_len:
         raise zlib.error('decompressed data does not match expected size')
-    return ret, comp_size, crc32, unused
+
+    unpacked.comp_len = comp_len
+    unpacked.crc32 = crc32
+    return unused
 
 
 def iter_sha1(iter):
@@ -571,15 +653,16 @@ def unpack_object(read_all, read_some=None, compute_crc32=False,
     :param compute_crc32: If True, compute the CRC32 of the compressed data. If
         False, the returned CRC32 will be None.
     :param zlib_bufsize: An optional buffer size for zlib operations.
-    :return: A tuple of (
-        type number,
-        uncompressed data,
-        length of compressed data,
-        CRC32 of compressed data,
-        unused read data,
-        ).
-        For delta types, the uncompressed data is a tuple of
-        (base, uncompressed chunks).
+    :return: A tuple of (unpacked, unused), where unused is the unused data
+        leftover from decompression, and unpacked is an UnpackedObject with the
+        following attrs set:
+            obj_chunks     (for non-delta types)
+            pack_type_num
+            delta_base     (for delta types)
+            comp_len
+            decomp_chunks
+            decomp_len
+            crc32          (if compute_crc32 is True)
     """
     if read_some is None:
         read_some = read_all
@@ -593,6 +676,7 @@ def unpack_object(read_all, read_some=None, compute_crc32=False,
     size = bytes[0] & 0x0f
     for i, byte in enumerate(bytes[1:]):
         size += (byte & 0x7f) << ((i * 7) + 4)
+
     raw_base = len(bytes)
     if type_num == OFS_DELTA:
         bytes, crc32 = take_msb_bytes(read_all, crc32=crc32)
@@ -603,24 +687,19 @@ def unpack_object(read_all, read_some=None, compute_crc32=False,
             delta_base_offset += 1
             delta_base_offset <<= 7
             delta_base_offset += (byte & 0x7f)
-        base = delta_base_offset
+        delta_base = delta_base_offset
     elif type_num == REF_DELTA:
-        base = read_all(20)
+        delta_base = read_all(20)
         if compute_crc32:
-            crc32 = binascii.crc32(base, crc32)
+            crc32 = binascii.crc32(delta_base, crc32)
         raw_base += 20
     else:
-        base = None
+        delta_base = None
 
-    uncomp, comp_len, crc32, unused = read_zlib_chunks(
-      read_some, size, crc32=crc32, buffer_size=zlib_bufsize)
-    if compute_crc32:
-        crc32 &= 0xffffffff
-    comp_len += raw_base
-    if base is None:
-        return type_num, uncomp, comp_len, crc32, unused
-    else:
-        return type_num, (base, uncomp), comp_len, crc32, unused
+    unpacked = UnpackedObject(type_num, delta_base, size, crc32)
+    unused = read_zlib_chunks(read_some, unpacked, buffer_size=zlib_bufsize)
+    unpacked.comp_len += raw_base
+    return unpacked, unused
 
 
 def _compute_object_size((num, obj)):
@@ -719,14 +798,15 @@ class PackStreamReader(object):
 
         :param compute_crc32: If True, compute the CRC32 of the compressed
             data. If False, the returned CRC32 will be None.
-        :return: Iterator over tuples of (
-            offset,
-            type number,
-            list of uncompressed chunks,
-            length of compressed data,
-            crc32 of compressed data,
-            ).
-        :raise AssertionError: if there is an error in the pack format.
+        :return: Iterator over UnpackedObjects with the following members set:
+            offset
+            obj_type_num
+            obj_chunks (for non-delta types)
+            delta_base (for delta types)
+            comp_len
+            decomp_chunks
+            decomp_len
+            crc32 (if compute_crc32 is True)
         :raise ChecksumMismatch: if the checksum of the pack contents does not
             match the checksum in the pack trailer.
         :raise zlib.error: if an error occurred during zlib decompression.
@@ -735,10 +815,10 @@ class PackStreamReader(object):
         pack_version, self._num_objects = read_pack_header(self.read)
         for i in xrange(self._num_objects):
             offset = self.offset
-            type_num, uncomp, comp_len, crc32, unused = unpack_object(
+            unpacked, unused = unpack_object(
               self.read, read_some=self.recv, compute_crc32=compute_crc32,
               zlib_bufsize=self._zlib_bufsize)
-            yield offset, type_num, uncomp, comp_len, crc32
+            unpacked.offset = offset
 
             # prepend any unused data to current read buffer
             buf = StringIO()
@@ -747,6 +827,8 @@
             buf.seek(0)
             self._rbuf = buf
 
+            yield unpacked
+
         if self._buf_len() < 20:
             # If the read buffer is full, then the last read() got the whole
             # trailer off the wire. If not, it means there is still some of the
@@ -794,8 +876,8 @@ class PackStreamCopier(PackStreamReader):
         throw.
         """
         if self._delta_iter:
-            for offset, type_num, uncomp, _, _ in self.read_objects():
-                self._delta_iter.record(offset, type_num, uncomp)
+            for unpacked in self.read_objects():
+                self._delta_iter.record(unpacked)
         else:
             for _ in self.read_objects():
                 pass
@@ -959,12 +1041,24 @@ class PackData(object):
         offset = self._header_size
         for i in xrange(1, self._num_objects + 1):
             self._file.seek(offset)  # Back up over unused data.
-            type_num, obj, total_size, crc32, unused = unpack_object(
+            unpacked, _ = unpack_object(
              self._file.read, compute_crc32=compute_crc32)
             if progress is not None:
                 progress(i, self._num_objects)
-            yield offset, type_num, obj, crc32
-            offset += total_size
+            yield (offset, unpacked.pack_type_num, unpacked._obj(),
+                   unpacked.crc32)
+            offset += unpacked.comp_len
+
+    def _iter_unpacked(self):
+        # TODO(dborowitz): Merge this with iterobjects, if we can change its
+        # return type.
+        offset = self._header_size
+        for _ in xrange(self._num_objects):
+            self._file.seek(offset)  # Back up over unused data.
+            unpacked, _ = unpack_object(self._file.read, compute_crc32=False)
+            unpacked.offset = offset
+            yield unpacked
+            offset += unpacked.comp_len
 
     def iterentries(self, progress=None):
         """Yield entries summarizing the contents of this pack.
@@ -1058,7 +1152,8 @@ class PackData(object):
                 'offset was %r' % offset
         assert offset >= self._header_size
         self._file.seek(offset)
-        return unpack_object(self._file.read)[:2]
+        unpacked, _ = unpack_object(self._file.read)
+        return (unpacked.pack_type_num, unpacked._obj())
 
 
 class DeltaChainIterator(object):
@@ -1068,7 +1163,17 @@ class DeltaChainIterator(object):
     regardless of how many objects reference it as a delta base. As a result,
     memory usage is proportional to the length of the longest delta chain.
 
-    Subclasses override _result to define the result type of the iterator.
+    Subclasses can override _result to define the result type of the iterator.
+    By default, results are UnpackedObjects with the following members set:
+        offset
+        obj_type_num
+        obj_chunks
+        pack_type_num
+        delta_base     (for delta types)
+        comp_len
+        decomp_chunks
+        decomp_len
+        crc32          (if _compute_crc32 is True)
     """
 
     _compute_crc32 = False
@@ -1086,18 +1191,18 @@ class DeltaChainIterator(object):
     def for_pack_data(cls, pack_data, resolve_ext_ref=None):
         walker = cls(None, resolve_ext_ref=resolve_ext_ref)
         walker.set_pack_data(pack_data)
-        for offset, type_num, obj, _ in pack_data.iterobjects():
-            walker.record(offset, type_num, obj)
+        for unpacked in pack_data._iter_unpacked():
+            walker.record(unpacked)
         return walker
 
-    def record(self, offset, type_num, uncomp):
+    def record(self, unpacked):
+        type_num = unpacked.pack_type_num
+        offset = unpacked.offset
         if type_num == OFS_DELTA:
-            delta_offset, _ = uncomp
-            base_offset = offset - delta_offset
+            base_offset = offset - unpacked.delta_base
             self._pending_ofs[base_offset].append(offset)
         elif type_num == REF_DELTA:
-            base_sha, _ = uncomp
-            self._pending_ref[base_sha].append(offset)
+            self._pending_ref[unpacked.delta_base].append(offset)
         else:
             self._full_ofs.append((offset, type_num))
 
@@ -1137,35 +1242,35 @@ class DeltaChainIterator(object):
 
         self._ensure_no_pending()
 
-    def _result(self, offset, type_num, chunks, sha, crc32):
-        raise NotImplementedError
+    def _result(self, unpacked):
+        return unpacked
 
-    def _resolve_object(self, offset, base_type_num, base_chunks):
+    def _resolve_object(self, offset, obj_type_num, base_chunks):
         self._file.seek(offset)
-        type_num, obj, _, crc32, _ = unpack_object(
+        unpacked, _ = unpack_object(
           self._file.read, compute_crc32=self._compute_crc32)
+        unpacked.offset = offset
         if base_chunks is None:
-            assert type_num == base_type_num
-            chunks = obj
+            assert unpacked.pack_type_num == obj_type_num
         else:
-            assert type_num in DELTA_TYPES
-            _, delta_chunks = obj
-            chunks = apply_delta(base_chunks, delta_chunks)
-        sha = obj_sha(base_type_num, chunks)
-        return chunks, sha, crc32
+            assert unpacked.pack_type_num in DELTA_TYPES
+            unpacked.obj_type_num = obj_type_num
+            unpacked.obj_chunks = apply_delta(base_chunks,
+                                              unpacked.decomp_chunks)
+        return unpacked
 
-    def _follow_chain(self, offset, base_type_num, base_chunks):
+    def _follow_chain(self, offset, obj_type_num, base_chunks):
         # Unlike PackData.get_object_at, there is no need to cache offsets as
         # this approach by design inflates each object exactly once.
-        chunks, sha, crc32 = self._resolve_object(offset, base_type_num,
-                                                  base_chunks)
-        yield self._result(offset, base_type_num, chunks, sha, crc32)
+        unpacked = self._resolve_object(offset, obj_type_num, base_chunks)
+        yield self._result(unpacked)
 
-        pending = chain(self._pending_ofs.pop(offset, []),
-                        self._pending_ref.pop(sha, []))
+        pending = chain(self._pending_ofs.pop(unpacked.offset, []),
+                        self._pending_ref.pop(unpacked.sha(), []))
         for new_offset in pending:
-            for result in self._follow_chain(new_offset, base_type_num, chunks):
-                yield result
+            for new_result in self._follow_chain(
+              new_offset, unpacked.obj_type_num, unpacked.obj_chunks):
+                yield new_result
 
     def __iter__(self):
         return self._walk_all_chains()
@@ -1179,18 +1284,15 @@ class PackIndexer(DeltaChainIterator):
 
     _compute_crc32 = True
 
-    def _result(self, offset, unused_type_num, unused_chunks, sha, crc32):
-        return sha, offset, crc32
+    def _result(self, unpacked):
+        return unpacked.sha(), unpacked.offset, unpacked.crc32
 
 
 class PackInflater(DeltaChainIterator):
    """Delta chain iterator that yields ShaFile objects."""
 
-    def _result(self, unused_offset, type_num, chunks, unused_sha,
-                unused_crc32):
-        # TODO: If from_raw_chunks supported it, we could pass in the SHA to
-        # avoid another pass over the file.
-        return ShaFile.from_raw_chunks(type_num, chunks)
+    def _result(self, unpacked):
+        return unpacked.sha_file()
 
 
 class SHA1Reader(object):

+ 64 - 49
dulwich/tests/test_pack.py

@@ -57,6 +57,7 @@ from dulwich.pack import (
     create_delta,
     deltify_pack_objects,
     load_pack_index,
+    UnpackedObject,
     read_zlib_chunks,
     write_pack_header,
     write_pack_index_v1,
@@ -436,8 +437,13 @@ class WritePackTests(TestCase):
         f.write('x')  # unpack_object needs extra trailing data.
         f.seek(offset)
         comp_len = len(f.getvalue()) - offset - 1
-        self.assertEqual((Blob.type_num, ['blob'], comp_len, crc32, 'x'),
-                         unpack_object(f.read, compute_crc32=True))
+        unpacked, unused = unpack_object(f.read, compute_crc32=True)
+        self.assertEqual(Blob.type_num, unpacked.pack_type_num)
+        self.assertEqual(Blob.type_num, unpacked.obj_type_num)
+        self.assertEqual(['blob'], unpacked.decomp_chunks)
+        self.assertEqual(comp_len, unpacked.comp_len)
+        self.assertEqual(crc32, unpacked.crc32)
+        self.assertEqual('x', unused)
 
     def test_write_pack_object_sha(self):
         f = StringIO()
@@ -570,45 +576,50 @@ class ReadZlibTests(TestCase):
     def setUp(self):
         super(ReadZlibTests, self).setUp()
         self.read = StringIO(self.comp + self.extra).read
+        self.unpacked = UnpackedObject(Tree.type_num, None, len(self.decomp), 0)
 
     def test_decompress_size(self):
         good_decomp_len = len(self.decomp)
-        self.assertRaises(ValueError, read_zlib_chunks, self.read, -1)
+        self.unpacked.decomp_len = -1
+        self.assertRaises(ValueError, read_zlib_chunks, self.read,
+                          self.unpacked)
+        self.unpacked.decomp_len = good_decomp_len - 1
         self.assertRaises(zlib.error, read_zlib_chunks, self.read,
-                          good_decomp_len - 1)
+                          self.unpacked)
+        self.unpacked.decomp_len = good_decomp_len + 1
         self.assertRaises(zlib.error, read_zlib_chunks, self.read,
-                          good_decomp_len + 1)
+                          self.unpacked)
 
     def test_decompress_truncated(self):
         read = StringIO(self.comp[:10]).read
-        self.assertRaises(zlib.error, read_zlib_chunks, read, len(self.decomp))
+        self.assertRaises(zlib.error, read_zlib_chunks, read, self.unpacked)
 
         read = StringIO(self.comp).read
-        self.assertRaises(zlib.error, read_zlib_chunks, read, len(self.decomp))
+        self.assertRaises(zlib.error, read_zlib_chunks, read, self.unpacked)
 
     def test_decompress_empty(self):
+        unpacked = UnpackedObject(Tree.type_num, None, 0, None)
         comp = zlib.compress('')
         read = StringIO(comp + self.extra).read
-        decomp, comp_len, crc32, unused_data = read_zlib_chunks(read, 0,
-                                                                crc32=0)
-        self.assertEqual('', ''.join(decomp))
-        self.assertEqual(len(comp), comp_len)
-        self.assertNotEquals('', unused_data)
-        self.assertEquals(self.extra, unused_data + read())
+        unused = read_zlib_chunks(read, unpacked)
+        self.assertEqual('', ''.join(unpacked.decomp_chunks))
+        self.assertEqual(len(comp), unpacked.comp_len)
+        self.assertNotEquals('', unused)
+        self.assertEquals(self.extra, unused + read())
 
     def test_decompress_no_crc32(self):
-        _, _, crc32, _ = read_zlib_chunks(
-          self.read, len(self.decomp), buffer_size=4096)
-        self.assertEquals(None, crc32)
+        self.unpacked.crc32 = None
+        read_zlib_chunks(self.read, self.unpacked)
+        self.assertEquals(None, self.unpacked.crc32)
 
     def _do_decompress_test(self, buffer_size):
-        decomp, comp_len, crc32, unused_data = read_zlib_chunks(
-          self.read, len(self.decomp), buffer_size=buffer_size, crc32=0)
-        self.assertEquals(self.decomp, ''.join(decomp))
-        self.assertEquals(len(self.comp), comp_len)
-        self.assertEquals(crc32, zlib.crc32(self.comp))
-        self.assertNotEquals('', unused_data)
-        self.assertEquals(self.extra, unused_data + self.read())
+        unused = read_zlib_chunks(self.read, self.unpacked,
+                                  buffer_size=buffer_size)
+        self.assertEquals(self.decomp, ''.join(self.unpacked.decomp_chunks))
+        self.assertEquals(len(self.comp), self.unpacked.comp_len)
+        self.assertEquals(zlib.crc32(self.comp), self.unpacked.crc32)
+        self.assertNotEquals('', unused)
+        self.assertEquals(self.extra, unused + self.read())
 
     def test_simple_decompress(self):
         self._do_decompress_test(4096)
@@ -668,23 +679,27 @@ class TestPackStreamReader(TestCase):
         objects = list(reader.read_objects(compute_crc32=True))
         self.assertEqual(2, len(objects))
 
-        blob, delta = objects
-        bofs, btype, buncomp, blen, bcrc = blob
-        dofs, dtype, duncomp, dlen, dcrc = delta
-
-        self.assertEqual(entries[0][0], bofs)
-        self.assertEqual(Blob.type_num, btype)
-        self.assertEqual('blob', ''.join(buncomp))
-        self.assertEqual(dofs - bofs, blen)
-        self.assertEqual(entries[0][4], bcrc)
-
-        self.assertEqual(entries[1][0], dofs)
-        self.assertEqual(OFS_DELTA, dtype)
-        delta_ofs, delta_chunks = duncomp
-        self.assertEqual(dofs - bofs, delta_ofs)
-        self.assertEqual(create_delta('blob', 'blob1'), ''.join(delta_chunks))
-        self.assertEqual(len(f.getvalue()) - 20 - dofs, dlen)
-        self.assertEqual(entries[1][4], dcrc)
+        unpacked_blob, unpacked_delta = objects
+
+        self.assertEqual(entries[0][0], unpacked_blob.offset)
+        self.assertEqual(Blob.type_num, unpacked_blob.pack_type_num)
+        self.assertEqual(Blob.type_num, unpacked_blob.obj_type_num)
+        self.assertEqual(None, unpacked_blob.delta_base)
+        self.assertEqual('blob', ''.join(unpacked_blob.decomp_chunks))
+        self.assertEqual(unpacked_delta.offset - unpacked_blob.offset,
+                         unpacked_blob.comp_len)
+        self.assertEqual(entries[0][4], unpacked_blob.crc32)
+
+        self.assertEqual(entries[1][0], unpacked_delta.offset)
+        self.assertEqual(OFS_DELTA, unpacked_delta.pack_type_num)
+        self.assertEqual(None, unpacked_delta.obj_type_num)
+        self.assertEqual(unpacked_delta.offset - unpacked_blob.offset,
+                         unpacked_delta.delta_base)
+        self.assertEqual(create_delta('blob', 'blob1'),
+                         ''.join(unpacked_delta.decomp_chunks))
+        self.assertEqual(len(f.getvalue()) - 20 - unpacked_delta.offset,
+                         unpacked_delta.comp_len)
+        self.assertEqual(entries[1][4], unpacked_delta.crc32)
 
     def test_read_objects_buffered(self):
         f = StringIO()
@@ -702,19 +717,19 @@ class TestPackIterator(DeltaChainIterator):
 
     def __init__(self, *args, **kwargs):
         super(TestPackIterator, self).__init__(*args, **kwargs)
-        self._unpacked = set()
+        self._unpacked_offsets = set()
 
-    def _result(self, offset, type_num, chunks, sha, crc32):
+    def _result(self, unpacked):
         """Return entries in the same format as build_pack."""
-        return offset, type_num, ''.join(chunks), sha, crc32
+        return (unpacked.offset, unpacked.obj_type_num,
+                ''.join(unpacked.obj_chunks), unpacked.sha(), unpacked.crc32)
 
-    def _resolve_object(self, offset, base_type_num, base_chunks):
-        assert offset not in self._unpacked, ('Attempted to re-inflate offset '
-                                              '%i' % offset)
-        self._unpacked.add(offset)
+    def _resolve_object(self, offset, pack_type_num, base_chunks):
+        assert offset not in self._unpacked_offsets, (
+                'Attempted to re-inflate offset %i' % offset)
+        self._unpacked_offsets.add(offset)
         return super(TestPackIterator, self)._resolve_object(
-          offset, base_type_num, base_chunks)
-
+          offset, pack_type_num, base_chunks)
 
 
 class DeltaChainIteratorTests(TestCase):