hace 2 meses · 5d25da17a2
--- a/dulwich/pack.py
+++ b/dulwich/pack.py
@@ -758,12 +758,15 @@ class MemoryPackIndex(PackIndex):
 
				         self,
			
 
				         entries: list[PackIndexEntry],
			
 
				         pack_checksum: bytes | None = None,
			
 
				+        *,
			
 
				+        object_format: ObjectFormat | None = None,
			
 
				     ) -> None:
			
 
				         """Create a new MemoryPackIndex.
			
 
				 
			
 
				         Args:
			
 
				           entries: Sequence of name, idx, crc32 (sorted)
			
 
				           pack_checksum: Optional pack checksum
			
 
				+          object_format: Object format (hash algorithm) to use
			
 
				         """
			
 
				         self._by_sha = {}
			
 
				         self._by_offset = {}
			
@@ -773,6 +776,17 @@ class MemoryPackIndex(PackIndex):
 
				         self._entries = entries
			
 
				         self._pack_checksum = pack_checksum
			
 
				 
			
 
				+        # Set hash size from object format
			
 
				+        if object_format is not None:
			
 
				+            self.hash_size = object_format.oid_length
			
 
				+        else:
			
 
				+            warnings.warn(
			
 
				+                "MemoryPackIndex() should be called with object_format parameter",
			
 
				+                DeprecationWarning,
			
 
				+                stacklevel=2,
			
 
				+            )
			
 
				+            self.hash_size = 20  # Default to SHA1
			
 
				+
			
 
				     def get_pack_checksum(self) -> bytes | None:
			
 
				         """Return the SHA checksum stored for the corresponding packfile."""
			
 
				         return self._pack_checksum
			
@@ -788,9 +802,9 @@ class MemoryPackIndex(PackIndex):
 
				           sha: SHA to look up (binary or hex)
			
 
				         Returns: Offset in the pack file
			
 
				         """
			
 
				-        if len(sha) in (40, 64):  # Hex string (SHA1 or SHA256)
			
 
				-            sha = hex_to_sha(cast(ObjectID, sha))
			
 
				-        return self._by_sha[cast(RawObjectID, sha)]
			
 
				+        if len(sha) == self.hash_size * 2:  # hex string
			
 
				+            sha = hex_to_sha(sha)
			
 
				+        return self._by_sha[sha]
			
 
				 
			
 
				     def object_sha1(self, offset: int) -> bytes:
			
 
				         """Return the SHA1 for the object at the given offset."""
			
@@ -971,8 +985,8 @@ class FilePackIndex(PackIndex):
 
				         lives at within the corresponding pack file. If the pack file doesn't
			
 
				         have the object then None will be returned.
			
 
				         """
			
 
				-        if len(sha) == 40:
			
 
				-            sha = hex_to_sha(cast(ObjectID, sha))
			
 
				+        if len(sha) == self.hash_size * 2:  # hex string
			
 
				+            sha = hex_to_sha(sha)
			
 
				         try:
			
 
				             return self._object_offset(sha)
			
 
				         except ValueError as exc:
			
@@ -1056,12 +1070,9 @@ class PackIndex1(FilePackIndex):
 
				 
			
 
				     def _unpack_entry(self, i: int) -> tuple[RawObjectID, int, None]:
			
 
				         base_offset = (0x100 * 4) + (i * self._entry_size)
			
 
				-        if self.hash_size == 20:
			
 
				-            (offset, name) = unpack_from(">L20s", self._contents, base_offset)
			
 
				-        else:  # SHA256
			
 
				-            offset = unpack_from(">L", self._contents, base_offset)[0]
			
 
				-            name = self._contents[base_offset + 4 : base_offset + 4 + self.hash_size]
			
 
				-        return (RawObjectID(name), offset, None)
			
 
				+        offset = unpack_from(">L", self._contents, base_offset)[0]
			
 
				+        name = self._contents[base_offset + 4 : base_offset + 4 + self.hash_size]
			
 
				+        return (name, offset, None)
			
 
				 
			
 
				     def _unpack_name(self, i: int) -> bytes:
			
 
				         offset = (0x100 * 4) + (i * self._entry_size) + 4
			
@@ -2552,6 +2563,7 @@ class SHA1Writer(BinaryIO):
 
				 
			
 
				 def pack_object_header(
			
 
				     type_num: int, delta_base: bytes | int | None, size: int
			
 
				+    object_format: "ObjectFormat" | None = None
			
 
				 ) -> bytearray:
			
 
				     """Create a pack object header for the given object info.
			
 
				 
			
@@ -2559,8 +2571,18 @@ def pack_object_header(
 
				       type_num: Numeric type of the object.
			
 
				       delta_base: Delta base offset or ref, or None for whole objects.
			
 
				       size: Uncompressed object size.
			
 
				+      object_format: Object format (hash algorithm) to use.
			
 
				     Returns: A header for a packed object.
			
 
				     """
			
 
				+    from .object_format import DEFAULT_OBJECT_FORMAT
			
 
				+    if object_format is None:
			
 
				+        warnings.warn(
			
 
				+            "pack_object_header() should be called with object_format parameter",
			
 
				+            DeprecationWarning,
			
 
				+            stacklevel=2,
			
 
				+        )
			
 
				+        object_format = DEFAULT_OBJECT_FORMAT
			
 
				+
			
 
				     header = []
			
 
				     c = (type_num << 4) | (size & 15)
			
 
				     size >>= 4
			
@@ -2579,8 +2601,7 @@ def pack_object_header(
 
				             delta_base >>= 7
			
 
				         header.extend(ret)
			
 
				     elif type_num == REF_DELTA:
			
 
				-        assert isinstance(delta_base, bytes)
			
 
				-        assert len(delta_base) == 20
			
 
				+        assert len(delta_base) == object_format.oid_length
			
 
				         header += delta_base
			
 
				     return bytearray(header)
			
 
				 
			
@@ -3955,8 +3976,8 @@ class Pack:
 
				                 assert isinstance(base_type, int)
			
 
				             elif base_type == REF_DELTA:
			
 
				                 (basename, delta) = base_obj
			
 
				-                assert isinstance(basename, bytes) and len(basename) == 20
			
 
				-                base_offset, base_type, base_obj = get_ref(cast(RawObjectID, basename))
			
 
				+                assert isinstance(basename, bytes) and len(basename) == self.object_format.oid_length
			
 
				+                base_offset, base_type, base_obj = get_ref(basename)
			
 
				                 assert isinstance(base_type, int)
			
 
				                 if base_offset == prev_offset:  # object is based on itself
			
 
				                     raise UnresolvedDeltas([basename])
			
@@ -4046,12 +4067,21 @@ def extend_pack(
 
				     *,
			
 
				     compression_level: int = -1,
			
 
				     progress: Callable[[bytes], None] | None = None,
			
 
				-) -> tuple[bytes, list[tuple["RawObjectID", int, int]]]:
			
 
				+    object_format: ObjectFormat | None = None,
			
 
				+) -> tuple[bytes, list[tuple[bytes, int, int]]]:
			
 
				     """Extend a pack file with more objects.
			
 
				 
			
 
				     The caller should make sure that object_ids does not contain any objects
			
 
				     that are already in the pack
			
 
				     """
			
 
				+    from .object_format import DEFAULT_OBJECT_FORMAT
			
 
				+    if object_format is None:
			
 
				+        warnings.warn(
			
 
				+            "extend_pack() should be called with object_format parameter",
			
 
				+            DeprecationWarning,
			
 
				+            stacklevel=2,
			
 
				+        )
			
 
				+        object_format = DEFAULT_OBJECT_FORMAT
			
 
				     # Update the header with the new number of objects.
			
 
				     f.seek(0)
			
 
				     _version, num_objects = read_pack_header(f.read)
			
@@ -4077,7 +4107,7 @@ def extend_pack(
 
				             progress(
			
 
				                 (f"writing extra base objects: {i}/{len(object_ids)}\r").encode("ascii")
			
 
				             )
			
 
				-        assert len(object_id) == 20
			
 
				+        assert len(object_id) == object_format.oid_length
			
 
				         type_num, data = get_raw(object_id)
			
 
				         offset = f.tell()
			
 
				         crc32 = write_pack_object(