test_dumb.py 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297
  1. # test_dumb.py -- Tests for dumb HTTP git repositories
  2. # Copyright (C) 2025 Dulwich contributors
  3. #
  4. # SPDX-License-Identifier: Apache-2.0 OR GPL-2.0-or-later
  5. # Dulwich is dual-licensed under the Apache License, Version 2.0 and the GNU
  6. # General Public License as published by the Free Software Foundation; version 2.0
  7. # or (at your option) any later version. You can redistribute it and/or
  8. # modify it under the terms of either of these two licenses.
  9. #
  10. # Unless required by applicable law or agreed to in writing, software
  11. # distributed under the License is distributed on an "AS IS" BASIS,
  12. # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. # See the License for the specific language governing permissions and
  14. # limitations under the License.
  15. #
  16. # You should have received a copy of the licenses; if not, see
  17. # <http://www.gnu.org/licenses/> for a copy of the GNU General Public License
  18. # and <http://www.apache.org/licenses/LICENSE-2.0> for a copy of the Apache
  19. # License, Version 2.0.
  20. #
  21. """Tests for dumb HTTP git repositories."""
  22. import zlib
  23. from typing import Callable, Optional, Union
  24. from unittest import TestCase
  25. from unittest.mock import Mock
  26. from dulwich.dumb import DumbHTTPObjectStore, DumbRemoteHTTPRepo
  27. from dulwich.errors import NotGitRepository
  28. from dulwich.objects import Blob, Commit, ShaFile, Tag, Tree, sha_to_hex
  29. class MockResponse:
  30. def __init__(self, status: int = 200, content: bytes = b"", headers: Optional[dict[str, str]] = None) -> None:
  31. self.status = status
  32. self.content = content
  33. self.headers = headers or {}
  34. self.closed = False
  35. def close(self) -> None:
  36. self.closed = True
  37. class DumbHTTPObjectStoreTests(TestCase):
  38. """Tests for DumbHTTPObjectStore."""
  39. def setUp(self) -> None:
  40. self.base_url = "https://example.com/repo.git/"
  41. self.responses: dict[str, dict[str, Union[int, bytes]]] = {}
  42. self.store = DumbHTTPObjectStore(self.base_url, self._mock_http_request)
  43. def _mock_http_request(self, url: str, headers: dict[str, str]) -> tuple[MockResponse, Callable[[Optional[int]], bytes]]:
  44. """Mock HTTP request function."""
  45. if url in self.responses:
  46. resp_data = self.responses[url]
  47. resp = MockResponse(
  48. int(resp_data.get("status", 200)), bytes(resp_data.get("content", b""))
  49. )
  50. # Create a mock read function that behaves like urllib3's read
  51. content = resp.content
  52. offset = [0] # Use list to make it mutable in closure
  53. def read_func(size: Optional[int] = None) -> bytes:
  54. if offset[0] >= len(content):
  55. return b""
  56. if size is None:
  57. result = content[offset[0] :]
  58. offset[0] = len(content)
  59. else:
  60. result = content[offset[0] : offset[0] + size]
  61. offset[0] += size
  62. return result
  63. return resp, read_func
  64. else:
  65. resp = MockResponse(404)
  66. return resp, lambda size: b""
  67. def _add_response(self, path: str, content: bytes, status: int = 200) -> None:
  68. """Add a mock response for a given path."""
  69. url = self.base_url + path
  70. self.responses[url] = {"status": status, "content": content}
  71. def _make_object(self, obj: ShaFile) -> bytes:
  72. """Create compressed git object data."""
  73. type_name = {
  74. Blob.type_num: b"blob",
  75. Tree.type_num: b"tree",
  76. Commit.type_num: b"commit",
  77. Tag.type_num: b"tag",
  78. }[obj.type_num]
  79. content = obj.as_raw_string()
  80. header = type_name + b" " + str(len(content)).encode() + b"\x00"
  81. return zlib.compress(header + content)
  82. def test_fetch_loose_object_blob(self) -> None:
  83. # Create a blob object
  84. blob = Blob()
  85. blob.data = b"Hello, world!"
  86. hex_sha = blob.id
  87. # Add mock response
  88. path = f"objects/{hex_sha[:2].decode('ascii')}/{hex_sha[2:].decode('ascii')}"
  89. self._add_response(path, self._make_object(blob))
  90. # Fetch the object
  91. type_num, content = self.store._fetch_loose_object(blob.id)
  92. self.assertEqual(Blob.type_num, type_num)
  93. self.assertEqual(b"Hello, world!", content)
  94. def test_fetch_loose_object_not_found(self) -> None:
  95. hex_sha = b"1" * 40
  96. self.assertRaises(KeyError, self.store._fetch_loose_object, hex_sha)
  97. def test_fetch_loose_object_invalid_format(self) -> None:
  98. sha = b"1" * 20
  99. hex_sha = sha_to_hex(sha)
  100. path = f"objects/{hex_sha[:2].decode('ascii')}/{hex_sha[2:].decode('ascii')}"
  101. # Add invalid compressed data
  102. self._add_response(path, b"invalid data")
  103. self.assertRaises(Exception, self.store._fetch_loose_object, sha)
  104. def test_load_packs_empty(self) -> None:
  105. # No packs file
  106. self.store._load_packs()
  107. self.assertEqual([], self.store._packs)
  108. def test_load_packs_with_entries(self) -> None:
  109. packs_content = b"""P pack-1234567890abcdef1234567890abcdef12345678.pack
  110. P pack-abcdef1234567890abcdef1234567890abcdef12.pack
  111. """
  112. self._add_response("objects/info/packs", packs_content)
  113. self.store._load_packs()
  114. assert self.store._packs is not None
  115. self.assertEqual(2, len(self.store._packs))
  116. self.assertEqual(
  117. "pack-1234567890abcdef1234567890abcdef12345678", self.store._packs[0][0]
  118. )
  119. self.assertEqual(
  120. "pack-abcdef1234567890abcdef1234567890abcdef12", self.store._packs[1][0]
  121. )
  122. def test_get_raw_from_cache(self) -> None:
  123. sha = b"1" * 40
  124. self.store._cached_objects[sha] = (Blob.type_num, b"cached content")
  125. type_num, content = self.store.get_raw(sha)
  126. self.assertEqual(Blob.type_num, type_num)
  127. self.assertEqual(b"cached content", content)
  128. def test_contains_loose(self) -> None:
  129. # Create a blob object
  130. blob = Blob()
  131. blob.data = b"Test blob"
  132. hex_sha = blob.id
  133. # Add mock response
  134. path = f"objects/{hex_sha[:2].decode('ascii')}/{hex_sha[2:].decode('ascii')}"
  135. self._add_response(path, self._make_object(blob))
  136. self.assertTrue(self.store.contains_loose(hex_sha))
  137. self.assertFalse(self.store.contains_loose(b"0" * 40))
  138. def test_add_object_not_implemented(self) -> None:
  139. blob = Blob()
  140. blob.data = b"test"
  141. self.assertRaises(NotImplementedError, self.store.add_object, blob)
  142. def test_add_objects_not_implemented(self) -> None:
  143. self.assertRaises(NotImplementedError, self.store.add_objects, [])
  144. class DumbRemoteHTTPRepoTests(TestCase):
  145. """Tests for DumbRemoteHTTPRepo."""
  146. def setUp(self) -> None:
  147. self.base_url = "https://example.com/repo.git/"
  148. self.responses: dict[str, dict[str, Union[int, bytes]]] = {}
  149. self.repo = DumbRemoteHTTPRepo(self.base_url, self._mock_http_request)
  150. def _mock_http_request(self, url: str, headers: dict[str, str]) -> tuple[MockResponse, Callable[[Optional[int]], bytes]]:
  151. """Mock HTTP request function."""
  152. if url in self.responses:
  153. resp_data = self.responses[url]
  154. resp = MockResponse(
  155. int(resp_data.get("status", 200)), bytes(resp_data.get("content", b""))
  156. )
  157. # Create a mock read function that behaves like urllib3's read
  158. content = resp.content
  159. offset = [0] # Use list to make it mutable in closure
  160. def read_func(size: Optional[int] = None) -> bytes:
  161. if offset[0] >= len(content):
  162. return b""
  163. if size is None:
  164. result = content[offset[0] :]
  165. offset[0] = len(content)
  166. else:
  167. result = content[offset[0] : offset[0] + size]
  168. offset[0] += size
  169. return result
  170. return resp, read_func
  171. else:
  172. resp = MockResponse(404)
  173. return resp, lambda size: b""
  174. def _add_response(self, path: str, content: bytes, status: int = 200) -> None:
  175. """Add a mock response for a given path."""
  176. url = self.base_url + path
  177. self.responses[url] = {"status": status, "content": content}
  178. def test_get_refs(self) -> None:
  179. refs_content = b"""0123456789abcdef0123456789abcdef01234567\trefs/heads/master
  180. abcdef0123456789abcdef0123456789abcdef01\trefs/heads/develop
  181. fedcba9876543210fedcba9876543210fedcba98\trefs/tags/v1.0
  182. """
  183. self._add_response("info/refs", refs_content)
  184. refs = self.repo.get_refs()
  185. self.assertEqual(3, len(refs))
  186. self.assertEqual(
  187. b"0123456789abcdef0123456789abcdef01234567",
  188. refs[b"refs/heads/master"],
  189. )
  190. self.assertEqual(
  191. b"abcdef0123456789abcdef0123456789abcdef01",
  192. refs[b"refs/heads/develop"],
  193. )
  194. self.assertEqual(
  195. b"fedcba9876543210fedcba9876543210fedcba98",
  196. refs[b"refs/tags/v1.0"],
  197. )
  198. def test_get_refs_not_found(self) -> None:
  199. self.assertRaises(NotGitRepository, self.repo.get_refs)
  200. def test_get_peeled(self) -> None:
  201. refs_content = b"0123456789abcdef0123456789abcdef01234567\trefs/heads/master\n"
  202. self._add_response("info/refs", refs_content)
  203. # For dumb HTTP, peeled just returns the ref value
  204. peeled = self.repo.get_peeled(b"refs/heads/master")
  205. self.assertEqual(b"0123456789abcdef0123456789abcdef01234567", peeled)
  206. def test_fetch_pack_data_no_wants(self) -> None:
  207. refs_content = b"0123456789abcdef0123456789abcdef01234567\trefs/heads/master\n"
  208. self._add_response("info/refs", refs_content)
  209. graph_walker = Mock()
  210. def determine_wants(refs: dict[bytes, bytes]) -> list[bytes]:
  211. return []
  212. result = list(self.repo.fetch_pack_data(graph_walker, determine_wants))
  213. self.assertEqual([], result)
  214. def test_fetch_pack_data_with_blob(self) -> None:
  215. # Set up refs
  216. refs_content = b"0123456789abcdef0123456789abcdef01234567\trefs/heads/master\n"
  217. self._add_response("info/refs", refs_content)
  218. # Create a simple blob object
  219. blob = Blob()
  220. blob.data = b"Test content"
  221. blob_sha = blob.id
  222. # Add blob response
  223. self.repo.object_store._cached_objects[blob_sha] = (
  224. Blob.type_num,
  225. blob.as_raw_string(),
  226. )
  227. # Mock graph walker
  228. graph_walker = Mock()
  229. graph_walker.ack.return_value = [] # No existing objects
  230. def determine_wants(refs: dict[bytes, bytes]) -> list[bytes]:
  231. return [blob_sha]
  232. def progress(msg: bytes) -> None:
  233. assert isinstance(msg, bytes)
  234. result = list(
  235. self.repo.fetch_pack_data(graph_walker, determine_wants, progress)
  236. )
  237. self.assertEqual(1, len(result))
  238. self.assertEqual(Blob.type_num, result[0].pack_type_num)
  239. self.assertEqual([blob.as_raw_string()], result[0].obj_chunks)
  240. def test_object_store_property(self) -> None:
  241. self.assertIsInstance(self.repo.object_store, DumbHTTPObjectStore)
  242. self.assertEqual(self.base_url, self.repo.object_store.base_url)