test_object_store.py 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353
  1. # test_object_store.py -- tests for object_store.py
  2. # Copyright (C) 2008 Jelmer Vernooij <jelmer@jelmer.uk>
  3. #
  4. # SPDX-License-Identifier: Apache-2.0 OR GPL-2.0-or-later
  5. # Dulwich is dual-licensed under the Apache License, Version 2.0 and the GNU
  6. # General Public License as published by the Free Software Foundation; version 2.0
  7. # or (at your option) any later version. You can redistribute it and/or
  8. # modify it under the terms of either of these two licenses.
  9. #
  10. # Unless required by applicable law or agreed to in writing, software
  11. # distributed under the License is distributed on an "AS IS" BASIS,
  12. # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. # See the License for the specific language governing permissions and
  14. # limitations under the License.
  15. #
  16. # You should have received a copy of the licenses; if not, see
  17. # <http://www.gnu.org/licenses/> for a copy of the GNU General Public License
  18. # and <http://www.apache.org/licenses/LICENSE-2.0> for a copy of the Apache
  19. # License, Version 2.0.
  20. #
  21. """Tests for the object store interface."""
  22. from typing import TYPE_CHECKING, Any, Callable
  23. from unittest.mock import patch
  24. from dulwich.index import commit_tree
  25. from dulwich.object_store import (
  26. PackBasedObjectStore,
  27. iter_tree_contents,
  28. peel_sha,
  29. )
  30. from dulwich.objects import (
  31. Blob,
  32. Tree,
  33. TreeEntry,
  34. )
  35. from dulwich.protocol import DEPTH_INFINITE
  36. from .utils import make_object, make_tag
  37. if TYPE_CHECKING:
  38. from dulwich.object_store import BaseObjectStore
# Module-level Blob fixture, created once at import time and reused by the
# tests below.
testobject = make_object(Blob, data=b"yummy data")
  40. class ObjectStoreTests:
  41. store: "BaseObjectStore"
  42. assertEqual: Callable[[object, object], None]
  43. # For type checker purposes - actual implementation supports both styles
  44. assertRaises: Callable[..., Any]
  45. assertNotIn: Callable[[object, object], None]
  46. assertNotEqual: Callable[[object, object], None]
  47. assertIn: Callable[[object, object], None]
  48. def test_determine_wants_all(self) -> None:
  49. self.assertEqual(
  50. [b"1" * 40],
  51. self.store.determine_wants_all({b"refs/heads/foo": b"1" * 40}),
  52. )
  53. def test_determine_wants_all_zero(self) -> None:
  54. self.assertEqual(
  55. [], self.store.determine_wants_all({b"refs/heads/foo": b"0" * 40})
  56. )
  57. def test_determine_wants_all_depth(self) -> None:
  58. self.store.add_object(testobject)
  59. refs = {b"refs/heads/foo": testobject.id}
  60. with patch.object(self.store, "_get_depth", return_value=1) as m:
  61. self.assertEqual([], self.store.determine_wants_all(refs, depth=0))
  62. self.assertEqual(
  63. [testobject.id],
  64. self.store.determine_wants_all(refs, depth=DEPTH_INFINITE),
  65. )
  66. m.assert_not_called()
  67. self.assertEqual([], self.store.determine_wants_all(refs, depth=1))
  68. m.assert_called_with(testobject.id)
  69. self.assertEqual(
  70. [testobject.id], self.store.determine_wants_all(refs, depth=2)
  71. )
  72. def test_get_depth(self) -> None:
  73. self.assertEqual(0, self.store._get_depth(testobject.id))
  74. self.store.add_object(testobject)
  75. self.assertEqual(
  76. 1, self.store._get_depth(testobject.id, get_parents=lambda x: [])
  77. )
  78. parent = make_object(Blob, data=b"parent data")
  79. self.store.add_object(parent)
  80. self.assertEqual(
  81. 2,
  82. self.store._get_depth(
  83. testobject.id,
  84. get_parents=lambda x: [parent.id] if x == testobject else [],
  85. ),
  86. )
  87. def test_iter(self) -> None:
  88. self.assertEqual([], list(self.store))
  89. def test_get_nonexistant(self) -> None:
  90. self.assertRaises(KeyError, lambda: self.store[b"a" * 40])
  91. def test_contains_nonexistant(self) -> None:
  92. self.assertNotIn(b"a" * 40, self.store)
  93. def test_add_objects_empty(self) -> None:
  94. self.store.add_objects([])
  95. def test_add_commit(self) -> None:
  96. # TODO: Argh, no way to construct Git commit objects without
  97. # access to a serialized form.
  98. self.store.add_objects([])
  99. def test_store_resilience(self) -> None:
  100. """Test if updating an existing stored object doesn't erase the
  101. object from the store.
  102. """
  103. test_object = make_object(Blob, data=b"data")
  104. self.store.add_object(test_object)
  105. test_object_id = test_object.id
  106. test_object.data = test_object.data + b"update"
  107. stored_test_object = self.store[test_object_id]
  108. self.assertNotEqual(test_object.id, stored_test_object.id)
  109. self.assertEqual(stored_test_object.id, test_object_id)
  110. def test_add_object(self) -> None:
  111. self.store.add_object(testobject)
  112. self.assertEqual({testobject.id}, set(self.store))
  113. self.assertIn(testobject.id, self.store)
  114. r = self.store[testobject.id]
  115. self.assertEqual(r, testobject)
  116. def test_add_objects(self) -> None:
  117. data = [(testobject, "mypath")]
  118. self.store.add_objects(data)
  119. self.assertEqual({testobject.id}, set(self.store))
  120. self.assertIn(testobject.id, self.store)
  121. r = self.store[testobject.id]
  122. self.assertEqual(r, testobject)
  123. def test_tree_changes(self) -> None:
  124. blob_a1 = make_object(Blob, data=b"a1")
  125. blob_a2 = make_object(Blob, data=b"a2")
  126. blob_b = make_object(Blob, data=b"b")
  127. for blob in [blob_a1, blob_a2, blob_b]:
  128. self.store.add_object(blob)
  129. blobs_1 = [(b"a", blob_a1.id, 0o100644), (b"b", blob_b.id, 0o100644)]
  130. tree1_id = commit_tree(self.store, blobs_1)
  131. blobs_2 = [(b"a", blob_a2.id, 0o100644), (b"b", blob_b.id, 0o100644)]
  132. tree2_id = commit_tree(self.store, blobs_2)
  133. change_a = (
  134. (b"a", b"a"),
  135. (0o100644, 0o100644),
  136. (blob_a1.id, blob_a2.id),
  137. )
  138. self.assertEqual([change_a], list(self.store.tree_changes(tree1_id, tree2_id)))
  139. self.assertEqual(
  140. [
  141. change_a,
  142. ((b"b", b"b"), (0o100644, 0o100644), (blob_b.id, blob_b.id)),
  143. ],
  144. list(self.store.tree_changes(tree1_id, tree2_id, want_unchanged=True)),
  145. )
  146. def test_iter_tree_contents(self) -> None:
  147. blob_a = make_object(Blob, data=b"a")
  148. blob_b = make_object(Blob, data=b"b")
  149. blob_c = make_object(Blob, data=b"c")
  150. for blob in [blob_a, blob_b, blob_c]:
  151. self.store.add_object(blob)
  152. blobs = [
  153. (b"a", blob_a.id, 0o100644),
  154. (b"ad/b", blob_b.id, 0o100644),
  155. (b"ad/bd/c", blob_c.id, 0o100755),
  156. (b"ad/c", blob_c.id, 0o100644),
  157. (b"c", blob_c.id, 0o100644),
  158. ]
  159. tree_id = commit_tree(self.store, blobs)
  160. self.assertEqual(
  161. [TreeEntry(p, m, h) for (p, h, m) in blobs],
  162. list(iter_tree_contents(self.store, tree_id)),
  163. )
  164. self.assertEqual([], list(iter_tree_contents(self.store, None)))
  165. def test_iter_tree_contents_include_trees(self) -> None:
  166. blob_a = make_object(Blob, data=b"a")
  167. blob_b = make_object(Blob, data=b"b")
  168. blob_c = make_object(Blob, data=b"c")
  169. for blob in [blob_a, blob_b, blob_c]:
  170. self.store.add_object(blob)
  171. blobs = [
  172. (b"a", blob_a.id, 0o100644),
  173. (b"ad/b", blob_b.id, 0o100644),
  174. (b"ad/bd/c", blob_c.id, 0o100755),
  175. ]
  176. tree_id = commit_tree(self.store, blobs)
  177. tree = self.store[tree_id]
  178. assert isinstance(tree, Tree)
  179. tree_ad = self.store[tree[b"ad"][1]]
  180. assert isinstance(tree_ad, Tree)
  181. tree_bd = self.store[tree_ad[b"bd"][1]]
  182. expected = [
  183. TreeEntry(b"", 0o040000, tree_id),
  184. TreeEntry(b"a", 0o100644, blob_a.id),
  185. TreeEntry(b"ad", 0o040000, tree_ad.id),
  186. TreeEntry(b"ad/b", 0o100644, blob_b.id),
  187. TreeEntry(b"ad/bd", 0o040000, tree_bd.id),
  188. TreeEntry(b"ad/bd/c", 0o100755, blob_c.id),
  189. ]
  190. actual = iter_tree_contents(self.store, tree_id, include_trees=True)
  191. self.assertEqual(expected, list(actual))
  192. def make_tag(self, name, obj):
  193. tag = make_tag(obj, name=name)
  194. self.store.add_object(tag)
  195. return tag
  196. def test_peel_sha(self) -> None:
  197. self.store.add_object(testobject)
  198. tag1 = self.make_tag(b"1", testobject)
  199. tag2 = self.make_tag(b"2", testobject)
  200. tag3 = self.make_tag(b"3", testobject)
  201. for obj in [testobject, tag1, tag2, tag3]:
  202. self.assertEqual((obj, testobject), peel_sha(self.store, obj.id))
  203. def test_get_raw(self) -> None:
  204. self.store.add_object(testobject)
  205. self.assertEqual(
  206. (Blob.type_num, b"yummy data"), self.store.get_raw(testobject.id)
  207. )
  208. def test_close(self) -> None:
  209. # For now, just check that close doesn't barf.
  210. self.store.add_object(testobject)
  211. self.store.close()
  212. def test_iter_prefix(self) -> None:
  213. self.store.add_object(testobject)
  214. self.assertEqual([testobject.id], list(self.store.iter_prefix(testobject.id)))
  215. self.assertEqual(
  216. [testobject.id], list(self.store.iter_prefix(testobject.id[:10]))
  217. )
  218. def test_iterobjects_subset_all_present(self) -> None:
  219. """Test iterating over a subset of objects that all exist."""
  220. blob1 = make_object(Blob, data=b"blob 1 data")
  221. blob2 = make_object(Blob, data=b"blob 2 data")
  222. self.store.add_object(blob1)
  223. self.store.add_object(blob2)
  224. objects = list(self.store.iterobjects_subset([blob1.id, blob2.id]))
  225. self.assertEqual(2, len(objects))
  226. object_ids = set(o.id for o in objects)
  227. self.assertEqual(set([blob1.id, blob2.id]), object_ids)
  228. def test_iterobjects_subset_missing_not_allowed(self) -> None:
  229. """Test iterating with missing objects when not allowed."""
  230. blob1 = make_object(Blob, data=b"blob 1 data")
  231. self.store.add_object(blob1)
  232. missing_sha = b"1" * 40
  233. with self.assertRaises(KeyError):
  234. list(self.store.iterobjects_subset([blob1.id, missing_sha]))
  235. def test_iterobjects_subset_missing_allowed(self) -> None:
  236. """Test iterating with missing objects when allowed."""
  237. blob1 = make_object(Blob, data=b"blob 1 data")
  238. self.store.add_object(blob1)
  239. missing_sha = b"1" * 40
  240. objects = list(
  241. self.store.iterobjects_subset([blob1.id, missing_sha], allow_missing=True)
  242. )
  243. self.assertEqual(1, len(objects))
  244. self.assertEqual(blob1.id, objects[0].id)
  245. def test_iter_prefix_not_found(self) -> None:
  246. self.assertEqual([], list(self.store.iter_prefix(b"1" * 40)))
  247. class PackBasedObjectStoreTests(ObjectStoreTests):
  248. store: PackBasedObjectStore
  249. def tearDown(self) -> None:
  250. for pack in self.store.packs:
  251. pack.close()
  252. def test_empty_packs(self) -> None:
  253. self.assertEqual([], list(self.store.packs))
  254. def test_pack_loose_objects(self) -> None:
  255. b1 = make_object(Blob, data=b"yummy data")
  256. self.store.add_object(b1)
  257. b2 = make_object(Blob, data=b"more yummy data")
  258. self.store.add_object(b2)
  259. b3 = make_object(Blob, data=b"even more yummy data")
  260. b4 = make_object(Blob, data=b"and more yummy data")
  261. self.store.add_objects([(b3, None), (b4, None)])
  262. self.assertEqual({b1.id, b2.id, b3.id, b4.id}, set(self.store))
  263. self.assertEqual(1, len(self.store.packs))
  264. self.assertEqual(2, self.store.pack_loose_objects())
  265. self.assertNotEqual([], list(self.store.packs))
  266. self.assertEqual(0, self.store.pack_loose_objects())
  267. def test_repack(self) -> None:
  268. b1 = make_object(Blob, data=b"yummy data")
  269. self.store.add_object(b1)
  270. b2 = make_object(Blob, data=b"more yummy data")
  271. self.store.add_object(b2)
  272. b3 = make_object(Blob, data=b"even more yummy data")
  273. b4 = make_object(Blob, data=b"and more yummy data")
  274. self.store.add_objects([(b3, None), (b4, None)])
  275. b5 = make_object(Blob, data=b"and more data")
  276. b6 = make_object(Blob, data=b"and some more data")
  277. self.store.add_objects([(b5, None), (b6, None)])
  278. self.assertEqual({b1.id, b2.id, b3.id, b4.id, b5.id, b6.id}, set(self.store))
  279. self.assertEqual(2, len(self.store.packs))
  280. self.assertEqual(6, self.store.repack())
  281. self.assertEqual(1, len(self.store.packs))
  282. self.assertEqual(0, self.store.pack_loose_objects())
  283. def test_repack_existing(self) -> None:
  284. b1 = make_object(Blob, data=b"yummy data")
  285. self.store.add_object(b1)
  286. b2 = make_object(Blob, data=b"more yummy data")
  287. self.store.add_object(b2)
  288. self.store.add_objects([(b1, None), (b2, None)])
  289. self.store.add_objects([(b2, None)])
  290. self.assertEqual({b1.id, b2.id}, set(self.store))
  291. self.assertEqual(2, len(self.store.packs))
  292. self.assertEqual(2, self.store.repack())
  293. self.assertEqual(1, len(self.store.packs))
  294. self.assertEqual(0, self.store.pack_loose_objects())
  295. self.assertEqual({b1.id, b2.id}, set(self.store))
  296. self.assertEqual(1, len(self.store.packs))
  297. self.assertEqual(2, self.store.repack())
  298. self.assertEqual(1, len(self.store.packs))
  299. self.assertEqual(0, self.store.pack_loose_objects())