test_object_store.py 16 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484
  1. # test_object_store.py -- tests for object_store.py
  2. # Copyright (C) 2008 Jelmer Vernooij <jelmer@samba.org>
  3. #
  4. # This program is free software; you can redistribute it and/or
  5. # modify it under the terms of the GNU General Public License
  6. # as published by the Free Software Foundation; version 2
  7. # or (at your option) any later version of the License.
  8. #
  9. # This program is distributed in the hope that it will be useful,
  10. # but WITHOUT ANY WARRANTY; without even the implied warranty of
  11. # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  12. # GNU General Public License for more details.
  13. #
  14. # You should have received a copy of the GNU General Public License
  15. # along with this program; if not, write to the Free Software
  16. # Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston,
  17. # MA 02110-1301, USA.
  18. """Tests for the object store interface."""
  19. from contextlib import closing
  20. from io import BytesIO
  21. import os
  22. import shutil
  23. import tempfile
  24. from dulwich.index import (
  25. commit_tree,
  26. )
  27. from dulwich.errors import (
  28. NotTreeError,
  29. )
  30. from dulwich.objects import (
  31. sha_to_hex,
  32. Blob,
  33. Tree,
  34. TreeEntry,
  35. )
  36. from dulwich.object_store import (
  37. DiskObjectStore,
  38. MemoryObjectStore,
  39. ObjectStoreGraphWalker,
  40. tree_lookup_path,
  41. )
  42. from dulwich.pack import (
  43. REF_DELTA,
  44. write_pack_objects,
  45. )
  46. from dulwich.tests import (
  47. TestCase,
  48. )
  49. from dulwich.tests.utils import (
  50. make_object,
  51. make_tag,
  52. build_pack,
  53. )
  54. testobject = make_object(Blob, data=b"yummy data")
  55. class ObjectStoreTests(object):
  56. def test_determine_wants_all(self):
  57. self.assertEqual([b"1" * 40],
  58. self.store.determine_wants_all({b"refs/heads/foo": b"1" * 40}))
  59. def test_determine_wants_all_zero(self):
  60. self.assertEqual([],
  61. self.store.determine_wants_all({b"refs/heads/foo": b"0" * 40}))
  62. def test_iter(self):
  63. self.assertEqual([], list(self.store))
  64. def test_get_nonexistant(self):
  65. self.assertRaises(KeyError, lambda: self.store[b"a" * 40])
  66. def test_contains_nonexistant(self):
  67. self.assertFalse((b"a" * 40) in self.store)
  68. def test_add_objects_empty(self):
  69. self.store.add_objects([])
  70. def test_add_commit(self):
  71. # TODO: Argh, no way to construct Git commit objects without
  72. # access to a serialized form.
  73. self.store.add_objects([])
  74. def test_store_resilience(self):
  75. """Test if updating an existing stored object doesn't erase the
  76. object from the store.
  77. """
  78. test_object = make_object(Blob, data=b'data')
  79. self.store.add_object(test_object)
  80. test_object_id = test_object.id
  81. test_object.data = test_object.data + b'update'
  82. stored_test_object = self.store[test_object_id]
  83. self.assertNotEqual(test_object.id, stored_test_object.id)
  84. self.assertEqual(stored_test_object.id, test_object_id)
  85. def test_add_object(self):
  86. self.store.add_object(testobject)
  87. self.assertEqual(set([testobject.id]), set(self.store))
  88. self.assertTrue(testobject.id in self.store)
  89. r = self.store[testobject.id]
  90. self.assertEqual(r, testobject)
  91. def test_add_objects(self):
  92. data = [(testobject, "mypath")]
  93. self.store.add_objects(data)
  94. self.assertEqual(set([testobject.id]), set(self.store))
  95. self.assertTrue(testobject.id in self.store)
  96. r = self.store[testobject.id]
  97. self.assertEqual(r, testobject)
  98. def test_tree_changes(self):
  99. blob_a1 = make_object(Blob, data=b'a1')
  100. blob_a2 = make_object(Blob, data=b'a2')
  101. blob_b = make_object(Blob, data=b'b')
  102. for blob in [blob_a1, blob_a2, blob_b]:
  103. self.store.add_object(blob)
  104. blobs_1 = [(b'a', blob_a1.id, 0o100644), (b'b', blob_b.id, 0o100644)]
  105. tree1_id = commit_tree(self.store, blobs_1)
  106. blobs_2 = [(b'a', blob_a2.id, 0o100644), (b'b', blob_b.id, 0o100644)]
  107. tree2_id = commit_tree(self.store, blobs_2)
  108. change_a = ((b'a', b'a'), (0o100644, 0o100644), (blob_a1.id, blob_a2.id))
  109. self.assertEqual([change_a],
  110. list(self.store.tree_changes(tree1_id, tree2_id)))
  111. self.assertEqual(
  112. [change_a, ((b'b', b'b'), (0o100644, 0o100644), (blob_b.id, blob_b.id))],
  113. list(self.store.tree_changes(tree1_id, tree2_id,
  114. want_unchanged=True)))
  115. def test_iter_tree_contents(self):
  116. blob_a = make_object(Blob, data=b'a')
  117. blob_b = make_object(Blob, data=b'b')
  118. blob_c = make_object(Blob, data=b'c')
  119. for blob in [blob_a, blob_b, blob_c]:
  120. self.store.add_object(blob)
  121. blobs = [
  122. (b'a', blob_a.id, 0o100644),
  123. (b'ad/b', blob_b.id, 0o100644),
  124. (b'ad/bd/c', blob_c.id, 0o100755),
  125. (b'ad/c', blob_c.id, 0o100644),
  126. (b'c', blob_c.id, 0o100644),
  127. ]
  128. tree_id = commit_tree(self.store, blobs)
  129. self.assertEqual([TreeEntry(p, m, h) for (p, h, m) in blobs],
  130. list(self.store.iter_tree_contents(tree_id)))
  131. def test_iter_tree_contents_include_trees(self):
  132. blob_a = make_object(Blob, data=b'a')
  133. blob_b = make_object(Blob, data=b'b')
  134. blob_c = make_object(Blob, data=b'c')
  135. for blob in [blob_a, blob_b, blob_c]:
  136. self.store.add_object(blob)
  137. blobs = [
  138. (b'a', blob_a.id, 0o100644),
  139. (b'ad/b', blob_b.id, 0o100644),
  140. (b'ad/bd/c', blob_c.id, 0o100755),
  141. ]
  142. tree_id = commit_tree(self.store, blobs)
  143. tree = self.store[tree_id]
  144. tree_ad = self.store[tree[b'ad'][1]]
  145. tree_bd = self.store[tree_ad[b'bd'][1]]
  146. expected = [
  147. TreeEntry(b'', 0o040000, tree_id),
  148. TreeEntry(b'a', 0o100644, blob_a.id),
  149. TreeEntry(b'ad', 0o040000, tree_ad.id),
  150. TreeEntry(b'ad/b', 0o100644, blob_b.id),
  151. TreeEntry(b'ad/bd', 0o040000, tree_bd.id),
  152. TreeEntry(b'ad/bd/c', 0o100755, blob_c.id),
  153. ]
  154. actual = self.store.iter_tree_contents(tree_id, include_trees=True)
  155. self.assertEqual(expected, list(actual))
  156. def make_tag(self, name, obj):
  157. tag = make_tag(obj, name=name)
  158. self.store.add_object(tag)
  159. return tag
  160. def test_peel_sha(self):
  161. self.store.add_object(testobject)
  162. tag1 = self.make_tag(b'1', testobject)
  163. tag2 = self.make_tag(b'2', testobject)
  164. tag3 = self.make_tag(b'3', testobject)
  165. for obj in [testobject, tag1, tag2, tag3]:
  166. self.assertEqual(testobject, self.store.peel_sha(obj.id))
  167. def test_get_raw(self):
  168. self.store.add_object(testobject)
  169. self.assertEqual((Blob.type_num, b'yummy data'),
  170. self.store.get_raw(testobject.id))
  171. def test_close(self):
  172. # For now, just check that close doesn't barf.
  173. self.store.add_object(testobject)
  174. self.store.close()
  175. class MemoryObjectStoreTests(ObjectStoreTests, TestCase):
  176. def setUp(self):
  177. TestCase.setUp(self)
  178. self.store = MemoryObjectStore()
  179. def test_add_pack(self):
  180. o = MemoryObjectStore()
  181. f, commit, abort = o.add_pack()
  182. try:
  183. b = make_object(Blob, data=b"more yummy data")
  184. write_pack_objects(f, [(b, None)])
  185. except:
  186. abort()
  187. raise
  188. else:
  189. commit()
  190. def test_add_pack_emtpy(self):
  191. o = MemoryObjectStore()
  192. f, commit, abort = o.add_pack()
  193. commit()
  194. def test_add_thin_pack(self):
  195. o = MemoryObjectStore()
  196. blob = make_object(Blob, data=b'yummy data')
  197. o.add_object(blob)
  198. f = BytesIO()
  199. entries = build_pack(f, [
  200. (REF_DELTA, (blob.id, b'more yummy data')),
  201. ], store=o)
  202. o.add_thin_pack(f.read, None)
  203. packed_blob_sha = sha_to_hex(entries[0][3])
  204. self.assertEqual((Blob.type_num, b'more yummy data'),
  205. o.get_raw(packed_blob_sha))
  206. def test_add_thin_pack_empty(self):
  207. o = MemoryObjectStore()
  208. f = BytesIO()
  209. entries = build_pack(f, [], store=o)
  210. self.assertEqual([], entries)
  211. o.add_thin_pack(f.read, None)
  212. class PackBasedObjectStoreTests(ObjectStoreTests):
  213. def tearDown(self):
  214. for pack in self.store.packs:
  215. pack.close()
  216. def test_empty_packs(self):
  217. self.assertEqual([], list(self.store.packs))
  218. def test_pack_loose_objects(self):
  219. b1 = make_object(Blob, data=b"yummy data")
  220. self.store.add_object(b1)
  221. b2 = make_object(Blob, data=b"more yummy data")
  222. self.store.add_object(b2)
  223. self.assertEqual([], list(self.store.packs))
  224. self.assertEqual(2, self.store.pack_loose_objects())
  225. self.assertNotEqual([], list(self.store.packs))
  226. self.assertEqual(0, self.store.pack_loose_objects())
  227. class DiskObjectStoreTests(PackBasedObjectStoreTests, TestCase):
  228. def setUp(self):
  229. TestCase.setUp(self)
  230. self.store_dir = tempfile.mkdtemp()
  231. self.addCleanup(shutil.rmtree, self.store_dir)
  232. self.store = DiskObjectStore.init(self.store_dir)
  233. def tearDown(self):
  234. TestCase.tearDown(self)
  235. PackBasedObjectStoreTests.tearDown(self)
  236. def test_alternates(self):
  237. alternate_dir = tempfile.mkdtemp()
  238. self.addCleanup(shutil.rmtree, alternate_dir)
  239. alternate_store = DiskObjectStore(alternate_dir)
  240. b2 = make_object(Blob, data=b"yummy data")
  241. alternate_store.add_object(b2)
  242. store = DiskObjectStore(self.store_dir)
  243. self.assertRaises(KeyError, store.__getitem__, b2.id)
  244. store.add_alternate_path(alternate_dir)
  245. self.assertIn(b2.id, store)
  246. self.assertEqual(b2, store[b2.id])
  247. def test_add_alternate_path(self):
  248. store = DiskObjectStore(self.store_dir)
  249. self.assertEqual([], list(store._read_alternate_paths()))
  250. store.add_alternate_path("/foo/path")
  251. self.assertEqual(["/foo/path"], list(store._read_alternate_paths()))
  252. store.add_alternate_path("/bar/path")
  253. self.assertEqual(
  254. ["/foo/path", "/bar/path"],
  255. list(store._read_alternate_paths()))
  256. def test_rel_alternative_path(self):
  257. alternate_dir = tempfile.mkdtemp()
  258. self.addCleanup(shutil.rmtree, alternate_dir)
  259. alternate_store = DiskObjectStore(alternate_dir)
  260. b2 = make_object(Blob, data=b"yummy data")
  261. alternate_store.add_object(b2)
  262. store = DiskObjectStore(self.store_dir)
  263. self.assertRaises(KeyError, store.__getitem__, b2.id)
  264. store.add_alternate_path(os.path.relpath(alternate_dir, self.store_dir))
  265. self.assertEqual(list(alternate_store), list(store.alternates[0]))
  266. self.assertIn(b2.id, store)
  267. self.assertEqual(b2, store[b2.id])
  268. def test_pack_dir(self):
  269. o = DiskObjectStore(self.store_dir)
  270. self.assertEqual(os.path.join(self.store_dir, "pack"), o.pack_dir)
  271. def test_add_pack(self):
  272. o = DiskObjectStore(self.store_dir)
  273. f, commit, abort = o.add_pack()
  274. try:
  275. b = make_object(Blob, data=b"more yummy data")
  276. write_pack_objects(f, [(b, None)])
  277. except:
  278. abort()
  279. raise
  280. else:
  281. commit()
  282. def test_add_thin_pack(self):
  283. o = DiskObjectStore(self.store_dir)
  284. try:
  285. blob = make_object(Blob, data=b'yummy data')
  286. o.add_object(blob)
  287. f = BytesIO()
  288. entries = build_pack(f, [
  289. (REF_DELTA, (blob.id, b'more yummy data')),
  290. ], store=o)
  291. with o.add_thin_pack(f.read, None) as pack:
  292. packed_blob_sha = sha_to_hex(entries[0][3])
  293. pack.check_length_and_checksum()
  294. self.assertEqual(sorted([blob.id, packed_blob_sha]), list(pack))
  295. self.assertTrue(o.contains_packed(packed_blob_sha))
  296. self.assertTrue(o.contains_packed(blob.id))
  297. self.assertEqual((Blob.type_num, b'more yummy data'),
  298. o.get_raw(packed_blob_sha))
  299. finally:
  300. o.close()
  301. def test_add_thin_pack_empty(self):
  302. with closing(DiskObjectStore(self.store_dir)) as o:
  303. f = BytesIO()
  304. entries = build_pack(f, [], store=o)
  305. self.assertEqual([], entries)
  306. o.add_thin_pack(f.read, None)
  307. class TreeLookupPathTests(TestCase):
  308. def setUp(self):
  309. TestCase.setUp(self)
  310. self.store = MemoryObjectStore()
  311. blob_a = make_object(Blob, data=b'a')
  312. blob_b = make_object(Blob, data=b'b')
  313. blob_c = make_object(Blob, data=b'c')
  314. for blob in [blob_a, blob_b, blob_c]:
  315. self.store.add_object(blob)
  316. blobs = [
  317. (b'a', blob_a.id, 0o100644),
  318. (b'ad/b', blob_b.id, 0o100644),
  319. (b'ad/bd/c', blob_c.id, 0o100755),
  320. (b'ad/c', blob_c.id, 0o100644),
  321. (b'c', blob_c.id, 0o100644),
  322. ]
  323. self.tree_id = commit_tree(self.store, blobs)
  324. def get_object(self, sha):
  325. return self.store[sha]
  326. def test_lookup_blob(self):
  327. o_id = tree_lookup_path(self.get_object, self.tree_id, b'a')[1]
  328. self.assertTrue(isinstance(self.store[o_id], Blob))
  329. def test_lookup_tree(self):
  330. o_id = tree_lookup_path(self.get_object, self.tree_id, b'ad')[1]
  331. self.assertTrue(isinstance(self.store[o_id], Tree))
  332. o_id = tree_lookup_path(self.get_object, self.tree_id, b'ad/bd')[1]
  333. self.assertTrue(isinstance(self.store[o_id], Tree))
  334. o_id = tree_lookup_path(self.get_object, self.tree_id, b'ad/bd/')[1]
  335. self.assertTrue(isinstance(self.store[o_id], Tree))
  336. def test_lookup_nonexistent(self):
  337. self.assertRaises(KeyError, tree_lookup_path, self.get_object, self.tree_id, b'j')
  338. def test_lookup_not_tree(self):
  339. self.assertRaises(NotTreeError, tree_lookup_path, self.get_object, self.tree_id, b'ad/b/j')
  340. class ObjectStoreGraphWalkerTests(TestCase):
  341. def get_walker(self, heads, parent_map):
  342. new_parent_map = dict([
  343. (k * 40, [(p * 40) for p in ps]) for (k, ps) in parent_map.items()])
  344. return ObjectStoreGraphWalker([x * 40 for x in heads],
  345. new_parent_map.__getitem__)
  346. def test_ack_invalid_value(self):
  347. gw = self.get_walker([], {})
  348. self.assertRaises(ValueError, gw.ack, "tooshort")
  349. def test_empty(self):
  350. gw = self.get_walker([], {})
  351. self.assertIs(None, next(gw))
  352. gw.ack(b"a" * 40)
  353. self.assertIs(None, next(gw))
  354. def test_descends(self):
  355. gw = self.get_walker([b"a"], {b"a": [b"b"], b"b": []})
  356. self.assertEqual(b"a" * 40, next(gw))
  357. self.assertEqual(b"b" * 40, next(gw))
  358. def test_present(self):
  359. gw = self.get_walker([b"a"], {b"a": [b"b"], b"b": []})
  360. gw.ack(b"a" * 40)
  361. self.assertIs(None, next(gw))
  362. def test_parent_present(self):
  363. gw = self.get_walker([b"a"], {b"a": [b"b"], b"b": []})
  364. self.assertEqual(b"a" * 40, next(gw))
  365. gw.ack(b"a" * 40)
  366. self.assertIs(None, next(gw))
  367. def test_child_ack_later(self):
  368. gw = self.get_walker([b"a"], {b"a": [b"b"], b"b": [b"c"], b"c": []})
  369. self.assertEqual(b"a" * 40, next(gw))
  370. self.assertEqual(b"b" * 40, next(gw))
  371. gw.ack(b"a" * 40)
  372. self.assertIs(None, next(gw))
  373. def test_only_once(self):
  374. # a b
  375. # | |
  376. # c d
  377. # \ /
  378. # e
  379. gw = self.get_walker([b"a", b"b"], {
  380. b"a": [b"c"],
  381. b"b": [b"d"],
  382. b"c": [b"e"],
  383. b"d": [b"e"],
  384. b"e": [],
  385. })
  386. walk = []
  387. acked = False
  388. walk.append(next(gw))
  389. walk.append(next(gw))
  390. # A branch (a, c) or (b, d) may be done after 2 steps or 3 depending on
  391. # the order walked: 3-step walks include (a, b, c) and (b, a, d), etc.
  392. if walk == [b"a" * 40, b"c" * 40] or walk == [b"b" * 40, b"d" * 40]:
  393. gw.ack(walk[0])
  394. acked = True
  395. walk.append(next(gw))
  396. if not acked and walk[2] == b"c" * 40:
  397. gw.ack(b"a" * 40)
  398. elif not acked and walk[2] == b"d" * 40:
  399. gw.ack(b"b" * 40)
  400. walk.append(next(gw))
  401. self.assertIs(None, next(gw))
  402. self.assertEqual([b"a" * 40, b"b" * 40, b"c" * 40, b"d" * 40], sorted(walk))
  403. self.assertLess(walk.index(b"a" * 40), walk.index(b"c" * 40))
  404. self.assertLess(walk.index(b"b" * 40), walk.index(b"d" * 40))