test_object_store.py 16 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470
  1. # test_object_store.py -- tests for object_store.py
  2. # Copyright (C) 2008 Jelmer Vernooij <jelmer@samba.org>
  3. #
  4. # This program is free software; you can redistribute it and/or
  5. # modify it under the terms of the GNU General Public License
  6. # as published by the Free Software Foundation; version 2
  7. # or (at your option) any later version of the License.
  8. #
  9. # This program is distributed in the hope that it will be useful,
  10. # but WITHOUT ANY WARRANTY; without even the implied warranty of
  11. # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  12. # GNU General Public License for more details.
  13. #
  14. # You should have received a copy of the GNU General Public License
  15. # along with this program; if not, write to the Free Software
  16. # Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston,
  17. # MA 02110-1301, USA.
  18. """Tests for the object store interface."""
  19. from io import BytesIO
  20. import os
  21. import shutil
  22. import tempfile
  23. from dulwich.index import (
  24. commit_tree,
  25. )
  26. from dulwich.errors import (
  27. NotTreeError,
  28. )
  29. from dulwich.objects import (
  30. sha_to_hex,
  31. object_class,
  32. Blob,
  33. Tag,
  34. Tree,
  35. TreeEntry,
  36. )
  37. from dulwich.object_store import (
  38. DiskObjectStore,
  39. MemoryObjectStore,
  40. ObjectStoreGraphWalker,
  41. tree_lookup_path,
  42. )
  43. from dulwich.pack import (
  44. REF_DELTA,
  45. write_pack_objects,
  46. )
  47. from dulwich.tests import (
  48. TestCase,
  49. )
  50. from dulwich.tests.utils import (
  51. make_object,
  52. build_pack,
  53. )
# Module-level blob shared as a fixture by the object store tests below
# (added to stores, looked up by id, and used as the target of tags).
testobject = make_object(Blob, data="yummy data")
  55. class ObjectStoreTests(object):
  56. def test_determine_wants_all(self):
  57. self.assertEqual(["1" * 40],
  58. self.store.determine_wants_all({"refs/heads/foo": "1" * 40}))
  59. def test_determine_wants_all_zero(self):
  60. self.assertEqual([],
  61. self.store.determine_wants_all({"refs/heads/foo": "0" * 40}))
  62. def test_iter(self):
  63. self.assertEqual([], list(self.store))
  64. def test_get_nonexistant(self):
  65. self.assertRaises(KeyError, lambda: self.store["a" * 40])
  66. def test_contains_nonexistant(self):
  67. self.assertFalse(("a" * 40) in self.store)
  68. def test_add_objects_empty(self):
  69. self.store.add_objects([])
  70. def test_add_commit(self):
  71. # TODO: Argh, no way to construct Git commit objects without
  72. # access to a serialized form.
  73. self.store.add_objects([])
  74. def test_add_object(self):
  75. self.store.add_object(testobject)
  76. self.assertEqual(set([testobject.id]), set(self.store))
  77. self.assertTrue(testobject.id in self.store)
  78. r = self.store[testobject.id]
  79. self.assertEqual(r, testobject)
  80. def test_add_objects(self):
  81. data = [(testobject, "mypath")]
  82. self.store.add_objects(data)
  83. self.assertEqual(set([testobject.id]), set(self.store))
  84. self.assertTrue(testobject.id in self.store)
  85. r = self.store[testobject.id]
  86. self.assertEqual(r, testobject)
  87. def test_tree_changes(self):
  88. blob_a1 = make_object(Blob, data='a1')
  89. blob_a2 = make_object(Blob, data='a2')
  90. blob_b = make_object(Blob, data='b')
  91. for blob in [blob_a1, blob_a2, blob_b]:
  92. self.store.add_object(blob)
  93. blobs_1 = [('a', blob_a1.id, 0o100644), ('b', blob_b.id, 0o100644)]
  94. tree1_id = commit_tree(self.store, blobs_1)
  95. blobs_2 = [('a', blob_a2.id, 0o100644), ('b', blob_b.id, 0o100644)]
  96. tree2_id = commit_tree(self.store, blobs_2)
  97. change_a = (('a', 'a'), (0o100644, 0o100644), (blob_a1.id, blob_a2.id))
  98. self.assertEqual([change_a],
  99. list(self.store.tree_changes(tree1_id, tree2_id)))
  100. self.assertEqual(
  101. [change_a, (('b', 'b'), (0o100644, 0o100644), (blob_b.id, blob_b.id))],
  102. list(self.store.tree_changes(tree1_id, tree2_id,
  103. want_unchanged=True)))
  104. def test_iter_tree_contents(self):
  105. blob_a = make_object(Blob, data='a')
  106. blob_b = make_object(Blob, data='b')
  107. blob_c = make_object(Blob, data='c')
  108. for blob in [blob_a, blob_b, blob_c]:
  109. self.store.add_object(blob)
  110. blobs = [
  111. ('a', blob_a.id, 0o100644),
  112. ('ad/b', blob_b.id, 0o100644),
  113. ('ad/bd/c', blob_c.id, 0o100755),
  114. ('ad/c', blob_c.id, 0o100644),
  115. ('c', blob_c.id, 0o100644),
  116. ]
  117. tree_id = commit_tree(self.store, blobs)
  118. self.assertEqual([TreeEntry(p, m, h) for (p, h, m) in blobs],
  119. list(self.store.iter_tree_contents(tree_id)))
  120. def test_iter_tree_contents_include_trees(self):
  121. blob_a = make_object(Blob, data='a')
  122. blob_b = make_object(Blob, data='b')
  123. blob_c = make_object(Blob, data='c')
  124. for blob in [blob_a, blob_b, blob_c]:
  125. self.store.add_object(blob)
  126. blobs = [
  127. ('a', blob_a.id, 0o100644),
  128. ('ad/b', blob_b.id, 0o100644),
  129. ('ad/bd/c', blob_c.id, 0o100755),
  130. ]
  131. tree_id = commit_tree(self.store, blobs)
  132. tree = self.store[tree_id]
  133. tree_ad = self.store[tree['ad'][1]]
  134. tree_bd = self.store[tree_ad['bd'][1]]
  135. expected = [
  136. TreeEntry('', 0o040000, tree_id),
  137. TreeEntry('a', 0o100644, blob_a.id),
  138. TreeEntry('ad', 0o040000, tree_ad.id),
  139. TreeEntry('ad/b', 0o100644, blob_b.id),
  140. TreeEntry('ad/bd', 0o040000, tree_bd.id),
  141. TreeEntry('ad/bd/c', 0o100755, blob_c.id),
  142. ]
  143. actual = self.store.iter_tree_contents(tree_id, include_trees=True)
  144. self.assertEqual(expected, list(actual))
  145. def make_tag(self, name, obj):
  146. tag = make_object(Tag, name=name, message='',
  147. tag_time=12345, tag_timezone=0,
  148. tagger='Test Tagger <test@example.com>',
  149. object=(object_class(obj.type_name), obj.id))
  150. self.store.add_object(tag)
  151. return tag
  152. def test_peel_sha(self):
  153. self.store.add_object(testobject)
  154. tag1 = self.make_tag('1', testobject)
  155. tag2 = self.make_tag('2', testobject)
  156. tag3 = self.make_tag('3', testobject)
  157. for obj in [testobject, tag1, tag2, tag3]:
  158. self.assertEqual(testobject, self.store.peel_sha(obj.id))
  159. def test_get_raw(self):
  160. self.store.add_object(testobject)
  161. self.assertEqual((Blob.type_num, 'yummy data'),
  162. self.store.get_raw(testobject.id))
  163. def test_close(self):
  164. # For now, just check that close doesn't barf.
  165. self.store.add_object(testobject)
  166. self.store.close()
  167. class MemoryObjectStoreTests(ObjectStoreTests, TestCase):
  168. def setUp(self):
  169. TestCase.setUp(self)
  170. self.store = MemoryObjectStore()
  171. def test_add_pack(self):
  172. o = MemoryObjectStore()
  173. f, commit, abort = o.add_pack()
  174. try:
  175. b = make_object(Blob, data="more yummy data")
  176. write_pack_objects(f, [(b, None)])
  177. except:
  178. abort()
  179. raise
  180. else:
  181. commit()
  182. def test_add_thin_pack(self):
  183. o = MemoryObjectStore()
  184. blob = make_object(Blob, data='yummy data')
  185. o.add_object(blob)
  186. f = BytesIO()
  187. entries = build_pack(f, [
  188. (REF_DELTA, (blob.id, 'more yummy data')),
  189. ], store=o)
  190. o.add_thin_pack(f.read, None)
  191. packed_blob_sha = sha_to_hex(entries[0][3])
  192. self.assertEqual((Blob.type_num, 'more yummy data'),
  193. o.get_raw(packed_blob_sha))
  194. def test_add_thin_pack_empty(self):
  195. o = MemoryObjectStore()
  196. f = BytesIO()
  197. entries = build_pack(f, [], store=o)
  198. self.assertEquals([], entries)
  199. o.add_thin_pack(f.read, None)
  200. class PackBasedObjectStoreTests(ObjectStoreTests):
  201. def tearDown(self):
  202. for pack in self.store.packs:
  203. pack.close()
  204. def test_empty_packs(self):
  205. self.assertEqual([], self.store.packs)
  206. def test_pack_loose_objects(self):
  207. b1 = make_object(Blob, data="yummy data")
  208. self.store.add_object(b1)
  209. b2 = make_object(Blob, data="more yummy data")
  210. self.store.add_object(b2)
  211. self.assertEqual([], self.store.packs)
  212. self.assertEqual(2, self.store.pack_loose_objects())
  213. self.assertNotEqual([], self.store.packs)
  214. self.assertEqual(0, self.store.pack_loose_objects())
  215. class DiskObjectStoreTests(PackBasedObjectStoreTests, TestCase):
  216. def setUp(self):
  217. TestCase.setUp(self)
  218. self.store_dir = tempfile.mkdtemp()
  219. self.addCleanup(shutil.rmtree, self.store_dir)
  220. self.store = DiskObjectStore.init(self.store_dir)
  221. def tearDown(self):
  222. TestCase.tearDown(self)
  223. PackBasedObjectStoreTests.tearDown(self)
  224. def test_alternates(self):
  225. alternate_dir = tempfile.mkdtemp()
  226. self.addCleanup(shutil.rmtree, alternate_dir)
  227. alternate_store = DiskObjectStore(alternate_dir)
  228. b2 = make_object(Blob, data="yummy data")
  229. alternate_store.add_object(b2)
  230. store = DiskObjectStore(self.store_dir)
  231. self.assertRaises(KeyError, store.__getitem__, b2.id)
  232. store.add_alternate_path(alternate_dir)
  233. self.assertIn(b2.id, store)
  234. self.assertEqual(b2, store[b2.id])
  235. def test_add_alternate_path(self):
  236. store = DiskObjectStore(self.store_dir)
  237. self.assertEqual([], store._read_alternate_paths())
  238. store.add_alternate_path("/foo/path")
  239. self.assertEqual(["/foo/path"], store._read_alternate_paths())
  240. store.add_alternate_path("/bar/path")
  241. self.assertEqual(
  242. ["/foo/path", "/bar/path"],
  243. store._read_alternate_paths())
  244. def test_rel_alternative_path(self):
  245. alternate_dir = tempfile.mkdtemp()
  246. self.addCleanup(shutil.rmtree, alternate_dir)
  247. alternate_store = DiskObjectStore(alternate_dir)
  248. b2 = make_object(Blob, data="yummy data")
  249. alternate_store.add_object(b2)
  250. store = DiskObjectStore(self.store_dir)
  251. self.assertRaises(KeyError, store.__getitem__, b2.id)
  252. store.add_alternate_path(os.path.relpath(alternate_dir, self.store_dir))
  253. self.assertEqual(list(alternate_store), list(store.alternates[0]))
  254. self.assertIn(b2.id, store)
  255. self.assertEqual(b2, store[b2.id])
  256. def test_pack_dir(self):
  257. o = DiskObjectStore(self.store_dir)
  258. self.assertEqual(os.path.join(self.store_dir, "pack"), o.pack_dir)
  259. def test_add_pack(self):
  260. o = DiskObjectStore(self.store_dir)
  261. f, commit, abort = o.add_pack()
  262. try:
  263. b = make_object(Blob, data="more yummy data")
  264. write_pack_objects(f, [(b, None)])
  265. except:
  266. abort()
  267. raise
  268. else:
  269. commit()
  270. def test_add_thin_pack(self):
  271. o = DiskObjectStore(self.store_dir)
  272. try:
  273. blob = make_object(Blob, data='yummy data')
  274. o.add_object(blob)
  275. f = BytesIO()
  276. entries = build_pack(f, [
  277. (REF_DELTA, (blob.id, 'more yummy data')),
  278. ], store=o)
  279. with o.add_thin_pack(f.read, None) as pack:
  280. packed_blob_sha = sha_to_hex(entries[0][3])
  281. pack.check_length_and_checksum()
  282. self.assertEqual(sorted([blob.id, packed_blob_sha]), list(pack))
  283. self.assertTrue(o.contains_packed(packed_blob_sha))
  284. self.assertTrue(o.contains_packed(blob.id))
  285. self.assertEqual((Blob.type_num, 'more yummy data'),
  286. o.get_raw(packed_blob_sha))
  287. finally:
  288. o.close()
  289. def test_add_thin_pack_empty(self):
  290. o = DiskObjectStore(self.store_dir)
  291. f = BytesIO()
  292. entries = build_pack(f, [], store=o)
  293. self.assertEquals([], entries)
  294. o.add_thin_pack(f.read, None)
  295. class TreeLookupPathTests(TestCase):
  296. def setUp(self):
  297. TestCase.setUp(self)
  298. self.store = MemoryObjectStore()
  299. blob_a = make_object(Blob, data='a')
  300. blob_b = make_object(Blob, data='b')
  301. blob_c = make_object(Blob, data='c')
  302. for blob in [blob_a, blob_b, blob_c]:
  303. self.store.add_object(blob)
  304. blobs = [
  305. ('a', blob_a.id, 0o100644),
  306. ('ad/b', blob_b.id, 0o100644),
  307. ('ad/bd/c', blob_c.id, 0o100755),
  308. ('ad/c', blob_c.id, 0o100644),
  309. ('c', blob_c.id, 0o100644),
  310. ]
  311. self.tree_id = commit_tree(self.store, blobs)
  312. def get_object(self, sha):
  313. return self.store[sha]
  314. def test_lookup_blob(self):
  315. o_id = tree_lookup_path(self.get_object, self.tree_id, 'a')[1]
  316. self.assertTrue(isinstance(self.store[o_id], Blob))
  317. def test_lookup_tree(self):
  318. o_id = tree_lookup_path(self.get_object, self.tree_id, 'ad')[1]
  319. self.assertTrue(isinstance(self.store[o_id], Tree))
  320. o_id = tree_lookup_path(self.get_object, self.tree_id, 'ad/bd')[1]
  321. self.assertTrue(isinstance(self.store[o_id], Tree))
  322. o_id = tree_lookup_path(self.get_object, self.tree_id, 'ad/bd/')[1]
  323. self.assertTrue(isinstance(self.store[o_id], Tree))
  324. def test_lookup_nonexistent(self):
  325. self.assertRaises(KeyError, tree_lookup_path, self.get_object, self.tree_id, 'j')
  326. def test_lookup_not_tree(self):
  327. self.assertRaises(NotTreeError, tree_lookup_path, self.get_object, self.tree_id, 'ad/b/j')
  328. # TODO: MissingObjectFinderTests
  329. class ObjectStoreGraphWalkerTests(TestCase):
  330. def get_walker(self, heads, parent_map):
  331. new_parent_map = dict([
  332. (k * 40, [(p * 40) for p in ps]) for (k, ps) in parent_map.items()])
  333. return ObjectStoreGraphWalker([x * 40 for x in heads],
  334. new_parent_map.__getitem__)
  335. def test_ack_invalid_value(self):
  336. gw = self.get_walker([], {})
  337. self.assertRaises(ValueError, gw.ack, "tooshort")
  338. def test_empty(self):
  339. gw = self.get_walker([], {})
  340. self.assertIs(None, next(gw))
  341. gw.ack("a" * 40)
  342. self.assertIs(None, next(gw))
  343. def test_descends(self):
  344. gw = self.get_walker(["a"], {"a": ["b"], "b": []})
  345. self.assertEqual("a" * 40, next(gw))
  346. self.assertEqual("b" * 40, next(gw))
  347. def test_present(self):
  348. gw = self.get_walker(["a"], {"a": ["b"], "b": []})
  349. gw.ack("a" * 40)
  350. self.assertIs(None, next(gw))
  351. def test_parent_present(self):
  352. gw = self.get_walker(["a"], {"a": ["b"], "b": []})
  353. self.assertEqual("a" * 40, next(gw))
  354. gw.ack("a" * 40)
  355. self.assertIs(None, next(gw))
  356. def test_child_ack_later(self):
  357. gw = self.get_walker(["a"], {"a": ["b"], "b": ["c"], "c": []})
  358. self.assertEqual("a" * 40, next(gw))
  359. self.assertEqual("b" * 40, next(gw))
  360. gw.ack("a" * 40)
  361. self.assertIs(None, next(gw))
  362. def test_only_once(self):
  363. # a b
  364. # | |
  365. # c d
  366. # \ /
  367. # e
  368. gw = self.get_walker(["a", "b"], {
  369. "a": ["c"],
  370. "b": ["d"],
  371. "c": ["e"],
  372. "d": ["e"],
  373. "e": [],
  374. })
  375. walk = []
  376. acked = False
  377. walk.append(next(gw))
  378. walk.append(next(gw))
  379. # A branch (a, c) or (b, d) may be done after 2 steps or 3 depending on
  380. # the order walked: 3-step walks include (a, b, c) and (b, a, d), etc.
  381. if walk == ["a" * 40, "c" * 40] or walk == ["b" * 40, "d" * 40]:
  382. gw.ack(walk[0])
  383. acked = True
  384. walk.append(next(gw))
  385. if not acked and walk[2] == "c" * 40:
  386. gw.ack("a" * 40)
  387. elif not acked and walk[2] == "d" * 40:
  388. gw.ack("b" * 40)
  389. walk.append(next(gw))
  390. self.assertIs(None, next(gw))
  391. self.assertEqual(["a" * 40, "b" * 40, "c" * 40, "d" * 40], sorted(walk))
  392. self.assertLess(walk.index("a" * 40), walk.index("c" * 40))
  393. self.assertLess(walk.index("b" * 40), walk.index("d" * 40))