2
0

test_object_store.py 17 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495
  1. # test_object_store.py -- tests for object_store.py
  2. # Copyright (C) 2008 Jelmer Vernooij <jelmer@samba.org>
  3. #
  4. # Dulwich is dual-licensed under the Apache License, Version 2.0 and the GNU
  5. # General Public License as published by the Free Software Foundation; version 2.0
  6. # or (at your option) any later version. You can redistribute it and/or
  7. # modify it under the terms of either of these two licenses.
  8. #
  9. # Unless required by applicable law or agreed to in writing, software
  10. # distributed under the License is distributed on an "AS IS" BASIS,
  11. # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  12. # See the License for the specific language governing permissions and
  13. # limitations under the License.
  14. #
  15. # You should have received a copy of the licenses; if not, see
  16. # <http://www.gnu.org/licenses/> for a copy of the GNU General Public License
  17. # and <http://www.apache.org/licenses/LICENSE-2.0> for a copy of the Apache
  18. # License, Version 2.0.
  19. #
  20. """Tests for the object store interface."""
  21. from contextlib import closing
  22. from io import BytesIO
  23. import os
  24. import shutil
  25. import tempfile
  26. from dulwich.index import (
  27. commit_tree,
  28. )
  29. from dulwich.errors import (
  30. NotTreeError,
  31. )
  32. from dulwich.objects import (
  33. sha_to_hex,
  34. Blob,
  35. Tree,
  36. TreeEntry,
  37. )
  38. from dulwich.object_store import (
  39. DiskObjectStore,
  40. MemoryObjectStore,
  41. ObjectStoreGraphWalker,
  42. tree_lookup_path,
  43. )
  44. from dulwich.pack import (
  45. REF_DELTA,
  46. write_pack_objects,
  47. )
  48. from dulwich.tests import (
  49. TestCase,
  50. )
  51. from dulwich.tests.utils import (
  52. make_object,
  53. make_tag,
  54. build_pack,
  55. )
  56. testobject = make_object(Blob, data=b"yummy data")
  57. class ObjectStoreTests(object):
  58. def test_determine_wants_all(self):
  59. self.assertEqual(
  60. [b"1" * 40],
  61. self.store.determine_wants_all({b"refs/heads/foo": b"1" * 40}))
  62. def test_determine_wants_all_zero(self):
  63. self.assertEqual(
  64. [], self.store.determine_wants_all({b"refs/heads/foo": b"0" * 40}))
  65. def test_iter(self):
  66. self.assertEqual([], list(self.store))
  67. def test_get_nonexistant(self):
  68. self.assertRaises(KeyError, lambda: self.store[b"a" * 40])
  69. def test_contains_nonexistant(self):
  70. self.assertFalse((b"a" * 40) in self.store)
  71. def test_add_objects_empty(self):
  72. self.store.add_objects([])
  73. def test_add_commit(self):
  74. # TODO: Argh, no way to construct Git commit objects without
  75. # access to a serialized form.
  76. self.store.add_objects([])
  77. def test_store_resilience(self):
  78. """Test if updating an existing stored object doesn't erase the
  79. object from the store.
  80. """
  81. test_object = make_object(Blob, data=b'data')
  82. self.store.add_object(test_object)
  83. test_object_id = test_object.id
  84. test_object.data = test_object.data + b'update'
  85. stored_test_object = self.store[test_object_id]
  86. self.assertNotEqual(test_object.id, stored_test_object.id)
  87. self.assertEqual(stored_test_object.id, test_object_id)
  88. def test_add_object(self):
  89. self.store.add_object(testobject)
  90. self.assertEqual(set([testobject.id]), set(self.store))
  91. self.assertTrue(testobject.id in self.store)
  92. r = self.store[testobject.id]
  93. self.assertEqual(r, testobject)
  94. def test_add_objects(self):
  95. data = [(testobject, "mypath")]
  96. self.store.add_objects(data)
  97. self.assertEqual(set([testobject.id]), set(self.store))
  98. self.assertTrue(testobject.id in self.store)
  99. r = self.store[testobject.id]
  100. self.assertEqual(r, testobject)
  101. def test_tree_changes(self):
  102. blob_a1 = make_object(Blob, data=b'a1')
  103. blob_a2 = make_object(Blob, data=b'a2')
  104. blob_b = make_object(Blob, data=b'b')
  105. for blob in [blob_a1, blob_a2, blob_b]:
  106. self.store.add_object(blob)
  107. blobs_1 = [(b'a', blob_a1.id, 0o100644), (b'b', blob_b.id, 0o100644)]
  108. tree1_id = commit_tree(self.store, blobs_1)
  109. blobs_2 = [(b'a', blob_a2.id, 0o100644), (b'b', blob_b.id, 0o100644)]
  110. tree2_id = commit_tree(self.store, blobs_2)
  111. change_a = ((b'a', b'a'), (0o100644, 0o100644),
  112. (blob_a1.id, blob_a2.id))
  113. self.assertEqual([change_a],
  114. list(self.store.tree_changes(tree1_id, tree2_id)))
  115. self.assertEqual(
  116. [change_a, ((b'b', b'b'), (0o100644, 0o100644),
  117. (blob_b.id, blob_b.id))],
  118. list(self.store.tree_changes(tree1_id, tree2_id,
  119. want_unchanged=True)))
  120. def test_iter_tree_contents(self):
  121. blob_a = make_object(Blob, data=b'a')
  122. blob_b = make_object(Blob, data=b'b')
  123. blob_c = make_object(Blob, data=b'c')
  124. for blob in [blob_a, blob_b, blob_c]:
  125. self.store.add_object(blob)
  126. blobs = [
  127. (b'a', blob_a.id, 0o100644),
  128. (b'ad/b', blob_b.id, 0o100644),
  129. (b'ad/bd/c', blob_c.id, 0o100755),
  130. (b'ad/c', blob_c.id, 0o100644),
  131. (b'c', blob_c.id, 0o100644),
  132. ]
  133. tree_id = commit_tree(self.store, blobs)
  134. self.assertEqual([TreeEntry(p, m, h) for (p, h, m) in blobs],
  135. list(self.store.iter_tree_contents(tree_id)))
  136. def test_iter_tree_contents_include_trees(self):
  137. blob_a = make_object(Blob, data=b'a')
  138. blob_b = make_object(Blob, data=b'b')
  139. blob_c = make_object(Blob, data=b'c')
  140. for blob in [blob_a, blob_b, blob_c]:
  141. self.store.add_object(blob)
  142. blobs = [
  143. (b'a', blob_a.id, 0o100644),
  144. (b'ad/b', blob_b.id, 0o100644),
  145. (b'ad/bd/c', blob_c.id, 0o100755),
  146. ]
  147. tree_id = commit_tree(self.store, blobs)
  148. tree = self.store[tree_id]
  149. tree_ad = self.store[tree[b'ad'][1]]
  150. tree_bd = self.store[tree_ad[b'bd'][1]]
  151. expected = [
  152. TreeEntry(b'', 0o040000, tree_id),
  153. TreeEntry(b'a', 0o100644, blob_a.id),
  154. TreeEntry(b'ad', 0o040000, tree_ad.id),
  155. TreeEntry(b'ad/b', 0o100644, blob_b.id),
  156. TreeEntry(b'ad/bd', 0o040000, tree_bd.id),
  157. TreeEntry(b'ad/bd/c', 0o100755, blob_c.id),
  158. ]
  159. actual = self.store.iter_tree_contents(tree_id, include_trees=True)
  160. self.assertEqual(expected, list(actual))
  161. def make_tag(self, name, obj):
  162. tag = make_tag(obj, name=name)
  163. self.store.add_object(tag)
  164. return tag
  165. def test_peel_sha(self):
  166. self.store.add_object(testobject)
  167. tag1 = self.make_tag(b'1', testobject)
  168. tag2 = self.make_tag(b'2', testobject)
  169. tag3 = self.make_tag(b'3', testobject)
  170. for obj in [testobject, tag1, tag2, tag3]:
  171. self.assertEqual(testobject, self.store.peel_sha(obj.id))
  172. def test_get_raw(self):
  173. self.store.add_object(testobject)
  174. self.assertEqual((Blob.type_num, b'yummy data'),
  175. self.store.get_raw(testobject.id))
  176. def test_close(self):
  177. # For now, just check that close doesn't barf.
  178. self.store.add_object(testobject)
  179. self.store.close()
  180. class MemoryObjectStoreTests(ObjectStoreTests, TestCase):
  181. def setUp(self):
  182. TestCase.setUp(self)
  183. self.store = MemoryObjectStore()
  184. def test_add_pack(self):
  185. o = MemoryObjectStore()
  186. f, commit, abort = o.add_pack()
  187. try:
  188. b = make_object(Blob, data=b"more yummy data")
  189. write_pack_objects(f, [(b, None)])
  190. except:
  191. abort()
  192. raise
  193. else:
  194. commit()
  195. def test_add_pack_emtpy(self):
  196. o = MemoryObjectStore()
  197. f, commit, abort = o.add_pack()
  198. commit()
  199. def test_add_thin_pack(self):
  200. o = MemoryObjectStore()
  201. blob = make_object(Blob, data=b'yummy data')
  202. o.add_object(blob)
  203. f = BytesIO()
  204. entries = build_pack(f, [
  205. (REF_DELTA, (blob.id, b'more yummy data')),
  206. ], store=o)
  207. o.add_thin_pack(f.read, None)
  208. packed_blob_sha = sha_to_hex(entries[0][3])
  209. self.assertEqual((Blob.type_num, b'more yummy data'),
  210. o.get_raw(packed_blob_sha))
  211. def test_add_thin_pack_empty(self):
  212. o = MemoryObjectStore()
  213. f = BytesIO()
  214. entries = build_pack(f, [], store=o)
  215. self.assertEqual([], entries)
  216. o.add_thin_pack(f.read, None)
  217. class PackBasedObjectStoreTests(ObjectStoreTests):
  218. def tearDown(self):
  219. for pack in self.store.packs:
  220. pack.close()
  221. def test_empty_packs(self):
  222. self.assertEqual([], list(self.store.packs))
  223. def test_pack_loose_objects(self):
  224. b1 = make_object(Blob, data=b"yummy data")
  225. self.store.add_object(b1)
  226. b2 = make_object(Blob, data=b"more yummy data")
  227. self.store.add_object(b2)
  228. self.assertEqual([], list(self.store.packs))
  229. self.assertEqual(2, self.store.pack_loose_objects())
  230. self.assertNotEqual([], list(self.store.packs))
  231. self.assertEqual(0, self.store.pack_loose_objects())
  232. class DiskObjectStoreTests(PackBasedObjectStoreTests, TestCase):
  233. def setUp(self):
  234. TestCase.setUp(self)
  235. self.store_dir = tempfile.mkdtemp()
  236. self.addCleanup(shutil.rmtree, self.store_dir)
  237. self.store = DiskObjectStore.init(self.store_dir)
  238. def tearDown(self):
  239. TestCase.tearDown(self)
  240. PackBasedObjectStoreTests.tearDown(self)
  241. def test_alternates(self):
  242. alternate_dir = tempfile.mkdtemp()
  243. self.addCleanup(shutil.rmtree, alternate_dir)
  244. alternate_store = DiskObjectStore(alternate_dir)
  245. b2 = make_object(Blob, data=b"yummy data")
  246. alternate_store.add_object(b2)
  247. store = DiskObjectStore(self.store_dir)
  248. self.assertRaises(KeyError, store.__getitem__, b2.id)
  249. store.add_alternate_path(alternate_dir)
  250. self.assertIn(b2.id, store)
  251. self.assertEqual(b2, store[b2.id])
  252. def test_add_alternate_path(self):
  253. store = DiskObjectStore(self.store_dir)
  254. self.assertEqual([], list(store._read_alternate_paths()))
  255. store.add_alternate_path("/foo/path")
  256. self.assertEqual(["/foo/path"], list(store._read_alternate_paths()))
  257. store.add_alternate_path("/bar/path")
  258. self.assertEqual(
  259. ["/foo/path", "/bar/path"],
  260. list(store._read_alternate_paths()))
  261. def test_rel_alternative_path(self):
  262. alternate_dir = tempfile.mkdtemp()
  263. self.addCleanup(shutil.rmtree, alternate_dir)
  264. alternate_store = DiskObjectStore(alternate_dir)
  265. b2 = make_object(Blob, data=b"yummy data")
  266. alternate_store.add_object(b2)
  267. store = DiskObjectStore(self.store_dir)
  268. self.assertRaises(KeyError, store.__getitem__, b2.id)
  269. store.add_alternate_path(
  270. os.path.relpath(alternate_dir, self.store_dir))
  271. self.assertEqual(list(alternate_store), list(store.alternates[0]))
  272. self.assertIn(b2.id, store)
  273. self.assertEqual(b2, store[b2.id])
  274. def test_pack_dir(self):
  275. o = DiskObjectStore(self.store_dir)
  276. self.assertEqual(os.path.join(self.store_dir, "pack"), o.pack_dir)
  277. def test_add_pack(self):
  278. o = DiskObjectStore(self.store_dir)
  279. f, commit, abort = o.add_pack()
  280. try:
  281. b = make_object(Blob, data=b"more yummy data")
  282. write_pack_objects(f, [(b, None)])
  283. except:
  284. abort()
  285. raise
  286. else:
  287. commit()
  288. def test_add_thin_pack(self):
  289. o = DiskObjectStore(self.store_dir)
  290. try:
  291. blob = make_object(Blob, data=b'yummy data')
  292. o.add_object(blob)
  293. f = BytesIO()
  294. entries = build_pack(f, [
  295. (REF_DELTA, (blob.id, b'more yummy data')),
  296. ], store=o)
  297. with o.add_thin_pack(f.read, None) as pack:
  298. packed_blob_sha = sha_to_hex(entries[0][3])
  299. pack.check_length_and_checksum()
  300. self.assertEqual(
  301. sorted([blob.id, packed_blob_sha]), list(pack))
  302. self.assertTrue(o.contains_packed(packed_blob_sha))
  303. self.assertTrue(o.contains_packed(blob.id))
  304. self.assertEqual((Blob.type_num, b'more yummy data'),
  305. o.get_raw(packed_blob_sha))
  306. finally:
  307. o.close()
  308. def test_add_thin_pack_empty(self):
  309. with closing(DiskObjectStore(self.store_dir)) as o:
  310. f = BytesIO()
  311. entries = build_pack(f, [], store=o)
  312. self.assertEqual([], entries)
  313. o.add_thin_pack(f.read, None)
  314. class TreeLookupPathTests(TestCase):
  315. def setUp(self):
  316. TestCase.setUp(self)
  317. self.store = MemoryObjectStore()
  318. blob_a = make_object(Blob, data=b'a')
  319. blob_b = make_object(Blob, data=b'b')
  320. blob_c = make_object(Blob, data=b'c')
  321. for blob in [blob_a, blob_b, blob_c]:
  322. self.store.add_object(blob)
  323. blobs = [
  324. (b'a', blob_a.id, 0o100644),
  325. (b'ad/b', blob_b.id, 0o100644),
  326. (b'ad/bd/c', blob_c.id, 0o100755),
  327. (b'ad/c', blob_c.id, 0o100644),
  328. (b'c', blob_c.id, 0o100644),
  329. ]
  330. self.tree_id = commit_tree(self.store, blobs)
  331. def get_object(self, sha):
  332. return self.store[sha]
  333. def test_lookup_blob(self):
  334. o_id = tree_lookup_path(self.get_object, self.tree_id, b'a')[1]
  335. self.assertTrue(isinstance(self.store[o_id], Blob))
  336. def test_lookup_tree(self):
  337. o_id = tree_lookup_path(self.get_object, self.tree_id, b'ad')[1]
  338. self.assertTrue(isinstance(self.store[o_id], Tree))
  339. o_id = tree_lookup_path(self.get_object, self.tree_id, b'ad/bd')[1]
  340. self.assertTrue(isinstance(self.store[o_id], Tree))
  341. o_id = tree_lookup_path(self.get_object, self.tree_id, b'ad/bd/')[1]
  342. self.assertTrue(isinstance(self.store[o_id], Tree))
  343. def test_lookup_nonexistent(self):
  344. self.assertRaises(
  345. KeyError, tree_lookup_path, self.get_object, self.tree_id, b'j')
  346. def test_lookup_not_tree(self):
  347. self.assertRaises(
  348. NotTreeError, tree_lookup_path, self.get_object, self.tree_id,
  349. b'ad/b/j')
  350. class ObjectStoreGraphWalkerTests(TestCase):
  351. def get_walker(self, heads, parent_map):
  352. new_parent_map = dict(
  353. [(k * 40, [(p * 40) for p in ps])
  354. for (k, ps) in parent_map.items()])
  355. return ObjectStoreGraphWalker([x * 40 for x in heads],
  356. new_parent_map.__getitem__)
  357. def test_ack_invalid_value(self):
  358. gw = self.get_walker([], {})
  359. self.assertRaises(ValueError, gw.ack, "tooshort")
  360. def test_empty(self):
  361. gw = self.get_walker([], {})
  362. self.assertIs(None, next(gw))
  363. gw.ack(b"a" * 40)
  364. self.assertIs(None, next(gw))
  365. def test_descends(self):
  366. gw = self.get_walker([b"a"], {b"a": [b"b"], b"b": []})
  367. self.assertEqual(b"a" * 40, next(gw))
  368. self.assertEqual(b"b" * 40, next(gw))
  369. def test_present(self):
  370. gw = self.get_walker([b"a"], {b"a": [b"b"], b"b": []})
  371. gw.ack(b"a" * 40)
  372. self.assertIs(None, next(gw))
  373. def test_parent_present(self):
  374. gw = self.get_walker([b"a"], {b"a": [b"b"], b"b": []})
  375. self.assertEqual(b"a" * 40, next(gw))
  376. gw.ack(b"a" * 40)
  377. self.assertIs(None, next(gw))
  378. def test_child_ack_later(self):
  379. gw = self.get_walker([b"a"], {b"a": [b"b"], b"b": [b"c"], b"c": []})
  380. self.assertEqual(b"a" * 40, next(gw))
  381. self.assertEqual(b"b" * 40, next(gw))
  382. gw.ack(b"a" * 40)
  383. self.assertIs(None, next(gw))
  384. def test_only_once(self):
  385. # a b
  386. # | |
  387. # c d
  388. # \ /
  389. # e
  390. gw = self.get_walker([b"a", b"b"], {
  391. b"a": [b"c"],
  392. b"b": [b"d"],
  393. b"c": [b"e"],
  394. b"d": [b"e"],
  395. b"e": [],
  396. })
  397. walk = []
  398. acked = False
  399. walk.append(next(gw))
  400. walk.append(next(gw))
  401. # A branch (a, c) or (b, d) may be done after 2 steps or 3 depending on
  402. # the order walked: 3-step walks include (a, b, c) and (b, a, d), etc.
  403. if walk == [b"a" * 40, b"c" * 40] or walk == [b"b" * 40, b"d" * 40]:
  404. gw.ack(walk[0])
  405. acked = True
  406. walk.append(next(gw))
  407. if not acked and walk[2] == b"c" * 40:
  408. gw.ack(b"a" * 40)
  409. elif not acked and walk[2] == b"d" * 40:
  410. gw.ack(b"b" * 40)
  411. walk.append(next(gw))
  412. self.assertIs(None, next(gw))
  413. self.assertEqual([b"a" * 40, b"b" * 40, b"c" * 40, b"d" * 40],
  414. sorted(walk))
  415. self.assertLess(walk.index(b"a" * 40), walk.index(b"c" * 40))
  416. self.assertLess(walk.index(b"b" * 40), walk.index(b"d" * 40))