123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591 |
- # test_object_store.py -- tests for object_store.py
- # Copyright (C) 2008 Jelmer Vernooij <jelmer@samba.org>
- #
- # Dulwich is dual-licensed under the Apache License, Version 2.0 and the GNU
- # General Public License as published by the Free Software Foundation; version 2.0
- # or (at your option) any later version. You can redistribute it and/or
- # modify it under the terms of either of these two licenses.
- #
- # Unless required by applicable law or agreed to in writing, software
- # distributed under the License is distributed on an "AS IS" BASIS,
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- # See the License for the specific language governing permissions and
- # limitations under the License.
- #
- # You should have received a copy of the licenses; if not, see
- # <http://www.gnu.org/licenses/> for a copy of the GNU General Public License
- # and <http://www.apache.org/licenses/LICENSE-2.0> for a copy of the Apache
- # License, Version 2.0.
- #
- """Tests for the object store interface."""
- from contextlib import closing
- from io import BytesIO
- import os
- import shutil
- import stat
- import tempfile
- from dulwich.index import (
- commit_tree,
- )
- from dulwich.errors import (
- NotTreeError,
- )
- from dulwich.objects import (
- sha_to_hex,
- Blob,
- Tree,
- TreeEntry,
- )
- from dulwich.object_store import (
- DiskObjectStore,
- MemoryObjectStore,
- ObjectStoreGraphWalker,
- commit_tree_changes,
- tree_lookup_path,
- )
- from dulwich.pack import (
- REF_DELTA,
- write_pack_objects,
- )
- from dulwich.tests import (
- TestCase,
- )
- from dulwich.tests.utils import (
- make_object,
- make_tag,
- build_pack,
- )
- testobject = make_object(Blob, data=b"yummy data")  # shared Blob fixture reused by the store tests in this file
class ObjectStoreTests(object):
    """Store-agnostic test mixin for the object store interface.

    The concrete test classes in this file assign the store under test to
    ``self.store`` in ``setUp`` and also inherit from ``TestCase``, which
    supplies the ``assert*`` helpers used here.
    """

    def test_determine_wants_all(self):
        """A ref pointing at a non-zero SHA is reported as wanted."""
        self.assertEqual(
            [b"1" * 40],
            self.store.determine_wants_all({b"refs/heads/foo": b"1" * 40}))

    def test_determine_wants_all_zero(self):
        """A ref whose value is the all-zero SHA yields no wants."""
        self.assertEqual(
            [], self.store.determine_wants_all({b"refs/heads/foo": b"0" * 40}))

    def test_iter(self):
        """The store under test is expected to start out empty."""
        self.assertEqual([], list(self.store))

    def test_get_nonexistant(self):
        """Indexing with an unknown SHA raises ``KeyError``."""
        self.assertRaises(KeyError, self.store.__getitem__, b"a" * 40)

    def test_contains_nonexistant(self):
        """An unknown SHA is not reported as contained."""
        self.assertNotIn(b"a" * 40, self.store)

    def test_add_objects_empty(self):
        """Adding an empty batch must not raise."""
        self.store.add_objects([])

    def test_add_commit(self):
        # TODO: Argh, no way to construct Git commit objects without
        # access to a serialized form.
        self.store.add_objects([])

    def test_store_resilience(self):
        """Test if updating an existing stored object doesn't erase the
        object from the store.
        """
        test_object = make_object(Blob, data=b'data')
        self.store.add_object(test_object)
        # Remember the id before mutating the local object.
        test_object_id = test_object.id
        test_object.data = test_object.data + b'update'
        stored_test_object = self.store[test_object_id]

        # The local object now has a new id; the stored one keeps the old.
        self.assertNotEqual(test_object.id, stored_test_object.id)
        self.assertEqual(stored_test_object.id, test_object_id)

    def test_add_object(self):
        """A single added object is listed, contained and retrievable."""
        self.store.add_object(testobject)
        self.assertEqual({testobject.id}, set(self.store))
        self.assertIn(testobject.id, self.store)
        r = self.store[testobject.id]
        self.assertEqual(r, testobject)

    def test_add_objects(self):
        """An object added through the batch API is visible afterwards."""
        data = [(testobject, "mypath")]
        self.store.add_objects(data)
        self.assertEqual({testobject.id}, set(self.store))
        self.assertIn(testobject.id, self.store)
        r = self.store[testobject.id]
        self.assertEqual(r, testobject)

    def test_tree_changes(self):
        """``tree_changes`` reports the modified entry, and the unchanged
        one as well when ``want_unchanged=True``.
        """
        blob_a1 = make_object(Blob, data=b'a1')
        blob_a2 = make_object(Blob, data=b'a2')
        blob_b = make_object(Blob, data=b'b')
        for blob in [blob_a1, blob_a2, blob_b]:
            self.store.add_object(blob)

        # Two trees that differ only in the content of path b'a'.
        blobs_1 = [(b'a', blob_a1.id, 0o100644), (b'b', blob_b.id, 0o100644)]
        tree1_id = commit_tree(self.store, blobs_1)
        blobs_2 = [(b'a', blob_a2.id, 0o100644), (b'b', blob_b.id, 0o100644)]
        tree2_id = commit_tree(self.store, blobs_2)

        change_a = ((b'a', b'a'), (0o100644, 0o100644),
                    (blob_a1.id, blob_a2.id))
        self.assertEqual([change_a],
                         list(self.store.tree_changes(tree1_id, tree2_id)))
        self.assertEqual(
            [change_a, ((b'b', b'b'), (0o100644, 0o100644),
                        (blob_b.id, blob_b.id))],
            list(self.store.tree_changes(tree1_id, tree2_id,
                                         want_unchanged=True)))

    def test_iter_tree_contents(self):
        """Without ``include_trees`` only the blob entries are yielded, in
        the same order as the sorted input paths.
        """
        blob_a = make_object(Blob, data=b'a')
        blob_b = make_object(Blob, data=b'b')
        blob_c = make_object(Blob, data=b'c')
        for blob in [blob_a, blob_b, blob_c]:
            self.store.add_object(blob)

        blobs = [
            (b'a', blob_a.id, 0o100644),
            (b'ad/b', blob_b.id, 0o100644),
            (b'ad/bd/c', blob_c.id, 0o100755),
            (b'ad/c', blob_c.id, 0o100644),
            (b'c', blob_c.id, 0o100644),
        ]
        tree_id = commit_tree(self.store, blobs)
        # The input tuples are (path, sha, mode); TreeEntry takes
        # (path, mode, sha), hence the reordering.
        self.assertEqual([TreeEntry(p, m, h) for (p, h, m) in blobs],
                         list(self.store.iter_tree_contents(tree_id)))

    def test_iter_tree_contents_include_trees(self):
        """With ``include_trees=True`` the root and every subtree are
        yielded ahead of their children.
        """
        blob_a = make_object(Blob, data=b'a')
        blob_b = make_object(Blob, data=b'b')
        blob_c = make_object(Blob, data=b'c')
        for blob in [blob_a, blob_b, blob_c]:
            self.store.add_object(blob)

        blobs = [
            (b'a', blob_a.id, 0o100644),
            (b'ad/b', blob_b.id, 0o100644),
            (b'ad/bd/c', blob_c.id, 0o100755),
        ]
        tree_id = commit_tree(self.store, blobs)
        tree = self.store[tree_id]
        # Index [1] of a tree item is used here as the entry's SHA.
        tree_ad = self.store[tree[b'ad'][1]]
        tree_bd = self.store[tree_ad[b'bd'][1]]

        expected = [
            TreeEntry(b'', 0o040000, tree_id),
            TreeEntry(b'a', 0o100644, blob_a.id),
            TreeEntry(b'ad', 0o040000, tree_ad.id),
            TreeEntry(b'ad/b', 0o100644, blob_b.id),
            TreeEntry(b'ad/bd', 0o040000, tree_bd.id),
            TreeEntry(b'ad/bd/c', 0o100755, blob_c.id),
        ]
        actual = self.store.iter_tree_contents(tree_id, include_trees=True)
        self.assertEqual(expected, list(actual))

    def make_tag(self, name, obj):
        """Create a tag named ``name`` for ``obj``, store it and return it.

        The ``make_tag`` called in the body is the module-level helper
        imported from the test utilities, not this method.
        """
        tag = make_tag(obj, name=name)
        self.store.add_object(tag)
        return tag

    def test_peel_sha(self):
        """Peeling the blob itself or any tag on it yields the blob."""
        self.store.add_object(testobject)
        # NOTE(review): all three tags point directly at the blob, so a
        # tag-of-a-tag chain is not exercised here.
        tag1 = self.make_tag(b'1', testobject)
        tag2 = self.make_tag(b'2', testobject)
        tag3 = self.make_tag(b'3', testobject)
        for obj in [testobject, tag1, tag2, tag3]:
            self.assertEqual(testobject, self.store.peel_sha(obj.id))

    def test_get_raw(self):
        """``get_raw`` returns the ``(type_num, raw_data)`` pair."""
        self.store.add_object(testobject)
        self.assertEqual((Blob.type_num, b'yummy data'),
                         self.store.get_raw(testobject.id))

    def test_close(self):
        # For now, just check that close doesn't barf.
        self.store.add_object(testobject)
        self.store.close()
class MemoryObjectStoreTests(ObjectStoreTests, TestCase):
    """Run the generic store tests against ``MemoryObjectStore`` and add
    pack-related checks specific to it.
    """

    def setUp(self):
        TestCase.setUp(self)
        self.store = MemoryObjectStore()

    def test_add_pack(self):
        """Writing one object into an ``add_pack`` file and committing it
        must not raise.
        """
        o = MemoryObjectStore()
        f, commit, abort = o.add_pack()
        try:
            b = make_object(Blob, data=b"more yummy data")
            write_pack_objects(f, [(b, None)])
        except BaseException:
            # Same reach as the former bare ``except:``, spelled out
            # explicitly; abort the pack, then let the error propagate.
            abort()
            raise
        else:
            commit()

    def test_add_pack_emtpy(self):
        """Committing a pack nothing was written to must not raise."""
        o = MemoryObjectStore()
        # Only the commit callback is needed for this check.
        _f, commit, _abort = o.add_pack()
        commit()

    def test_add_thin_pack(self):
        """A REF_DELTA entry based on a blob already in the store can be
        read back as a full blob after ``add_thin_pack``.
        """
        o = MemoryObjectStore()
        blob = make_object(Blob, data=b'yummy data')
        o.add_object(blob)

        f = BytesIO()
        entries = build_pack(f, [
            (REF_DELTA, (blob.id, b'more yummy data')),
        ], store=o)
        o.add_thin_pack(f.read, None)
        # Element 3 of a build_pack entry is used here as the binary SHA.
        packed_blob_sha = sha_to_hex(entries[0][3])
        self.assertEqual((Blob.type_num, b'more yummy data'),
                         o.get_raw(packed_blob_sha))

    def test_add_thin_pack_empty(self):
        """An empty thin pack is accepted without error."""
        o = MemoryObjectStore()

        f = BytesIO()
        entries = build_pack(f, [], store=o)
        self.assertEqual([], entries)
        o.add_thin_pack(f.read, None)
class PackBasedObjectStoreTests(ObjectStoreTests):
    """Additional checks for stores that expose a ``packs`` collection.

    Like its base this is a mixin: the concrete subclass supplies
    ``self.store`` and the ``TestCase`` machinery.
    """

    def tearDown(self):
        """Close every pack the store currently reports."""
        for open_pack in self.store.packs:
            open_pack.close()

    def _add_one_by_one(self, *payloads):
        """Make a blob per payload, add each via ``add_object``."""
        blobs = [make_object(Blob, data=payload) for payload in payloads]
        for blob in blobs:
            self.store.add_object(blob)
        return blobs

    def _add_batch(self, *payloads):
        """Make a blob per payload, add them in one ``add_objects`` call."""
        blobs = [make_object(Blob, data=payload) for payload in payloads]
        self.store.add_objects([(blob, None) for blob in blobs])
        return blobs

    def test_empty_packs(self):
        """The store under test is expected to start with no packs."""
        self.assertEqual([], list(self.store.packs))

    def test_pack_loose_objects(self):
        """Two singly-added blobs get packed by the first
        ``pack_loose_objects`` call; a second call has nothing left to do.
        """
        singles = self._add_one_by_one(b"yummy data", b"more yummy data")
        batch = self._add_batch(
            b"even more yummy data", b"and more yummy data")

        expected_ids = {blob.id for blob in singles + batch}
        self.assertEqual(expected_ids, set(self.store))
        # One pack is expected to exist before any explicit packing.
        self.assertEqual(1, len(self.store.packs))

        self.assertEqual(2, self.store.pack_loose_objects())
        self.assertNotEqual([], list(self.store.packs))
        self.assertEqual(0, self.store.pack_loose_objects())

    def test_repack(self):
        """``repack`` reports six objects and leaves a single pack."""
        singles = self._add_one_by_one(b"yummy data", b"more yummy data")
        first_batch = self._add_batch(
            b"even more yummy data", b"and more yummy data")
        second_batch = self._add_batch(
            b"and more data", b"and some more data")

        expected_ids = {
            blob.id for blob in singles + first_batch + second_batch}
        self.assertEqual(expected_ids, set(self.store))
        # Two batches were added, and two packs are expected up front.
        self.assertEqual(2, len(self.store.packs))

        self.assertEqual(6, self.store.repack())
        self.assertEqual(1, len(self.store.packs))
        self.assertEqual(0, self.store.pack_loose_objects())
class DiskObjectStoreTests(PackBasedObjectStoreTests, TestCase):
    """Run the generic and pack-based tests against ``DiskObjectStore``,
    plus checks for alternates and on-disk packs.
    """

    def setUp(self):
        TestCase.setUp(self)
        self.store_dir = tempfile.mkdtemp()
        self.addCleanup(shutil.rmtree, self.store_dir)
        self.store = DiskObjectStore.init(self.store_dir)

    def tearDown(self):
        """Run the ``TestCase`` teardown, then close the store's packs."""
        TestCase.tearDown(self)
        PackBasedObjectStoreTests.tearDown(self)

    def test_alternates(self):
        """An object that lives only in an alternate store becomes
        visible once the alternate path has been added.
        """
        alternate_dir = tempfile.mkdtemp()
        self.addCleanup(shutil.rmtree, alternate_dir)
        alternate_store = DiskObjectStore(alternate_dir)

        b2 = make_object(Blob, data=b"yummy data")
        alternate_store.add_object(b2)
        store = DiskObjectStore(self.store_dir)
        self.assertRaises(KeyError, store.__getitem__, b2.id)
        store.add_alternate_path(alternate_dir)
        self.assertIn(b2.id, store)
        self.assertEqual(b2, store[b2.id])

    def test_add_alternate_path(self):
        """Added alternate paths are read back in insertion order."""
        store = DiskObjectStore(self.store_dir)
        self.assertEqual([], list(store._read_alternate_paths()))
        store.add_alternate_path("/foo/path")
        self.assertEqual(["/foo/path"], list(store._read_alternate_paths()))
        store.add_alternate_path("/bar/path")
        self.assertEqual(
            ["/foo/path", "/bar/path"],
            list(store._read_alternate_paths()))

    def test_rel_alternative_path(self):
        """An alternate given as a path relative to the store directory
        resolves to the same objects as the alternate store itself.
        """
        alternate_dir = tempfile.mkdtemp()
        self.addCleanup(shutil.rmtree, alternate_dir)
        alternate_store = DiskObjectStore(alternate_dir)
        b2 = make_object(Blob, data=b"yummy data")
        alternate_store.add_object(b2)
        store = DiskObjectStore(self.store_dir)
        self.assertRaises(KeyError, store.__getitem__, b2.id)
        store.add_alternate_path(
            os.path.relpath(alternate_dir, self.store_dir))
        self.assertEqual(list(alternate_store), list(store.alternates[0]))
        self.assertIn(b2.id, store)
        self.assertEqual(b2, store[b2.id])

    def test_pack_dir(self):
        """``pack_dir`` is the ``pack`` subdirectory of the store path."""
        o = DiskObjectStore(self.store_dir)
        self.assertEqual(os.path.join(self.store_dir, "pack"), o.pack_dir)

    def test_add_pack(self):
        """Writing one object into an ``add_pack`` file and committing it
        must not raise.
        """
        o = DiskObjectStore(self.store_dir)
        # Close this second store when the test ends, as the thin-pack
        # tests in this class do. Cleanups run last-registered-first, so
        # this happens before setUp's rmtree of the store directory.
        self.addCleanup(o.close)
        f, commit, abort = o.add_pack()
        try:
            b = make_object(Blob, data=b"more yummy data")
            write_pack_objects(f, [(b, None)])
        except BaseException:
            # Same reach as the former bare ``except:``, spelled out
            # explicitly; abort the pack, then let the error propagate.
            abort()
            raise
        else:
            commit()

    def test_add_thin_pack(self):
        """A thin pack holding a REF_DELTA against a stored blob ends up
        containing both the base blob and the reconstructed blob.
        """
        with closing(DiskObjectStore(self.store_dir)) as o:
            blob = make_object(Blob, data=b'yummy data')
            o.add_object(blob)

            f = BytesIO()
            entries = build_pack(f, [
                (REF_DELTA, (blob.id, b'more yummy data')),
            ], store=o)

            with o.add_thin_pack(f.read, None) as pack:
                # Element 3 of a build_pack entry is used as the binary
                # SHA of the packed object.
                packed_blob_sha = sha_to_hex(entries[0][3])
                pack.check_length_and_checksum()
                self.assertEqual(
                    sorted([blob.id, packed_blob_sha]), list(pack))
                self.assertTrue(o.contains_packed(packed_blob_sha))
                self.assertTrue(o.contains_packed(blob.id))
                self.assertEqual((Blob.type_num, b'more yummy data'),
                                 o.get_raw(packed_blob_sha))

    def test_add_thin_pack_empty(self):
        """An empty thin pack is accepted without error."""
        with closing(DiskObjectStore(self.store_dir)) as o:
            f = BytesIO()
            entries = build_pack(f, [], store=o)
            self.assertEqual([], entries)
            o.add_thin_pack(f.read, None)
class TreeLookupPathTests(TestCase):
    """Tests for ``tree_lookup_path`` against a small nested tree."""

    def setUp(self):
        """Build an in-memory store holding three blobs and one tree with
        entries at the root, under ``ad/`` and under ``ad/bd/``.
        """
        TestCase.setUp(self)
        self.store = MemoryObjectStore()
        blob_a = make_object(Blob, data=b'a')
        blob_b = make_object(Blob, data=b'b')
        blob_c = make_object(Blob, data=b'c')
        for blob in [blob_a, blob_b, blob_c]:
            self.store.add_object(blob)

        blobs = [
            (b'a', blob_a.id, 0o100644),
            (b'ad/b', blob_b.id, 0o100644),
            (b'ad/bd/c', blob_c.id, 0o100755),
            (b'ad/c', blob_c.id, 0o100644),
            (b'c', blob_c.id, 0o100644),
        ]
        self.tree_id = commit_tree(self.store, blobs)

    def get_object(self, sha):
        """Lookup callback handed to ``tree_lookup_path``."""
        return self.store[sha]

    def test_lookup_blob(self):
        """A top-level file path resolves to a ``Blob``."""
        # Index [1] of the lookup result is used as the object id.
        o_id = tree_lookup_path(self.get_object, self.tree_id, b'a')[1]
        self.assertIsInstance(self.store[o_id], Blob)

    def test_lookup_tree(self):
        """Directory paths resolve to a ``Tree``, including a nested one
        and one written with a trailing slash.
        """
        o_id = tree_lookup_path(self.get_object, self.tree_id, b'ad')[1]
        self.assertIsInstance(self.store[o_id], Tree)
        o_id = tree_lookup_path(self.get_object, self.tree_id, b'ad/bd')[1]
        self.assertIsInstance(self.store[o_id], Tree)
        o_id = tree_lookup_path(self.get_object, self.tree_id, b'ad/bd/')[1]
        self.assertIsInstance(self.store[o_id], Tree)

    def test_lookup_nonexistent(self):
        """A path that is not in the tree raises ``KeyError``."""
        self.assertRaises(
            KeyError, tree_lookup_path, self.get_object, self.tree_id, b'j')

    def test_lookup_not_tree(self):
        """Descending through a blob raises ``NotTreeError``."""
        self.assertRaises(
            NotTreeError, tree_lookup_path, self.get_object, self.tree_id,
            b'ad/b/j')
class ObjectStoreGraphWalkerTests(TestCase):
    """Tests for ``ObjectStoreGraphWalker`` over tiny hand-built graphs.

    Graphs are written with one-byte names; ``get_walker`` stretches each
    name to 40 bytes before handing it to the walker.
    """

    def get_walker(self, heads, parent_map):
        """Return a walker over ``parent_map`` starting from ``heads``.

        Every key, parent and head is repeated 40 times, and the walker is
        given the expanded mapping's ``__getitem__`` as parent lookup.
        """
        expanded_parents = {
            child * 40: [parent * 40 for parent in parents]
            for child, parents in parent_map.items()
        }
        expanded_heads = [head * 40 for head in heads]
        return ObjectStoreGraphWalker(expanded_heads,
                                      expanded_parents.__getitem__)

    def test_ack_invalid_value(self):
        """Acking a value of the wrong length raises ``ValueError``."""
        walker = self.get_walker([], {})
        self.assertRaises(ValueError, walker.ack, "tooshort")

    def test_empty(self):
        """A walker with no heads yields ``None``, before and after an
        ack.
        """
        walker = self.get_walker([], {})
        self.assertIs(None, next(walker))
        walker.ack(b"a" * 40)
        self.assertIs(None, next(walker))

    def test_descends(self):
        """The head is yielded first, then its parent."""
        walker = self.get_walker([b"a"], {b"a": [b"b"], b"b": []})
        sha_a, sha_b = b"a" * 40, b"b" * 40
        self.assertEqual(sha_a, next(walker))
        self.assertEqual(sha_b, next(walker))

    def test_present(self):
        """Acking the head before walking leaves nothing to yield."""
        walker = self.get_walker([b"a"], {b"a": [b"b"], b"b": []})
        walker.ack(b"a" * 40)
        self.assertIs(None, next(walker))

    def test_parent_present(self):
        """Acking the head after it was yielded stops the walk before its
        parent.
        """
        walker = self.get_walker([b"a"], {b"a": [b"b"], b"b": []})
        sha_a = b"a" * 40
        self.assertEqual(sha_a, next(walker))
        walker.ack(sha_a)
        self.assertIs(None, next(walker))

    def test_child_ack_later(self):
        """Acking the head after its parent was already yielded still
        ends the walk.
        """
        walker = self.get_walker(
            [b"a"], {b"a": [b"b"], b"b": [b"c"], b"c": []})
        sha_a, sha_b = b"a" * 40, b"b" * 40
        self.assertEqual(sha_a, next(walker))
        self.assertEqual(sha_b, next(walker))
        walker.ack(sha_a)
        self.assertIs(None, next(walker))

    def test_only_once(self):
        """With two branches joining at ``e``, acking one head still lets
        a, b, c and d each be yielded once, children before parents.
        """
        # a  b
        # |  |
        # c  d
        #  \ /
        #   e
        walker = self.get_walker([b"a", b"b"], {
            b"a": [b"c"],
            b"b": [b"d"],
            b"c": [b"e"],
            b"d": [b"e"],
            b"e": [],
        })
        sha_a, sha_b, sha_c, sha_d = [
            name * 40 for name in (b"a", b"b", b"c", b"d")]

        walk = [next(walker), next(walker)]
        # A branch (a, c) or (b, d) may be done after 2 steps or 3 depending
        # on the order walked: 3-step walks include (a, b, c) and (b, a, d),
        # etc.
        acked = walk in ([sha_a, sha_c], [sha_b, sha_d])
        if acked:
            walker.ack(walk[0])

        walk.append(next(walker))
        if not acked:
            # The third step finished one branch; ack that branch's head.
            if walk[2] == sha_c:
                walker.ack(sha_a)
            elif walk[2] == sha_d:
                walker.ack(sha_b)
        walk.append(next(walker))
        self.assertIs(None, next(walker))

        self.assertEqual([sha_a, sha_b, sha_c, sha_d], sorted(walk))
        self.assertLess(walk.index(sha_a), walk.index(sha_c))
        self.assertLess(walk.index(sha_b), walk.index(sha_d))
class CommitTreeChangesTests(TestCase):
    """Tests for ``commit_tree_changes`` applied to a small nested tree."""

    def setUp(self):
        """Store blobs ``a``, ``b`` and ``c`` and commit a base tree with
        entries at the root, under ``ad/`` and under ``ad/bd/``.
        """
        super(CommitTreeChangesTests, self).setUp()
        self.store = MemoryObjectStore()
        self.blob_a, self.blob_b, self.blob_c = [
            make_object(Blob, data=payload)
            for payload in (b'a', b'b', b'c')]
        for blob in (self.blob_a, self.blob_b, self.blob_c):
            self.store.add_object(blob)

        regular, executable = 0o100644, 0o100755
        self.tree_id = commit_tree(self.store, [
            (b'a', self.blob_a.id, regular),
            (b'ad/b', self.blob_b.id, regular),
            (b'ad/bd/c', self.blob_c.id, executable),
            (b'ad/c', self.blob_c.id, regular),
            (b'c', self.blob_c.id, regular),
        ])

    def test_no_changes(self):
        """An empty change list gives a tree equal to the base tree."""
        untouched = self.store[self.tree_id]
        result = commit_tree_changes(
            self.store, self.store[self.tree_id], [])
        self.assertEqual(untouched, result)

    def test_add_blob(self):
        """Adding a root-level path creates a matching tree entry."""
        blob_d = make_object(Blob, data=b'd')
        changes = [(b'd', 0o100644, blob_d.id)]
        new_tree = commit_tree_changes(
            self.store, self.store[self.tree_id], changes)
        added_entry = new_tree[b'd']
        self.assertEqual(
            added_entry,
            (33188, b'c59d9b6344f1af00e504ba698129f07a34bbed8d'))

    def test_add_blob_in_dir(self):
        """Adding ``e/f/d`` creates the ``e`` and ``e/f`` trees on the way
        and leaves the existing root entries in place.
        """
        blob_d = make_object(Blob, data=b'd')
        changes = [(b'e/f/d', 0o100644, blob_d.id)]
        new_tree = commit_tree_changes(
            self.store, self.store[self.tree_id], changes)
        file_mode = stat.S_IFREG | 0o100644
        dir_mode = stat.S_IFDIR

        expected_root = [
            TreeEntry(path=b'a', mode=file_mode, sha=self.blob_a.id),
            TreeEntry(path=b'ad', mode=dir_mode,
                      sha=b'0e2ce2cd7725ff4817791be31ccd6e627e801f4a'),
            TreeEntry(path=b'c', mode=file_mode, sha=self.blob_c.id),
            TreeEntry(path=b'e', mode=dir_mode,
                      sha=b'6ab344e288724ac2fb38704728b8896e367ed108'),
        ]
        self.assertEqual(new_tree.items(), expected_root)

        # Index [1] of a tree item is used as the SHA of the subtree.
        e_tree = self.store[new_tree[b'e'][1]]
        expected_e = [
            TreeEntry(path=b'f', mode=dir_mode,
                      sha=b'24d2c94d8af232b15a0978c006bf61ef4479a0a5'),
        ]
        self.assertEqual(e_tree.items(), expected_e)

        f_tree = self.store[e_tree[b'f'][1]]
        expected_f = [
            TreeEntry(path=b'd', mode=file_mode, sha=blob_d.id),
        ]
        self.assertEqual(f_tree.items(), expected_f)

    def test_delete_blob(self):
        """A change with ``None`` mode and sha removes the path; here
        ``ad/bd`` disappears from ``ad`` along with its only entry.
        """
        removals = [(b'ad/bd/c', None, None)]
        new_tree = commit_tree_changes(
            self.store, self.store[self.tree_id], removals)
        self.assertEqual(set(new_tree), {b'a', b'ad', b'c'})
        ad_tree = self.store[new_tree[b'ad'][1]]
        self.assertEqual(set(ad_tree), {b'b', b'c'})
|