test_lru_cache.py 16 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447
  1. # Copyright (C) 2006, 2008 Canonical Ltd
  2. #
  3. # This program is free software; you can redistribute it and/or modify
  4. # it under the terms of the GNU General Public License as published by
  5. # the Free Software Foundation; either version 2 of the License, or
  6. # (at your option) any later version.
  7. #
  8. # This program is distributed in the hope that it will be useful,
  9. # but WITHOUT ANY WARRANTY; without even the implied warranty of
  10. # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  11. # GNU General Public License for more details.
  12. #
  13. # You should have received a copy of the GNU General Public License
  14. # along with this program; if not, write to the Free Software
  15. # Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  16. """Tests for the lru_cache module."""
  17. from dulwich import (
  18. lru_cache,
  19. )
  20. import unittest
  21. class TestLRUCache(unittest.TestCase):
  22. """Test that LRU cache properly keeps track of entries."""
  23. def test_cache_size(self):
  24. cache = lru_cache.LRUCache(max_cache=10)
  25. self.assertEqual(10, cache.cache_size())
  26. cache = lru_cache.LRUCache(max_cache=256)
  27. self.assertEqual(256, cache.cache_size())
  28. cache.resize(512)
  29. self.assertEqual(512, cache.cache_size())
  30. def test_missing(self):
  31. cache = lru_cache.LRUCache(max_cache=10)
  32. self.failIf('foo' in cache)
  33. self.assertRaises(KeyError, cache.__getitem__, 'foo')
  34. cache['foo'] = 'bar'
  35. self.assertEqual('bar', cache['foo'])
  36. self.failUnless('foo' in cache)
  37. self.failIf('bar' in cache)
  38. def test_map_None(self):
  39. # Make sure that we can properly map None as a key.
  40. cache = lru_cache.LRUCache(max_cache=10)
  41. self.failIf(None in cache)
  42. cache[None] = 1
  43. self.assertEqual(1, cache[None])
  44. cache[None] = 2
  45. self.assertEqual(2, cache[None])
  46. # Test the various code paths of __getitem__, to make sure that we can
  47. # handle when None is the key for the LRU and the MRU
  48. cache[1] = 3
  49. cache[None] = 1
  50. cache[None]
  51. cache[1]
  52. cache[None]
  53. self.assertEqual([None, 1], [n.key for n in cache._walk_lru()])
  54. def test_add__null_key(self):
  55. cache = lru_cache.LRUCache(max_cache=10)
  56. self.assertRaises(ValueError, cache.add, lru_cache._null_key, 1)
  57. def test_overflow(self):
  58. """Adding extra entries will pop out old ones."""
  59. cache = lru_cache.LRUCache(max_cache=1, after_cleanup_count=1)
  60. cache['foo'] = 'bar'
  61. # With a max cache of 1, adding 'baz' should pop out 'foo'
  62. cache['baz'] = 'biz'
  63. self.failIf('foo' in cache)
  64. self.failUnless('baz' in cache)
  65. self.assertEqual('biz', cache['baz'])
  66. def test_by_usage(self):
  67. """Accessing entries bumps them up in priority."""
  68. cache = lru_cache.LRUCache(max_cache=2)
  69. cache['baz'] = 'biz'
  70. cache['foo'] = 'bar'
  71. self.assertEqual('biz', cache['baz'])
  72. # This must kick out 'foo' because it was the last accessed
  73. cache['nub'] = 'in'
  74. self.failIf('foo' in cache)
  75. def test_cleanup(self):
  76. """Test that we can use a cleanup function."""
  77. cleanup_called = []
  78. def cleanup_func(key, val):
  79. cleanup_called.append((key, val))
  80. cache = lru_cache.LRUCache(max_cache=2)
  81. cache.add('baz', '1', cleanup=cleanup_func)
  82. cache.add('foo', '2', cleanup=cleanup_func)
  83. cache.add('biz', '3', cleanup=cleanup_func)
  84. self.assertEqual([('baz', '1')], cleanup_called)
  85. # 'foo' is now most recent, so final cleanup will call it last
  86. cache['foo']
  87. cache.clear()
  88. self.assertEqual([('baz', '1'), ('biz', '3'), ('foo', '2')],
  89. cleanup_called)
  90. def test_cleanup_on_replace(self):
  91. """Replacing an object should cleanup the old value."""
  92. cleanup_called = []
  93. def cleanup_func(key, val):
  94. cleanup_called.append((key, val))
  95. cache = lru_cache.LRUCache(max_cache=2)
  96. cache.add(1, 10, cleanup=cleanup_func)
  97. cache.add(2, 20, cleanup=cleanup_func)
  98. cache.add(2, 25, cleanup=cleanup_func)
  99. self.assertEqual([(2, 20)], cleanup_called)
  100. self.assertEqual(25, cache[2])
  101. # Even __setitem__ should make sure cleanup() is called
  102. cache[2] = 26
  103. self.assertEqual([(2, 20), (2, 25)], cleanup_called)
  104. def test_len(self):
  105. cache = lru_cache.LRUCache(max_cache=10, after_cleanup_count=10)
  106. cache[1] = 10
  107. cache[2] = 20
  108. cache[3] = 30
  109. cache[4] = 40
  110. self.assertEqual(4, len(cache))
  111. cache[5] = 50
  112. cache[6] = 60
  113. cache[7] = 70
  114. cache[8] = 80
  115. self.assertEqual(8, len(cache))
  116. cache[1] = 15 # replacement
  117. self.assertEqual(8, len(cache))
  118. cache[9] = 90
  119. cache[10] = 100
  120. cache[11] = 110
  121. # We hit the max
  122. self.assertEqual(10, len(cache))
  123. self.assertEqual([11, 10, 9, 1, 8, 7, 6, 5, 4, 3],
  124. [n.key for n in cache._walk_lru()])
  125. def test_cleanup_shrinks_to_after_clean_count(self):
  126. cache = lru_cache.LRUCache(max_cache=5, after_cleanup_count=3)
  127. cache.add(1, 10)
  128. cache.add(2, 20)
  129. cache.add(3, 25)
  130. cache.add(4, 30)
  131. cache.add(5, 35)
  132. self.assertEqual(5, len(cache))
  133. # This will bump us over the max, which causes us to shrink down to
  134. # after_cleanup_cache size
  135. cache.add(6, 40)
  136. self.assertEqual(3, len(cache))
  137. def test_after_cleanup_larger_than_max(self):
  138. cache = lru_cache.LRUCache(max_cache=5, after_cleanup_count=10)
  139. self.assertEqual(5, cache._after_cleanup_count)
  140. def test_after_cleanup_none(self):
  141. cache = lru_cache.LRUCache(max_cache=5, after_cleanup_count=None)
  142. # By default _after_cleanup_size is 80% of the normal size
  143. self.assertEqual(4, cache._after_cleanup_count)
  144. def test_cleanup(self):
  145. cache = lru_cache.LRUCache(max_cache=5, after_cleanup_count=2)
  146. # Add these in order
  147. cache.add(1, 10)
  148. cache.add(2, 20)
  149. cache.add(3, 25)
  150. cache.add(4, 30)
  151. cache.add(5, 35)
  152. self.assertEqual(5, len(cache))
  153. # Force a compaction
  154. cache.cleanup()
  155. self.assertEqual(2, len(cache))
  156. def test_preserve_last_access_order(self):
  157. cache = lru_cache.LRUCache(max_cache=5)
  158. # Add these in order
  159. cache.add(1, 10)
  160. cache.add(2, 20)
  161. cache.add(3, 25)
  162. cache.add(4, 30)
  163. cache.add(5, 35)
  164. self.assertEqual([5, 4, 3, 2, 1], [n.key for n in cache._walk_lru()])
  165. # Now access some randomly
  166. cache[2]
  167. cache[5]
  168. cache[3]
  169. cache[2]
  170. self.assertEqual([2, 3, 5, 4, 1], [n.key for n in cache._walk_lru()])
  171. def test_get(self):
  172. cache = lru_cache.LRUCache(max_cache=5)
  173. cache.add(1, 10)
  174. cache.add(2, 20)
  175. self.assertEqual(20, cache.get(2))
  176. self.assertEquals(None, cache.get(3))
  177. obj = object()
  178. self.assertTrue(obj is cache.get(3, obj))
  179. self.assertEqual([2, 1], [n.key for n in cache._walk_lru()])
  180. self.assertEqual(10, cache.get(1))
  181. self.assertEqual([1, 2], [n.key for n in cache._walk_lru()])
  182. def test_keys(self):
  183. cache = lru_cache.LRUCache(max_cache=5, after_cleanup_count=5)
  184. cache[1] = 2
  185. cache[2] = 3
  186. cache[3] = 4
  187. self.assertEqual([1, 2, 3], sorted(cache.keys()))
  188. cache[4] = 5
  189. cache[5] = 6
  190. cache[6] = 7
  191. self.assertEqual([2, 3, 4, 5, 6], sorted(cache.keys()))
  192. def test_resize_smaller(self):
  193. cache = lru_cache.LRUCache(max_cache=5, after_cleanup_count=4)
  194. cache[1] = 2
  195. cache[2] = 3
  196. cache[3] = 4
  197. cache[4] = 5
  198. cache[5] = 6
  199. self.assertEqual([1, 2, 3, 4, 5], sorted(cache.keys()))
  200. cache[6] = 7
  201. self.assertEqual([3, 4, 5, 6], sorted(cache.keys()))
  202. # Now resize to something smaller, which triggers a cleanup
  203. cache.resize(max_cache=3, after_cleanup_count=2)
  204. self.assertEqual([5, 6], sorted(cache.keys()))
  205. # Adding something will use the new size
  206. cache[7] = 8
  207. self.assertEqual([5, 6, 7], sorted(cache.keys()))
  208. cache[8] = 9
  209. self.assertEqual([7, 8], sorted(cache.keys()))
  210. def test_resize_larger(self):
  211. cache = lru_cache.LRUCache(max_cache=5, after_cleanup_count=4)
  212. cache[1] = 2
  213. cache[2] = 3
  214. cache[3] = 4
  215. cache[4] = 5
  216. cache[5] = 6
  217. self.assertEqual([1, 2, 3, 4, 5], sorted(cache.keys()))
  218. cache[6] = 7
  219. self.assertEqual([3, 4, 5, 6], sorted(cache.keys()))
  220. cache.resize(max_cache=8, after_cleanup_count=6)
  221. self.assertEqual([3, 4, 5, 6], sorted(cache.keys()))
  222. cache[7] = 8
  223. cache[8] = 9
  224. cache[9] = 10
  225. cache[10] = 11
  226. self.assertEqual([3, 4, 5, 6, 7, 8, 9, 10], sorted(cache.keys()))
  227. cache[11] = 12 # triggers cleanup back to new after_cleanup_count
  228. self.assertEqual([6, 7, 8, 9, 10, 11], sorted(cache.keys()))
  229. class TestLRUSizeCache(unittest.TestCase):
  230. def test_basic_init(self):
  231. cache = lru_cache.LRUSizeCache()
  232. self.assertEqual(2048, cache._max_cache)
  233. self.assertEqual(int(cache._max_size*0.8), cache._after_cleanup_size)
  234. self.assertEqual(0, cache._value_size)
  235. def test_add__null_key(self):
  236. cache = lru_cache.LRUSizeCache()
  237. self.assertRaises(ValueError, cache.add, lru_cache._null_key, 1)
  238. def test_add_tracks_size(self):
  239. cache = lru_cache.LRUSizeCache()
  240. self.assertEqual(0, cache._value_size)
  241. cache.add('my key', 'my value text')
  242. self.assertEqual(13, cache._value_size)
  243. def test_remove_tracks_size(self):
  244. cache = lru_cache.LRUSizeCache()
  245. self.assertEqual(0, cache._value_size)
  246. cache.add('my key', 'my value text')
  247. self.assertEqual(13, cache._value_size)
  248. node = cache._cache['my key']
  249. cache._remove_node(node)
  250. self.assertEqual(0, cache._value_size)
  251. def test_no_add_over_size(self):
  252. """Adding a large value may not be cached at all."""
  253. cache = lru_cache.LRUSizeCache(max_size=10, after_cleanup_size=5)
  254. self.assertEqual(0, cache._value_size)
  255. self.assertEqual({}, cache.items())
  256. cache.add('test', 'key')
  257. self.assertEqual(3, cache._value_size)
  258. self.assertEqual({'test': 'key'}, cache.items())
  259. cache.add('test2', 'key that is too big')
  260. self.assertEqual(3, cache._value_size)
  261. self.assertEqual({'test':'key'}, cache.items())
  262. # If we would add a key, only to cleanup and remove all cached entries,
  263. # then obviously that value should not be stored
  264. cache.add('test3', 'bigkey')
  265. self.assertEqual(3, cache._value_size)
  266. self.assertEqual({'test':'key'}, cache.items())
  267. cache.add('test4', 'bikey')
  268. self.assertEqual(3, cache._value_size)
  269. self.assertEqual({'test':'key'}, cache.items())
  270. def test_no_add_over_size_cleanup(self):
  271. """If a large value is not cached, we will call cleanup right away."""
  272. cleanup_calls = []
  273. def cleanup(key, value):
  274. cleanup_calls.append((key, value))
  275. cache = lru_cache.LRUSizeCache(max_size=10, after_cleanup_size=5)
  276. self.assertEqual(0, cache._value_size)
  277. self.assertEqual({}, cache.items())
  278. cache.add('test', 'key that is too big', cleanup=cleanup)
  279. # key was not added
  280. self.assertEqual(0, cache._value_size)
  281. self.assertEqual({}, cache.items())
  282. # and cleanup was called
  283. self.assertEqual([('test', 'key that is too big')], cleanup_calls)
  284. def test_adding_clears_cache_based_on_size(self):
  285. """The cache is cleared in LRU order until small enough"""
  286. cache = lru_cache.LRUSizeCache(max_size=20)
  287. cache.add('key1', 'value') # 5 chars
  288. cache.add('key2', 'value2') # 6 chars
  289. cache.add('key3', 'value23') # 7 chars
  290. self.assertEqual(5+6+7, cache._value_size)
  291. cache['key2'] # reference key2 so it gets a newer reference time
  292. cache.add('key4', 'value234') # 8 chars, over limit
  293. # We have to remove 2 keys to get back under limit
  294. self.assertEqual(6+8, cache._value_size)
  295. self.assertEqual({'key2':'value2', 'key4':'value234'},
  296. cache.items())
  297. def test_adding_clears_to_after_cleanup_size(self):
  298. cache = lru_cache.LRUSizeCache(max_size=20, after_cleanup_size=10)
  299. cache.add('key1', 'value') # 5 chars
  300. cache.add('key2', 'value2') # 6 chars
  301. cache.add('key3', 'value23') # 7 chars
  302. self.assertEqual(5+6+7, cache._value_size)
  303. cache['key2'] # reference key2 so it gets a newer reference time
  304. cache.add('key4', 'value234') # 8 chars, over limit
  305. # We have to remove 3 keys to get back under limit
  306. self.assertEqual(8, cache._value_size)
  307. self.assertEqual({'key4':'value234'}, cache.items())
  308. def test_custom_sizes(self):
  309. def size_of_list(lst):
  310. return sum(len(x) for x in lst)
  311. cache = lru_cache.LRUSizeCache(max_size=20, after_cleanup_size=10,
  312. compute_size=size_of_list)
  313. cache.add('key1', ['val', 'ue']) # 5 chars
  314. cache.add('key2', ['val', 'ue2']) # 6 chars
  315. cache.add('key3', ['val', 'ue23']) # 7 chars
  316. self.assertEqual(5+6+7, cache._value_size)
  317. cache['key2'] # reference key2 so it gets a newer reference time
  318. cache.add('key4', ['value', '234']) # 8 chars, over limit
  319. # We have to remove 3 keys to get back under limit
  320. self.assertEqual(8, cache._value_size)
  321. self.assertEqual({'key4':['value', '234']}, cache.items())
  322. def test_cleanup(self):
  323. cache = lru_cache.LRUSizeCache(max_size=20, after_cleanup_size=10)
  324. # Add these in order
  325. cache.add('key1', 'value') # 5 chars
  326. cache.add('key2', 'value2') # 6 chars
  327. cache.add('key3', 'value23') # 7 chars
  328. self.assertEqual(5+6+7, cache._value_size)
  329. cache.cleanup()
  330. # Only the most recent fits after cleaning up
  331. self.assertEqual(7, cache._value_size)
  332. def test_keys(self):
  333. cache = lru_cache.LRUSizeCache(max_size=10)
  334. cache[1] = 'a'
  335. cache[2] = 'b'
  336. cache[3] = 'cdef'
  337. self.assertEqual([1, 2, 3], sorted(cache.keys()))
  338. def test_resize_smaller(self):
  339. cache = lru_cache.LRUSizeCache(max_size=10, after_cleanup_size=9)
  340. cache[1] = 'abc'
  341. cache[2] = 'def'
  342. cache[3] = 'ghi'
  343. cache[4] = 'jkl'
  344. # Triggers a cleanup
  345. self.assertEqual([2, 3, 4], sorted(cache.keys()))
  346. # Resize should also cleanup again
  347. cache.resize(max_size=6, after_cleanup_size=4)
  348. self.assertEqual([4], sorted(cache.keys()))
  349. # Adding should use the new max size
  350. cache[5] = 'mno'
  351. self.assertEqual([4, 5], sorted(cache.keys()))
  352. cache[6] = 'pqr'
  353. self.assertEqual([6], sorted(cache.keys()))
  354. def test_resize_larger(self):
  355. cache = lru_cache.LRUSizeCache(max_size=10, after_cleanup_size=9)
  356. cache[1] = 'abc'
  357. cache[2] = 'def'
  358. cache[3] = 'ghi'
  359. cache[4] = 'jkl'
  360. # Triggers a cleanup
  361. self.assertEqual([2, 3, 4], sorted(cache.keys()))
  362. cache.resize(max_size=15, after_cleanup_size=12)
  363. self.assertEqual([2, 3, 4], sorted(cache.keys()))
  364. cache[5] = 'mno'
  365. cache[6] = 'pqr'
  366. self.assertEqual([2, 3, 4, 5, 6], sorted(cache.keys()))
  367. cache[7] = 'stu'
  368. self.assertEqual([4, 5, 6, 7], sorted(cache.keys()))