repository.py 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329
  1. import os
  2. import shutil
  3. import tempfile
  4. from attic.testsuite.mock import patch
  5. from attic.hashindex import NSIndex
  6. from attic.helpers import Location, IntegrityError, UpgradableLock
  7. from attic.remote import RemoteRepository, InvalidRPCMethod
  8. from attic.repository import Repository
  9. from attic.testsuite import BaseTestCase
  10. class RepositoryTestCaseBase(BaseTestCase):
  11. key_size = 32
  12. def open(self, create=False):
  13. return Repository(os.path.join(self.tmppath, 'repository'), create=create)
  14. def setUp(self):
  15. self.tmppath = tempfile.mkdtemp()
  16. self.repository = self.open(create=True)
  17. def tearDown(self):
  18. self.repository.close()
  19. shutil.rmtree(self.tmppath)
  20. def reopen(self):
  21. if self.repository:
  22. self.repository.close()
  23. self.repository = self.open()
  24. class RepositoryTestCase(RepositoryTestCaseBase):
  25. def test1(self):
  26. for x in range(100):
  27. self.repository.put(('%-32d' % x).encode('ascii'), b'SOMEDATA')
  28. key50 = ('%-32d' % 50).encode('ascii')
  29. self.assert_equal(self.repository.get(key50), b'SOMEDATA')
  30. self.repository.delete(key50)
  31. self.assert_raises(Repository.ObjectNotFound, lambda: self.repository.get(key50))
  32. self.repository.commit()
  33. self.repository.close()
  34. repository2 = self.open()
  35. self.assert_raises(Repository.ObjectNotFound, lambda: repository2.get(key50))
  36. for x in range(100):
  37. if x == 50:
  38. continue
  39. self.assert_equal(repository2.get(('%-32d' % x).encode('ascii')), b'SOMEDATA')
  40. repository2.close()
  41. def test2(self):
  42. """Test multiple sequential transactions
  43. """
  44. self.repository.put(b'00000000000000000000000000000000', b'foo')
  45. self.repository.put(b'00000000000000000000000000000001', b'foo')
  46. self.repository.commit()
  47. self.repository.delete(b'00000000000000000000000000000000')
  48. self.repository.put(b'00000000000000000000000000000001', b'bar')
  49. self.repository.commit()
  50. self.assert_equal(self.repository.get(b'00000000000000000000000000000001'), b'bar')
  51. def test_consistency(self):
  52. """Test cache consistency
  53. """
  54. self.repository.put(b'00000000000000000000000000000000', b'foo')
  55. self.assert_equal(self.repository.get(b'00000000000000000000000000000000'), b'foo')
  56. self.repository.put(b'00000000000000000000000000000000', b'foo2')
  57. self.assert_equal(self.repository.get(b'00000000000000000000000000000000'), b'foo2')
  58. self.repository.put(b'00000000000000000000000000000000', b'bar')
  59. self.assert_equal(self.repository.get(b'00000000000000000000000000000000'), b'bar')
  60. self.repository.delete(b'00000000000000000000000000000000')
  61. self.assert_raises(Repository.ObjectNotFound, lambda: self.repository.get(b'00000000000000000000000000000000'))
  62. def test_consistency2(self):
  63. """Test cache consistency2
  64. """
  65. self.repository.put(b'00000000000000000000000000000000', b'foo')
  66. self.assert_equal(self.repository.get(b'00000000000000000000000000000000'), b'foo')
  67. self.repository.commit()
  68. self.repository.put(b'00000000000000000000000000000000', b'foo2')
  69. self.assert_equal(self.repository.get(b'00000000000000000000000000000000'), b'foo2')
  70. self.repository.rollback()
  71. self.assert_equal(self.repository.get(b'00000000000000000000000000000000'), b'foo')
  72. def test_overwrite_in_same_transaction(self):
  73. """Test cache consistency2
  74. """
  75. self.repository.put(b'00000000000000000000000000000000', b'foo')
  76. self.repository.put(b'00000000000000000000000000000000', b'foo2')
  77. self.repository.commit()
  78. self.assert_equal(self.repository.get(b'00000000000000000000000000000000'), b'foo2')
  79. def test_single_kind_transactions(self):
  80. # put
  81. self.repository.put(b'00000000000000000000000000000000', b'foo')
  82. self.repository.commit()
  83. self.repository.close()
  84. # replace
  85. self.repository = self.open()
  86. self.repository.put(b'00000000000000000000000000000000', b'bar')
  87. self.repository.commit()
  88. self.repository.close()
  89. # delete
  90. self.repository = self.open()
  91. self.repository.delete(b'00000000000000000000000000000000')
  92. self.repository.commit()
  93. def test_list(self):
  94. for x in range(100):
  95. self.repository.put(('%-32d' % x).encode('ascii'), b'SOMEDATA')
  96. all = self.repository.list()
  97. self.assert_equal(len(all), 100)
  98. first_half = self.repository.list(limit=50)
  99. self.assert_equal(len(first_half), 50)
  100. self.assert_equal(first_half, all[:50])
  101. second_half = self.repository.list(marker=first_half[-1])
  102. self.assert_equal(len(second_half), 50)
  103. self.assert_equal(second_half, all[50:])
  104. self.assert_equal(len(self.repository.list(limit=50)), 50)
  105. class RepositoryCommitTestCase(RepositoryTestCaseBase):
  106. def add_keys(self):
  107. self.repository.put(b'00000000000000000000000000000000', b'foo')
  108. self.repository.put(b'00000000000000000000000000000001', b'bar')
  109. self.repository.put(b'00000000000000000000000000000003', b'bar')
  110. self.repository.commit()
  111. self.repository.put(b'00000000000000000000000000000001', b'bar2')
  112. self.repository.put(b'00000000000000000000000000000002', b'boo')
  113. self.repository.delete(b'00000000000000000000000000000003')
  114. def test_replay_of_missing_index(self):
  115. self.add_keys()
  116. for name in os.listdir(self.repository.path):
  117. if name.startswith('index.'):
  118. os.unlink(os.path.join(self.repository.path, name))
  119. self.reopen()
  120. self.assert_equal(len(self.repository), 3)
  121. self.assert_equal(self.repository.check(), True)
  122. def test_crash_before_compact_segments(self):
  123. self.add_keys()
  124. self.repository.compact_segments = None
  125. try:
  126. self.repository.commit()
  127. except TypeError:
  128. pass
  129. self.reopen()
  130. self.assert_equal(len(self.repository), 3)
  131. self.assert_equal(self.repository.check(), True)
  132. def test_replay_of_readonly_repository(self):
  133. self.add_keys()
  134. for name in os.listdir(self.repository.path):
  135. if name.startswith('index.'):
  136. os.unlink(os.path.join(self.repository.path, name))
  137. with patch.object(UpgradableLock, 'upgrade', side_effect=UpgradableLock.WriteLockFailed) as upgrade:
  138. self.reopen()
  139. self.assert_raises(UpgradableLock.WriteLockFailed, lambda: len(self.repository))
  140. upgrade.assert_called_once()
  141. def test_crash_before_write_index(self):
  142. self.add_keys()
  143. self.repository.write_index = None
  144. try:
  145. self.repository.commit()
  146. except TypeError:
  147. pass
  148. self.reopen()
  149. self.assert_equal(len(self.repository), 3)
  150. self.assert_equal(self.repository.check(), True)
  151. def test_crash_before_deleting_compacted_segments(self):
  152. self.add_keys()
  153. self.repository.io.delete_segment = None
  154. try:
  155. self.repository.commit()
  156. except TypeError:
  157. pass
  158. self.reopen()
  159. self.assert_equal(len(self.repository), 3)
  160. self.assert_equal(self.repository.check(), True)
  161. self.assert_equal(len(self.repository), 3)
  162. class RepositoryCheckTestCase(RepositoryTestCaseBase):
  163. def list_indices(self):
  164. return [name for name in os.listdir(os.path.join(self.tmppath, 'repository')) if name.startswith('index.')]
  165. def check(self, repair=False, status=True):
  166. self.assert_equal(self.repository.check(repair=repair), status)
  167. # Make sure no tmp files are left behind
  168. self.assert_equal([name for name in os.listdir(os.path.join(self.tmppath, 'repository')) if 'tmp' in name], [], 'Found tmp files')
  169. def get_objects(self, *ids):
  170. for id_ in ids:
  171. self.repository.get(('%032d' % id_).encode('ascii'))
  172. def add_objects(self, segments):
  173. for ids in segments:
  174. for id_ in ids:
  175. self.repository.put(('%032d' % id_).encode('ascii'), b'data')
  176. self.repository.commit()
  177. def get_head(self):
  178. return sorted(int(n) for n in os.listdir(os.path.join(self.tmppath, 'repository', 'data', '0')) if n.isdigit())[-1]
  179. def open_index(self):
  180. return NSIndex.read(os.path.join(self.tmppath, 'repository', 'index.{}'.format(self.get_head())))
  181. def corrupt_object(self, id_):
  182. idx = self.open_index()
  183. segment, offset = idx[('%032d' % id_).encode('ascii')]
  184. with open(os.path.join(self.tmppath, 'repository', 'data', '0', str(segment)), 'r+b') as fd:
  185. fd.seek(offset)
  186. fd.write(b'BOOM')
  187. def delete_segment(self, segment):
  188. os.unlink(os.path.join(self.tmppath, 'repository', 'data', '0', str(segment)))
  189. def delete_index(self):
  190. os.unlink(os.path.join(self.tmppath, 'repository', 'index.{}'.format(self.get_head())))
  191. def rename_index(self, new_name):
  192. os.rename(os.path.join(self.tmppath, 'repository', 'index.{}'.format(self.get_head())),
  193. os.path.join(self.tmppath, 'repository', new_name))
  194. def list_objects(self):
  195. return set(int(key) for key in self.repository.list())
  196. def test_repair_corrupted_segment(self):
  197. self.add_objects([[1, 2, 3], [4, 5, 6]])
  198. self.assert_equal(set([1, 2, 3, 4, 5, 6]), self.list_objects())
  199. self.check(status=True)
  200. self.corrupt_object(5)
  201. self.assert_raises(IntegrityError, lambda: self.get_objects(5))
  202. self.repository.rollback()
  203. # Make sure a regular check does not repair anything
  204. self.check(status=False)
  205. self.check(status=False)
  206. # Make sure a repair actually repairs the repo
  207. self.check(repair=True, status=True)
  208. self.get_objects(4)
  209. self.check(status=True)
  210. self.assert_equal(set([1, 2, 3, 4, 6]), self.list_objects())
  211. def test_repair_missing_segment(self):
  212. self.add_objects([[1, 2, 3], [4, 5, 6]])
  213. self.assert_equal(set([1, 2, 3, 4, 5, 6]), self.list_objects())
  214. self.check(status=True)
  215. self.delete_segment(1)
  216. self.repository.rollback()
  217. self.check(repair=True, status=True)
  218. self.assert_equal(set([1, 2, 3]), self.list_objects())
  219. def test_repair_missing_commit_segment(self):
  220. self.add_objects([[1, 2, 3], [4, 5, 6]])
  221. self.delete_segment(1)
  222. self.assert_raises(Repository.ObjectNotFound, lambda: self.get_objects(4))
  223. self.assert_equal(set([1, 2, 3]), self.list_objects())
  224. def test_repair_corrupted_commit_segment(self):
  225. self.add_objects([[1, 2, 3], [4, 5, 6]])
  226. with open(os.path.join(self.tmppath, 'repository', 'data', '0', '1'), 'r+b') as fd:
  227. fd.seek(-1, os.SEEK_END)
  228. fd.write(b'X')
  229. self.assert_raises(Repository.ObjectNotFound, lambda: self.get_objects(4))
  230. self.check(status=True)
  231. self.get_objects(3)
  232. self.assert_equal(set([1, 2, 3]), self.list_objects())
  233. def test_repair_no_commits(self):
  234. self.add_objects([[1, 2, 3]])
  235. with open(os.path.join(self.tmppath, 'repository', 'data', '0', '0'), 'r+b') as fd:
  236. fd.seek(-1, os.SEEK_END)
  237. fd.write(b'X')
  238. self.assert_raises(Repository.CheckNeeded, lambda: self.get_objects(4))
  239. self.check(status=False)
  240. self.check(status=False)
  241. self.assert_equal(self.list_indices(), ['index.0'])
  242. self.check(repair=True, status=True)
  243. self.assert_equal(self.list_indices(), ['index.1'])
  244. self.check(status=True)
  245. self.get_objects(3)
  246. self.assert_equal(set([1, 2, 3]), self.list_objects())
  247. def test_repair_missing_index(self):
  248. self.add_objects([[1, 2, 3], [4, 5, 6]])
  249. self.delete_index()
  250. self.check(status=True)
  251. self.get_objects(4)
  252. self.assert_equal(set([1, 2, 3, 4, 5, 6]), self.list_objects())
  253. def test_repair_index_too_new(self):
  254. self.add_objects([[1, 2, 3], [4, 5, 6]])
  255. self.assert_equal(self.list_indices(), ['index.1'])
  256. self.rename_index('index.100')
  257. self.check(status=True)
  258. self.assert_equal(self.list_indices(), ['index.1'])
  259. self.get_objects(4)
  260. self.assert_equal(set([1, 2, 3, 4, 5, 6]), self.list_objects())
  261. def test_crash_before_compact(self):
  262. self.repository.put(bytes(32), b'data')
  263. self.repository.put(bytes(32), b'data2')
  264. # Simulate a crash before compact
  265. with patch.object(Repository, 'compact_segments') as compact:
  266. self.repository.commit()
  267. compact.assert_called_once()
  268. self.reopen()
  269. self.check(repair=True)
  270. self.assert_equal(self.repository.get(bytes(32)), b'data2')
  271. class RemoteRepositoryTestCase(RepositoryTestCase):
  272. def open(self, create=False):
  273. return RemoteRepository(Location('__testsuite__:' + os.path.join(self.tmppath, 'repository')), create=create)
  274. def test_invalid_rpc(self):
  275. self.assert_raises(InvalidRPCMethod, lambda: self.repository.call('__init__', None))
  276. class RemoteRepositoryCheckTestCase(RepositoryCheckTestCase):
  277. def open(self, create=False):
  278. return RemoteRepository(Location('__testsuite__:' + os.path.join(self.tmppath, 'repository')), create=create)