123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222 |
- #!/usr/bin/env python
- import fcntl
- import tempfile
- import logging
- import os
- import posixpath
- import shutil
- import unittest
- import uuid
- log = logging.getLogger('')
- # FIXME: UUID
- class Repository(object):
- """
- """
- IDLE = 'Idle'
- OPEN = 'Open'
- ACTIVE = 'Active'
- VERSION = 'DEDUPSTORE REPOSITORY VERSION 1'
- def __init__(self, path):
- self.tid = -1
- self.state = Repository.IDLE
- if not os.path.exists(path):
- self.create(path)
- self.open(path)
-
- def create(self, path):
- log.info('Initializing Repository at "%s"' % path)
- os.mkdir(path)
- open(os.path.join(path, 'VERSION'), 'wb').write(self.VERSION)
- open(os.path.join(path, 'uuid'), 'wb').write(str(uuid.uuid4()))
- open(os.path.join(path, 'tid'), 'wb').write('0')
- os.mkdir(os.path.join(path, 'data'))
- def open(self, path):
- self.path = path
- if not os.path.isdir(path):
- raise Exception('%s Does not look like a repository')
- version_path = os.path.join(path, 'version')
- if not os.path.exists(version_path) or open(version_path, 'rb').read() != self.VERSION:
- raise Exception('%s Does not look like a repository2')
- self.uuid = open(os.path.join(path, 'uuid'), 'rb').read()
- self.lock_fd = open(os.path.join(path, 'lock'), 'w')
- fcntl.flock(self.lock_fd, fcntl.LOCK_EX)
- self.tid = int(open(os.path.join(path, 'tid'), 'r').read())
- self.recover()
- def recover(self):
- if os.path.exists(os.path.join(self.path, 'txn-active')):
- self.rollback()
- if os.path.exists(os.path.join(self.path, 'txn-commit')):
- self.apply_txn()
- if os.path.exists(os.path.join(self.path, 'txn-applied')):
- shutil.rmtree(os.path.join(self.path, 'txn-applied'))
- self.state = Repository.OPEN
- def close(self):
- self.recover()
- self.lock_fd.close()
- self.state = Repository.IDLE
- def commit(self):
- """
- """
- if self.state == Repository.OPEN:
- return
- assert self.state == Repository.ACTIVE
- remove_fd = open(os.path.join(self.path, 'txn-active', 'remove'), 'wb')
- remove_fd.write('\n'.join(self.txn_removed))
- remove_fd.close()
- add_fd = open(os.path.join(self.path, 'txn-active', 'add_index'), 'wb')
- add_fd.write('\n'.join(self.txn_added))
- add_fd.close()
- tid_fd = open(os.path.join(self.path, 'txn-active', 'tid'), 'wb')
- tid_fd.write(str(self.tid + 1))
- tid_fd.close()
- os.rename(os.path.join(self.path, 'txn-active'),
- os.path.join(self.path, 'txn-commit'))
- self.apply_txn()
- def apply_txn(self):
- assert os.path.isdir(os.path.join(self.path, 'txn-commit'))
- tid = int(open(os.path.join(self.path, 'txn-commit', 'tid'), 'rb').read())
- assert tid >= self.tid
- remove_list = [line.strip() for line in
- open(os.path.join(self.path, 'txn-commit', 'remove'), 'rb').readlines()]
- for name in remove_list:
- path = os.path.join(self.path, 'data', name)
- os.unlink(path)
- add_list = [line.strip() for line in
- open(os.path.join(self.path, 'txn-commit', 'add_index'), 'rb').readlines()]
- for name in add_list:
- destname = os.path.join(self.path, 'data', name)
- if not os.path.exists(os.path.dirname(destname)):
- os.makedirs(os.path.dirname(destname))
- shutil.move(os.path.join(self.path, 'txn-commit', 'add', name), destname)
- tid_fd = open(os.path.join(self.path, 'tid'), 'wb')
- tid_fd.write(str(tid))
- tid_fd.close()
- os.rename(os.path.join(self.path, 'txn-commit'),
- os.path.join(self.path, 'txn-applied'))
- shutil.rmtree(os.path.join(self.path, 'txn-applied'))
- self.state = Repository.OPEN
- def rollback(self):
- """
- """
- txn_path = os.path.join(self.path, 'txn-active')
- if os.path.exists(txn_path):
- shutil.rmtree(txn_path)
- self.state = Repository.OPEN
- def prepare_txn(self):
- if self.state == Repository.ACTIVE:
- return os.path.join(self.path, 'txn-active')
- elif self.state == Repository.OPEN:
- os.mkdir(os.path.join(self.path, 'txn-active'))
- os.mkdir(os.path.join(self.path, 'txn-active', 'add'))
- self.txn_removed = []
- self.txn_added = []
- self.state = Repository.ACTIVE
-
- def get_file(self, path):
- """
- """
- if os.path.exists(os.path.join(self.path, 'txn-active', 'add', path)):
- return open(os.path.join(self.path, 'txn-active', 'add', path), 'rb').read()
- elif os.path.exists(os.path.join(self.path, 'data', path)):
- return open(os.path.join(self.path, 'data', path), 'rb').read()
- else:
- raise Exception('FileNotFound: %s' % path)
- def put_file(self, path, data):
- """
- """
- self.prepare_txn()
- if os.path.exists(os.path.join(self.path, 'txn-active', 'add', path)):
- raise Exception('FileAlreadyExists: %s' % path)
- if path in self.txn_removed:
- self.txn_removed.remove(path)
- if path not in self.txn_added:
- self.txn_added.append(path)
- filename = os.path.join(self.path, 'txn-active', 'add', path)
- if not os.path.exists(os.path.dirname(filename)):
- os.makedirs(os.path.dirname(filename))
- fd = open(filename, 'wb')
- try:
- fd.write(data)
- finally:
- fd.close()
- def delete(self, path):
- """
- """
- self.prepare_txn()
- if os.path.exists(os.path.join(self.path, 'txn-active', 'add', path)):
- os.unlink(os.path.join(self.path, 'txn-active', 'add', path))
- elif os.path.exists(os.path.join(self.path, 'data', path)):
- self.txn_removed.append(path)
- else:
- raise Exception('FileNotFound: %s' % path)
- def listdir(self, path):
- """
- """
- entries = set(os.listdir(os.path.join(self.path, 'data', path)))
- if self.state == Repository.ACTIVE:
- txn_entries = set(os.listdir(os.path.join(self.path, 'txn-active', 'add', path)))
- entries = entries.union(txn_entries)
- for e in entries:
- if posixpath.join(path, e) in self.txn_removed:
- entries.remove(e)
- return list(entries)
- def mkdir(self, path):
- """
- """
- def rmdir(self, path):
- """
- """
- class RepositoryTestCase(unittest.TestCase):
-
- def setUp(self):
- self.tmppath = tempfile.mkdtemp()
- self.repo = Repository(os.path.join(self.tmppath, 'repo'))
- def tearDown(self):
- shutil.rmtree(self.tmppath)
-
- def test1(self):
- self.assertEqual(self.repo.tid, 0)
- self.assertEqual(self.repo.state, Repository.OPEN)
- self.assertEqual(self.repo.listdir(''), [])
- self.repo.put_file('foo', 'SOMEDATA')
- self.assertRaises(Exception, lambda: self.repo.put_file('foo', 'SOMETHINGELSE'))
- self.assertEqual(self.repo.get_file('foo'), 'SOMEDATA')
- self.assertEqual(self.repo.listdir(''), ['foo'])
- self.repo.rollback()
- self.assertEqual(self.repo.listdir(''), [])
- def test2(self):
- self.repo.put_file('foo', 'SOMEDATA')
- self.repo.put_file('bar', 'SOMEDATAbar')
- self.assertEqual(self.repo.listdir(''), ['foo', 'bar'])
- self.assertEqual(self.repo.get_file('foo'), 'SOMEDATA')
- self.repo.delete('foo')
- self.assertRaises(Exception, lambda: self.repo.get_file('foo'))
- self.assertEqual(self.repo.listdir(''), ['bar'])
- self.assertEqual(self.repo.state, Repository.ACTIVE)
- self.assertEqual(os.path.exists(os.path.join(self.tmppath, 'repo', 'data', 'bar')), False)
- self.repo.commit()
- self.assertEqual(os.path.exists(os.path.join(self.tmppath, 'repo', 'data', 'bar')), True)
- self.assertEqual(self.repo.listdir(''), ['bar'])
- self.assertEqual(self.repo.state, Repository.IDLE)
- if __name__ == '__main__':
- unittest.main()
|