tahoe-lafs/src/allmydata/storageserver.py

123 lines
4.5 KiB
Python
Raw Normal View History

import os, re
from foolscap import Referenceable
from twisted.application import service
from zope.interface import implements
2007-03-30 03:19:52 +00:00
from allmydata.interfaces import RIStorageServer, RIBucketWriter
from allmydata import interfaces
from allmydata.util import bencode, fileutil, idlib
from allmydata.util.assertutil import _assert, precondition
2007-03-30 03:19:52 +00:00
# store/
# store/incoming # temp dirs named $VERIFIERID/$SHARENUM that will be moved to store/ on success
2007-03-30 03:19:52 +00:00
# store/$VERIFIERID
# store/$VERIFIERID/$SHARENUM
# store/$VERIFIERID/$SHARENUM/blocksize
# store/$VERIFIERID/$SHARENUM/data
# store/$VERIFIERID/$SHARENUM/blockhashes
# store/$VERIFIERID/$SHARENUM/sharehashtree
2007-03-30 03:19:52 +00:00
# $SHARENUM matches this regex:
NUM_RE=re.compile("[0-9]*")
2007-03-30 03:19:52 +00:00
class BucketWriter(Referenceable):
implements(RIBucketWriter)
def __init__(self, incominghome, finalhome, blocksize):
self.incominghome = incominghome
2007-03-30 03:19:52 +00:00
self.finalhome = finalhome
self.blocksize = blocksize
self.closed = False
fileutil.make_dirs(incominghome)
fileutil.make_dirs(finalhome)
2007-03-30 03:19:52 +00:00
self._write_file('blocksize', str(blocksize))
def _write_file(self, fname, data):
open(os.path.join(self.incominghome, fname), 'wb').write(data)
2007-03-30 03:19:52 +00:00
def remote_put_block(self, segmentnum, data):
precondition(not self.closed)
assert len(data) == self.blocksize
f = open(os.path.join(self.incominghome, 'data'), 'wb')
2007-03-30 03:19:52 +00:00
f.seek(self.blocksize*segmentnum)
f.write(data)
def remote_put_block_hashes(self, blockhashes):
precondition(not self.closed)
# TODO: verify the length of blockhashes.
# TODO: tighten foolscap schema to require exactly 32 bytes.
self._write_file('blockhashes', ''.join(blockhashes))
def remote_put_share_hashes(self, sharehashes):
precondition(not self.closed)
self._write_file('sharehashree', bencode.bencode(sharehashes))
def remote_close(self):
2007-03-30 03:19:52 +00:00
precondition(not self.closed)
# TODO assert or check the completeness and consistency of the data that has been written
fileutil.rename(self.incominghome, self.finalhome)
2007-03-30 03:19:52 +00:00
self.closed = True
def str2l(s):
""" split string (pulled from storage) into a list of blockids """
return [ s[i:i+interfaces.HASH_SIZE] for i in range(0, len(s), interfaces.HASH_SIZE) ]
class BucketReader(Referenceable):
def __init__(self, home):
self.home = home
self.blocksize = int(self._read_file('blocksize'))
def _read_file(self, fname):
return open(os.path.join(self.home, fname), 'rb').read()
def remote_get_block(self, blocknum):
f = open(os.path.join(self.home, 'data'), 'rb')
f.seek(self.blocksize * blocknum)
return f.read(self.blocksize) # this might be short for the last block
2007-03-30 03:19:52 +00:00
def remote_get_block_hashes(self):
return str2l(self._read_file('blockhashes'))
def remote_get_share_hashes(self):
return bencode.bdecode(self._read_file('sharehashes'))
class StorageServer(service.MultiService, Referenceable):
implements(RIStorageServer)
name = 'storageserver'
2007-03-30 03:19:52 +00:00
def __init__(self, storedir):
fileutil.make_dirs(storedir)
self.storedir = storedir
self.incomingdir = os.path.join(storedir, 'incoming')
self._clean_incomplete()
fileutil.make_dirs(self.incomingdir)
2007-03-30 03:19:52 +00:00
service.MultiService.__init__(self)
def _clean_incomplete(self):
fileutil.rm_dir(self.incomingdir)
2007-03-30 03:19:52 +00:00
def remote_allocate_buckets(self, verifierid, sharenums, sharesize,
blocksize, canary):
alreadygot = set()
bucketwriters = {} # k: shnum, v: BucketWriter
for shnum in sharenums:
incominghome = os.path.join(self.incomingdir,
idlib.b2a(verifierid) + "%d"%shnum)
finalhome = os.path.join(self.storedir, idlib.b2a(verifierid), "%d"%shnum)
if os.path.exists(incominghome) or os.path.exists(finalhome):
alreadygot.add(shnum)
else:
bucketwriters[shnum] = BucketWriter(incominghome, finalhome, blocksize)
2007-03-30 03:19:52 +00:00
return alreadygot, bucketwriters
def remote_get_buckets(self, verifierid):
2007-03-30 03:19:52 +00:00
bucketreaders = {} # k: sharenum, v: BucketReader
verifierdir = os.path.join(self.storedir, idlib.b2a(verifierid))
for f in os.listdir(verifierdir):
_assert(NUM_RE.match(f), f)
2007-03-30 03:19:52 +00:00
bucketreaders[int(f)] = BucketReader(os.path.join(verifierdir, f))
return bucketreaders