2007-01-05 04:52:51 +00:00
|
|
|
# -*- test-case-name: allmydata.test.test_encode_share -*-
|
|
|
|
|
|
|
|
from zope.interface import implements
|
2006-12-03 00:31:26 +00:00
|
|
|
from twisted.internet import defer
|
2006-12-03 10:01:43 +00:00
|
|
|
import sha
|
2007-01-05 04:52:51 +00:00
|
|
|
from allmydata.util import idlib, mathutil
|
2007-02-02 00:13:01 +00:00
|
|
|
from allmydata.util.assertutil import precondition
|
2007-01-12 03:57:14 +00:00
|
|
|
from allmydata.interfaces import ICodecEncoder, ICodecDecoder
|
2007-02-01 23:07:00 +00:00
|
|
|
import fec
|
2006-12-03 10:01:43 +00:00
|
|
|
|
|
|
|
def netstring(s):
    """Frame s as "<length>:<payload>,".

    The length prefix is len(s) formatted as a decimal integer and the
    payload is interpolated with %s, followed by a trailing comma.
    """
    size = len(s)
    return "%d:%s," % (size, s)
|
2006-12-03 00:31:26 +00:00
|
|
|
|
2007-02-01 23:07:00 +00:00
|
|
|
from base64 import b32encode
|
|
|
|
def ab(x): # debuggery
    """Return a short "<length>:<tail>" tag describing x, for debug output.

    The tail is the base32 encoding of the last three items of x (or of all
    of x when it is shorter than that); an empty x is tagged "--empty--".
    """
    size = len(x)
    if size == 0:
        tail = "--empty--"
    else:
        # slicing clamps, so x[-3:] is the whole of x when it has 1 or 2 items
        tail = b32encode(x[-3:])
    return "%s:%s" % (size, tail,)
|
|
|
|
|
|
|
|
|
2007-01-05 04:52:51 +00:00
|
|
|
class ReplicatingEncoder(object):
    """Codec encoder of type "rep": every output share is a copy of the input.

    encode() joins the input shares into one string and hands that same
    string out once for each requested share id.
    """
    implements(ICodecEncoder)
    ENCODER_TYPE = "rep"

    def set_params(self, data_size, required_shares, max_shares):
        """Record the encoding parameters.

        data_size: total length of the data given to one encode() call
        required_shares: divisor of data_size; encode() checks that each
            input share has length data_size / required_shares
        max_shares: number of shares produced when encode() is not told
            which share ids to generate

        Raises AssertionError if the parameters are inconsistent.
        """
        # required_shares must be positive so the divisibility check below
        # cannot divide by zero.
        assert 0 < required_shares <= max_shares, (required_shares, max_shares)
        # encode() insists that required_shares * len(inshare) == data_size,
        # so data_size has to be a whole multiple of required_shares (the
        # operands of this check used to be swapped).
        assert data_size % required_shares == 0, (data_size, required_shares)
        self.data_size = data_size
        self.required_shares = required_shares
        self.max_shares = max_shares

    def get_encoder_type(self):
        """Return the ENCODER_TYPE identifier of this codec."""
        return self.ENCODER_TYPE

    def get_serialized_params(self):
        """Return the parameters as a string: required_shares in decimal."""
        return "%d" % self.required_shares

    def get_share_size(self):
        """Return the size of one output share, which is data_size."""
        return self.data_size

    def encode(self, inshares, desired_shareids=None):
        """Replicate the joined input shares once per desired share id.

        inshares: list of str, each of length data_size / required_shares
        desired_shareids: share ids to produce; defaults to
            range(max_shares)

        Returns an already-fired Deferred whose result is the tuple
        (shares, desired_shareids).
        Raises AssertionError if inshares is not a list of correctly sized
        strings.
        """
        # Validate the argument itself. This used to test the local name
        # 'data' before it was assigned, which raised UnboundLocalError on
        # every call.
        assert isinstance(inshares, list)
        for inshare in inshares:
            assert isinstance(inshare, str)
            assert self.required_shares * len(inshare) == self.data_size
        data = "".join(inshares)
        if desired_shareids is None:
            desired_shareids = range(self.max_shares)
        shares = [data for _shareid in desired_shareids]
        return defer.succeed((shares, desired_shareids))
|
2007-01-05 04:52:51 +00:00
|
|
|
|
|
|
|
class ReplicatingDecoder(object):
    """Decoder registered alongside ReplicatingEncoder in all_encoders.

    decode() does no reconstruction work: it hands back the first share it
    was given.
    """
    implements(ICodecDecoder)

    def set_serialized_params(self, params):
        """Parse params, a string holding required_shares as an integer."""
        required = int(params)
        self.required_shares = required

    def get_required_shares(self):
        """Return the share count that decode() expects to receive."""
        return self.required_shares

    def decode(self, some_shares, their_shareids):
        """Return an already-fired Deferred for [some_shares[0]].

        Raises AssertionError unless exactly required_shares shares are
        supplied, with one share id per share.
        """
        share_count = len(some_shares)
        assert share_count == self.required_shares
        assert share_count == len(their_shareids)
        first_share = some_shares[0]
        return defer.succeed([first_share])
|
2007-01-05 04:52:51 +00:00
|
|
|
|
|
|
|
|
2006-12-03 00:31:26 +00:00
|
|
|
class Encoder(object):
    """Sends the entire contents of a file to every landlord bucket."""

    def __init__(self, infile, m):
        """Remember the file to read and m; k is fixed at 2."""
        self.infile, self.m = infile, m
        self.k = 2

    def do_upload(self, landlords):
        """Write the file's data to each remote bucket and close it.

        landlords: iterable of (peerid, bucket_num, remotebucket) tuples;
            only remotebucket is used here.

        Returns a DeferredList covering every 'write' and 'close' remote
        call, in the order they were issued.
        """
        pending = []
        payload = self.infile.read()
        for (_peerid, _bucket_num, bucket) in landlords:
            # 'write' is issued before 'close' for each bucket
            pending.extend([
                bucket.callRemote('write', payload),
                bucket.callRemote('close'),
            ])
        return defer.DeferredList(pending)
|
2006-12-03 10:01:43 +00:00
|
|
|
|
|
|
|
class Decoder(object):
    """Reads shares back from remote buckets and writes the data to a file."""

    def __init__(self, outfile, k, m, verifierid):
        """Store the output file, the k and m parameters and the expected
        verifierid (a false value disables the check in _got_all_data)."""
        self.outfile = outfile
        self.k, self.m = k, m
        self._verifierid = verifierid

    def start(self, buckets):
        """Issue a remote 'read' to the first k buckets.

        buckets: sequence of (bucketnum, bucket) pairs, at least k long.

        Returns a DeferredList that has _got_all_data attached as a
        callback.
        """
        assert len(buckets) >= self.k
        reads = [bucket.callRemote("read")
                 for (_bucketnum, bucket) in buckets[:self.k]]
        all_reads = defer.DeferredList(reads)
        all_reads.addCallback(self._got_all_data)
        return all_reads

    def _got_all_data(self, resultslist):
        """Write the first successfully read share to outfile and verify it.

        resultslist: (success, result) pairs as delivered by DeferredList.

        Raises AssertionError if fewer than k reads succeeded, or if a
        verifierid was supplied and does not match the hash of the data.
        """
        shares = []
        for (success, results) in resultslist:
            if success:
                shares.append(results)
        assert len(shares) >= self.k
        # here's where the Reed-Solomon magic takes place
        first_share = shares[0]
        self.outfile.write(first_share)
        hasher = sha.new(netstring("allmydata_v1_verifierid"))
        hasher.update(first_share)
        vid = hasher.digest()
        if not self._verifierid:
            # nothing to compare against
            return
        assert self._verifierid == vid, "%s != %s" % (idlib.b2a(self._verifierid), idlib.b2a(vid))
|
|
|
|
|
2007-01-05 04:52:51 +00:00
|
|
|
|
2007-02-01 23:07:00 +00:00
|
|
|
class CRSEncoder(object):
    """Codec encoder that delegates the actual encoding to fec.Encoder."""
    implements(ICodecEncoder)
    # key under which this codec is registered in all_encoders
    ENCODER_TYPE = 2

    def set_params(self, data_size, required_shares, max_shares):
        """Record the parameters, derive the share size and build the
        underlying fec.Encoder.

        Raises AssertionError if required_shares exceeds max_shares.
        """
        assert required_shares <= max_shares
        self.data_size = data_size
        self.required_shares = required_shares
        self.max_shares = max_shares
        # each share holds data_size / required_shares bytes, rounded up
        share_size = mathutil.div_ceil(data_size, required_shares)
        self.share_size = share_size
        self.last_share_padding = mathutil.pad_size(share_size, required_shares)
        self.encoder = fec.Encoder(required_shares, max_shares)

    def get_encoder_type(self):
        """Return the ENCODER_TYPE identifier of this codec."""
        return self.ENCODER_TYPE

    def get_serialized_params(self):
        """Return "data_size:required_shares:max_shares" in decimal."""
        params = (self.data_size, self.required_shares, self.max_shares)
        return "%d:%d:%d" % params

    def get_share_size(self):
        """Return the share size computed by set_params."""
        return self.share_size

    def encode(self, inshares, desired_share_ids=None):
        """Encode inshares into the shares named by desired_share_ids.

        inshares: input blocks, each exactly share_size long
        desired_share_ids: ids of the shares to produce (at most
            max_shares of them); defaults to range(max_shares)

        Returns an already-fired Deferred whose result is the tuple
        (shares, desired_share_ids).
        """
        ids_ok = desired_share_ids is None or len(desired_share_ids) <= self.max_shares
        precondition(ids_ok, desired_share_ids, self.max_shares)

        if desired_share_ids is None:
            desired_share_ids = range(self.max_shares)

        for block in inshares:
            assert len(block) == self.share_size, (len(block), self.share_size, self.data_size, self.required_shares)
        encoded = self.encoder.encode(inshares, desired_share_ids)

        return defer.succeed((encoded, desired_share_ids))
|
|
|
|
|
|
|
|
class CRSDecoder(object):
    """Codec decoder that delegates the actual decoding to fec.Decoder."""
    implements(ICodecDecoder)

    def set_serialized_params(self, params):
        """Parse a "data_size:required_shares:max_shares" string, derive the
        chunk and share sizes, and build the underlying fec.Decoder."""
        fields = params.split(":")
        self.data_size = int(fields[0])
        self.required_shares = int(fields[1])
        self.max_shares = int(fields[2])

        # chunk_size is defined to equal required_shares, and share_size to
        # equal the resulting number of chunks (rounded up)
        required = self.required_shares
        self.chunk_size = required
        chunk_count = mathutil.div_ceil(self.data_size, required)
        self.num_chunks = chunk_count
        self.share_size = chunk_count
        self.decoder = fec.Decoder(required, self.max_shares)
        if False:
            # disabled debug output
            print("chunk_size: %d" % self.chunk_size)
            print("num_chunks: %d" % self.num_chunks)
            print("share_size: %d" % self.share_size)
            print("max_shares: %d" % self.max_shares)
            print("required_shares: %d" % self.required_shares)

    def get_required_shares(self):
        """Return the share count that decode() expects to receive."""
        return self.required_shares

    def decode(self, some_shares, their_shareids):
        """Decode exactly required_shares shares via the fec decoder.

        some_shares and their_shareids must be the same length. Returns an
        already-fired Deferred carrying whatever fec.Decoder.decode returns.
        """
        share_count = len(some_shares)
        id_count = len(their_shareids)
        precondition(share_count == id_count, share_count, id_count)
        precondition(share_count == self.required_shares, share_count, self.required_shares)
        decoded = self.decoder.decode(some_shares, their_shareids)
        return defer.succeed(decoded)
|
2007-01-05 04:52:51 +00:00
|
|
|
|
|
|
|
|
|
|
|
# Codec registry: maps each encoder's ENCODER_TYPE to its
# (encoder class, decoder class) pair.
all_encoders = dict(
    (encoder_class.ENCODER_TYPE, (encoder_class, decoder_class))
    for (encoder_class, decoder_class) in (
        (ReplicatingEncoder, ReplicatingDecoder),
        (CRSEncoder, CRSDecoder),
    )
)
|
2007-01-17 04:29:59 +00:00
|
|
|
|
|
|
|
def get_decoder_by_name(name):
    """Return a new instance of the decoder registered under name.

    name is looked up as a key of all_encoders (an ENCODER_TYPE value);
    KeyError is raised if it is not registered.
    """
    codec_pair = all_encoders[name]
    # index 1 of each registry entry is the decoder class
    return codec_pair[1]()
|
|
|
|
|