2007-01-05 04:52:51 +00:00
|
|
|
|
2007-01-06 01:53:22 +00:00
|
|
|
import os, time
|
2007-01-05 04:52:51 +00:00
|
|
|
from twisted.trial import unittest
|
|
|
|
from twisted.internet import defer
|
2007-01-05 07:06:42 +00:00
|
|
|
from twisted.python import log
|
2007-01-12 03:51:27 +00:00
|
|
|
from allmydata.codec import PyRSEncoder, PyRSDecoder, ReplicatingEncoder, ReplicatingDecoder
|
2007-01-05 04:52:51 +00:00
|
|
|
import random
|
|
|
|
|
|
|
|
class Tester:
|
|
|
|
#enc_class = PyRSEncoder
|
|
|
|
#dec_class = PyRSDecoder
|
|
|
|
|
2007-01-16 04:22:22 +00:00
|
|
|
def do_test(self, size, required_shares, max_shares, fewer_shares=None):
|
2007-01-05 04:52:51 +00:00
|
|
|
data0 = os.urandom(size)
|
|
|
|
enc = self.enc_class()
|
2007-01-16 04:22:22 +00:00
|
|
|
enc.set_params(size, required_shares, max_shares)
|
2007-01-05 04:52:51 +00:00
|
|
|
serialized_params = enc.get_serialized_params()
|
2007-01-05 07:06:42 +00:00
|
|
|
log.msg("serialized_params: %s" % serialized_params)
|
2007-01-05 04:52:51 +00:00
|
|
|
d = enc.encode(data0)
|
2007-01-16 04:22:22 +00:00
|
|
|
def _done_encoding_all(shares):
|
|
|
|
self.failUnlessEqual(len(shares), max_shares)
|
2007-01-05 04:52:51 +00:00
|
|
|
self.shares = shares
|
2007-01-16 04:22:22 +00:00
|
|
|
d.addCallback(_done_encoding_all)
|
|
|
|
if fewer_shares is not None:
|
|
|
|
# also validate that the num_shares= parameter works
|
|
|
|
d.addCallback(lambda res: enc.encode(data0, fewer_shares))
|
|
|
|
def _check_fewer_shares(some_shares):
|
|
|
|
self.failUnlessEqual(len(some_shares), fewer_shares)
|
|
|
|
d.addCallback(_check_fewer_shares)
|
2007-01-05 04:52:51 +00:00
|
|
|
|
|
|
|
def _decode(shares):
|
|
|
|
dec = self.dec_class()
|
|
|
|
dec.set_serialized_params(serialized_params)
|
|
|
|
d1 = dec.decode(shares)
|
|
|
|
return d1
|
|
|
|
|
|
|
|
def _check_data(data1):
|
|
|
|
self.failUnlessEqual(len(data1), len(data0))
|
|
|
|
self.failUnless(data1 == data0)
|
|
|
|
|
|
|
|
def _decode_all_ordered(res):
|
2007-01-05 07:06:42 +00:00
|
|
|
log.msg("_decode_all_ordered")
|
2007-01-05 04:52:51 +00:00
|
|
|
# can we decode using all of the shares?
|
|
|
|
return _decode(self.shares)
|
|
|
|
d.addCallback(_decode_all_ordered)
|
|
|
|
d.addCallback(_check_data)
|
|
|
|
|
|
|
|
def _decode_all_shuffled(res):
|
2007-01-05 07:06:42 +00:00
|
|
|
log.msg("_decode_all_shuffled")
|
2007-01-05 04:52:51 +00:00
|
|
|
# can we decode, using all the shares, but in random order?
|
|
|
|
shuffled_shares = self.shares[:]
|
|
|
|
random.shuffle(shuffled_shares)
|
|
|
|
return _decode(shuffled_shares)
|
|
|
|
d.addCallback(_decode_all_shuffled)
|
|
|
|
d.addCallback(_check_data)
|
2007-01-05 07:06:42 +00:00
|
|
|
|
2007-01-05 04:52:51 +00:00
|
|
|
def _decode_some(res):
|
2007-01-05 07:06:42 +00:00
|
|
|
log.msg("_decode_some")
|
2007-01-05 04:52:51 +00:00
|
|
|
# decode with a minimal subset of the shares
|
|
|
|
some_shares = self.shares[:required_shares]
|
|
|
|
return _decode(some_shares)
|
|
|
|
d.addCallback(_decode_some)
|
|
|
|
d.addCallback(_check_data)
|
|
|
|
|
|
|
|
def _decode_some_random(res):
|
2007-01-05 07:06:42 +00:00
|
|
|
log.msg("_decode_some_random")
|
2007-01-05 04:52:51 +00:00
|
|
|
# use a randomly-selected minimal subset
|
|
|
|
some_shares = random.sample(self.shares, required_shares)
|
|
|
|
return _decode(some_shares)
|
|
|
|
d.addCallback(_decode_some_random)
|
|
|
|
d.addCallback(_check_data)
|
|
|
|
|
|
|
|
def _decode_multiple(res):
|
2007-01-05 07:06:42 +00:00
|
|
|
log.msg("_decode_multiple")
|
2007-01-05 04:52:51 +00:00
|
|
|
# make sure we can re-use the decoder object
|
|
|
|
shares1 = random.sample(self.shares, required_shares)
|
|
|
|
shares2 = random.sample(self.shares, required_shares)
|
|
|
|
dec = self.dec_class()
|
|
|
|
dec.set_serialized_params(serialized_params)
|
|
|
|
d1 = dec.decode(shares1)
|
|
|
|
d1.addCallback(_check_data)
|
|
|
|
d1.addCallback(lambda res: dec.decode(shares2))
|
|
|
|
d1.addCallback(_check_data)
|
|
|
|
return d1
|
|
|
|
d.addCallback(_decode_multiple)
|
|
|
|
|
|
|
|
return d
|
|
|
|
|
|
|
|
def test_encode(self):
|
2007-01-05 07:42:52 +00:00
|
|
|
if os.uname()[1] == "slave3" and self.enc_class == PyRSEncoder:
|
|
|
|
raise unittest.SkipTest("slave3 is really slow")
|
2007-01-05 04:52:51 +00:00
|
|
|
return self.do_test(1000, 25, 100)
|
|
|
|
|
2007-01-05 06:50:21 +00:00
|
|
|
def test_encode1(self):
|
|
|
|
return self.do_test(8, 8, 16)
|
|
|
|
|
2007-01-05 07:06:42 +00:00
|
|
|
def test_encode2(self):
|
2007-01-05 07:42:52 +00:00
|
|
|
if os.uname()[1] == "slave3" and self.enc_class == PyRSEncoder:
|
|
|
|
raise unittest.SkipTest("slave3 is really slow")
|
2007-01-16 04:22:22 +00:00
|
|
|
return self.do_test(123, 25, 100, 90)
|
2007-01-05 07:06:42 +00:00
|
|
|
|
2007-01-05 04:52:51 +00:00
|
|
|
def test_sizes(self):
|
2007-01-05 06:50:21 +00:00
|
|
|
raise unittest.SkipTest("omg this would take forever")
|
2007-01-05 04:52:51 +00:00
|
|
|
d = defer.succeed(None)
|
|
|
|
for i in range(1, 100):
|
|
|
|
d.addCallback(lambda res,size: self.do_test(size, 4, 10), i)
|
|
|
|
return d
|
|
|
|
|
|
|
|
class PyRS(unittest.TestCase, Tester):
|
|
|
|
enc_class = PyRSEncoder
|
|
|
|
dec_class = PyRSDecoder
|
|
|
|
|
|
|
|
class Replicating(unittest.TestCase, Tester):
|
|
|
|
enc_class = ReplicatingEncoder
|
|
|
|
dec_class = ReplicatingDecoder
|
2007-01-06 01:46:03 +00:00
|
|
|
|
|
|
|
|
|
|
|
class BenchPyRS(unittest.TestCase):
|
|
|
|
enc_class = PyRSEncoder
|
|
|
|
def test_big(self):
|
|
|
|
size = 10000
|
|
|
|
required_shares = 25
|
2007-01-16 04:22:22 +00:00
|
|
|
max_shares = 100
|
2007-01-06 01:46:03 +00:00
|
|
|
# this lets us use a persistent lookup table, stored outside the
|
|
|
|
# _trial_temp directory (which is deleted each time trial is run)
|
|
|
|
os.symlink("../ffield.lut.8", "ffield.lut.8")
|
|
|
|
enc = self.enc_class()
|
|
|
|
self.start()
|
2007-01-16 04:22:22 +00:00
|
|
|
enc.set_params(size, required_shares, max_shares)
|
2007-01-06 01:46:03 +00:00
|
|
|
serialized_params = enc.get_serialized_params()
|
|
|
|
print "encoder ready", self.stop()
|
|
|
|
self.start()
|
|
|
|
data0 = os.urandom(size)
|
|
|
|
print "data ready", self.stop()
|
|
|
|
self.start()
|
|
|
|
d = enc.encode(data0)
|
|
|
|
def _done(shares):
|
|
|
|
now_shares = time.time()
|
|
|
|
print "shares ready", self.stop()
|
|
|
|
self.start()
|
2007-01-16 04:22:22 +00:00
|
|
|
self.failUnlessEqual(len(shares), max_shares)
|
2007-01-06 01:46:03 +00:00
|
|
|
d.addCallback(_done)
|
|
|
|
d.addCallback(lambda res: enc.encode(data0))
|
|
|
|
d.addCallback(_done)
|
|
|
|
d.addCallback(lambda res: enc.encode(data0))
|
|
|
|
d.addCallback(_done)
|
|
|
|
return d
|
|
|
|
|
|
|
|
def start(self):
|
|
|
|
self.start_time = time.time()
|
|
|
|
|
|
|
|
def stop(self):
|
|
|
|
self.end_time = time.time()
|
|
|
|
return (self.end_time - self.start_time)
|
|
|
|
|
|
|
|
|
|
|
|
# to benchmark the encoder, delete this line
|
|
|
|
del BenchPyRS
|
|
|
|
# and then run 'make test TEST=allmydata.test.test_encode_share.BenchPyRS'
|