tahoe-lafs/src/allmydata/test/test_encode_share.py
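"""
Tests for the share-encoding classes in allmydata.encode: a Tester mixin
exercises encode/decode round-trips (all shares in order, all shares
shuffled, a minimal subset, a random minimal subset, and decoder re-use)
against PyRSEncoder/PyRSDecoder and ReplicatingEncoder/ReplicatingDecoder.
A BenchPyRS benchmark class is included but deleted by default (see the
comment at the bottom of the file).
"""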

import os
import random
import time

from twisted.trial import unittest
from twisted.internet import defer
from twisted.python import log

from allmydata.encode import PyRSEncoder, PyRSDecoder, ReplicatingEncoder, ReplicatingDecoder

class Tester:
    #enc_class = PyRSEncoder
    #dec_class = PyRSDecoder
    def do_test(self, size, required_shares, total_shares):
        data0 = os.urandom(size)
        enc = self.enc_class()
        enc.set_params(size, required_shares, total_shares)
        serialized_params = enc.get_serialized_params()
        log.msg("serialized_params: %s" % serialized_params)
        d = enc.encode(data0)
        def _done(shares):
            self.failUnlessEqual(len(shares), total_shares)
            self.shares = shares
        d.addCallback(_done)

        def _decode(shares):
            dec = self.dec_class()
            dec.set_serialized_params(serialized_params)
            d1 = dec.decode(shares)
            return d1
        def _check_data(data1):
            self.failUnlessEqual(len(data1), len(data0))
            self.failUnless(data1 == data0)

        def _decode_all_ordered(res):
            log.msg("_decode_all_ordered")
            # can we decode using all of the shares?
            return _decode(self.shares)
        d.addCallback(_decode_all_ordered)
        d.addCallback(_check_data)

        def _decode_all_shuffled(res):
            log.msg("_decode_all_shuffled")
            # can we decode, using all the shares, but in random order?
            shuffled_shares = self.shares[:]
            random.shuffle(shuffled_shares)
            return _decode(shuffled_shares)
        d.addCallback(_decode_all_shuffled)
        d.addCallback(_check_data)

        def _decode_some(res):
            log.msg("_decode_some")
            # decode with a minimal subset of the shares
            some_shares = self.shares[:required_shares]
            return _decode(some_shares)
        d.addCallback(_decode_some)
        d.addCallback(_check_data)

        def _decode_some_random(res):
            log.msg("_decode_some_random")
            # use a randomly-selected minimal subset
            some_shares = random.sample(self.shares, required_shares)
            return _decode(some_shares)
        d.addCallback(_decode_some_random)
        d.addCallback(_check_data)

        def _decode_multiple(res):
            log.msg("_decode_multiple")
            # make sure we can re-use the decoder object
            shares1 = random.sample(self.shares, required_shares)
            shares2 = random.sample(self.shares, required_shares)
            dec = self.dec_class()
            dec.set_serialized_params(serialized_params)
            d1 = dec.decode(shares1)
            d1.addCallback(_check_data)
            d1.addCallback(lambda res: dec.decode(shares2))
            d1.addCallback(_check_data)
            return d1
        d.addCallback(_decode_multiple)

        return d
    def test_encode(self):
        if os.uname()[1] == "slave3" and self.enc_class == PyRSEncoder:
            raise unittest.SkipTest("slave3 is really slow")
        return self.do_test(1000, 25, 100)

    def test_encode1(self):
        return self.do_test(8, 8, 16)

    def test_encode2(self):
        if os.uname()[1] == "slave3" and self.enc_class == PyRSEncoder:
            raise unittest.SkipTest("slave3 is really slow")
        return self.do_test(123, 25, 100)

    def test_sizes(self):
        raise unittest.SkipTest("omg this would take forever")
        d = defer.succeed(None)
        for i in range(1, 100):
            # addCallback passes the extra argument (i) to the lambda as 'size'
            d.addCallback(lambda res, size: self.do_test(size, 4, 10), i)
        return d

class PyRS(unittest.TestCase, Tester):
    enc_class = PyRSEncoder
    dec_class = PyRSDecoder

class Replicating(unittest.TestCase, Tester):
    enc_class = ReplicatingEncoder
    dec_class = ReplicatingDecoder

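# Additional codec implementations can reuse the same battery of tests by
# mixing Tester into a TestCase and pointing enc_class/dec_class at the new
# classes, exactly as PyRS and Replicating do above. A minimal sketch
# (SomeEncoder/SomeDecoder are hypothetical placeholders, not classes that
# exist in allmydata.encode):
#
#   class SomeCodec(unittest.TestCase, Tester):
#       enc_class = SomeEncoder
#       dec_class = SomeDecoder
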
class BenchPyRS(unittest.TestCase):
    enc_class = PyRSEncoder

    def test_big(self):
        size = 10000
        required_shares = 25
        total_shares = 100
        # this lets us use a persistent lookup table, stored outside the
        # _trial_temp directory (which is deleted each time trial is run)
        os.symlink("../ffield.lut.8", "ffield.lut.8")
        enc = self.enc_class()
        self.start()
        enc.set_params(size, required_shares, total_shares)
        serialized_params = enc.get_serialized_params()
        print "encoder ready", self.stop()
        self.start()
        data0 = os.urandom(size)
        print "data ready", self.stop()
        self.start()
        d = enc.encode(data0)
        def _done(shares):
            print "shares ready", self.stop()
            self.start()
            self.failUnlessEqual(len(shares), total_shares)
        d.addCallback(_done)
        d.addCallback(lambda res: enc.encode(data0))
        d.addCallback(_done)
        d.addCallback(lambda res: enc.encode(data0))
        d.addCallback(_done)
        return d

    def start(self):
        self.start_time = time.time()

    def stop(self):
        self.end_time = time.time()
        return (self.end_time - self.start_time)

# to benchmark the encoder, delete this line
del BenchPyRS
# and then run 'make test TEST=allmydata.test.test_encode_share.BenchPyRS'
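
# For reference, the encoder/decoder API exercised by these tests, used
# outside the trial harness (a minimal sketch based only on the calls shown
# above; encode() and decode() return Deferreds, so results are consumed via
# addCallback rather than assumed to fire synchronously):
#
#   enc = PyRSEncoder()
#   enc.set_params(1000, 25, 100)
#   params = enc.get_serialized_params()
#   d = enc.encode(os.urandom(1000))
#   def _decode(shares):
#       dec = PyRSDecoder()
#       dec.set_serialized_params(params)
#       return dec.decode(random.sample(shares, 25))
#   d.addCallback(_decode)
#   # the decoded result should equal the original input data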