tahoe-lafs/src/allmydata/test/test_system.py

401 lines
17 KiB
Python
Raw Normal View History

2007-03-29 21:31:55 +00:00
import os
from cStringIO import StringIO
from twisted.trial import unittest
from twisted.internet import defer, reactor
from twisted.application import service
from allmydata import client, uri, download, upload
2007-06-01 01:31:01 +00:00
from allmydata.introducer_and_vdrive import IntroducerAndVdrive
from allmydata.util import idlib, fileutil, testutil
from allmydata.scripts import runner
from foolscap.eventual import flushEventualQueue
from twisted.python import log
from twisted.python.failure import Failure
2006-12-07 19:48:06 +00:00
from twisted.web.client import getPage
from twisted.web.error import PageRedirect
def flush_but_dont_ignore(res):
    """Flush the eventual-send queue, then hand back `res` unchanged.

    Intended for use with addBoth(): whatever result (or Failure) came in
    is what comes out once flushEventualQueue() has fired, so the flush
    does not hide the outcome of the preceding callbacks.
    """
    flushed = flushEventualQueue()
    # discard the flush result and substitute the value we were given
    flushed.addCallback(lambda ignored: res)
    return flushed
# System-level tests. Each test picks a basedir, then calls set_up_nodes() to
# start an IntroducerAndVdrive service plus several client.Client nodes, all
# parented to the MultiService created in setUp() and stopped in tearDown().
class SystemTest(testutil.SignalMixin, unittest.TestCase):
def setUp(self):
    """Create and start the MultiService that parents this test's services."""
    parent = service.MultiService()
    self.sparent = parent
    parent.startService()
def tearDown(self):
    """Stop the parent service, then flush the eventual-send queue.

    Returns the Deferred from stopService(); flush_but_dont_ignore is
    attached with addBoth so it runs on success and on failure alike.
    """
    log.msg("shutting down SystemTest services")
    # addBoth() returns the Deferred it was called on
    return self.sparent.stopService().addBoth(flush_but_dont_ignore)
def getdir(self, subdir):
    """Return the path of `subdir` underneath this test's self.basedir."""
    base = self.basedir
    return os.path.join(base, subdir)
2006-12-03 07:56:27 +00:00
def add_service(self, s):
    """Parent service `s` to self.sparent and return `s` for convenience."""
    parent = self.sparent
    s.setServiceParent(parent)
    return s
2006-12-03 07:56:27 +00:00
def set_up_nodes(self, NUMCLIENTS=5):
    """Start the introducer/vdrive service, then the client nodes.

    Records NUMCLIENTS in self.numclients, creates the
    "introducer_and_vdrive" directory under the test basedir if needed,
    starts an IntroducerAndVdrive there, and returns a Deferred that
    continues in _set_up_nodes_2 once its tub is ready.
    """
    self.numclients = NUMCLIENTS
    workdir = self.getdir("introducer_and_vdrive")
    if not os.path.isdir(workdir):
        fileutil.make_dirs(workdir)
    # add_service() returns the service it was given
    self.introducer_and_vdrive = self.add_service(
        IntroducerAndVdrive(basedir=workdir))
    ready = self.introducer_and_vdrive.when_tub_ready()
    ready.addCallback(self._set_up_nodes_2)
    return ready
def _set_up_nodes_2(self, res):
    """Create and start self.numclients client nodes.

    Called once the introducer/vdrive tub is ready. Records the
    introducer and vdrive FURLs, writes them into each client's basedir,
    starts one client.Client per basedir (parented to self.sparent), and
    returns a Deferred that fires after wait_for_connections() succeeds
    and self.webish_url has been set from client 0's web listener.
    """
    def _write_file(path, contents):
        # close the file explicitly instead of relying on garbage
        # collection to flush and release it
        f = open(path, "w")
        try:
            f.write(contents)
        finally:
            f.close()

    q = self.introducer_and_vdrive
    self.introducer_furl = q.urls["introducer"]
    self.vdrive_furl = q.urls["vdrive"]
    self.clients = []
    for i in range(self.numclients):
        basedir = self.getdir("client%d" % i)
        if not os.path.isdir(basedir):
            fileutil.make_dirs(basedir)
        if i == 0:
            # only the first client gets a web port; port 0 lets the OS
            # choose, and _connected (below) looks up the real number
            _write_file(os.path.join(basedir, "webport"),
                        "tcp:0:interface=127.0.0.1")
        _write_file(os.path.join(basedir, "introducer.furl"),
                    self.introducer_furl)
        _write_file(os.path.join(basedir, "vdrive.furl"),
                    self.vdrive_furl)
        c = self.add_service(client.Client(basedir=basedir))
        self.clients.append(c)
    log.msg("STARTING")
    d = self.wait_for_connections()
    def _connected(res):
        log.msg("CONNECTED")
        # now find out where the web port was
        l = self.clients[0].getServiceNamed("webish").listener
        port = l._port.getHost().port
        self.webish_url = "http://localhost:%d/" % port
    d.addCallback(_connected)
    return d
def add_extra_node(self, client_num):
    """Start one more client node that is not parented to self.sparent.

    The node's basedir is "client<client_num>" under the test basedir.
    The new client is appended to self.clients and self.numclients is
    incremented. Returns a Deferred that fires with the new client once
    wait_for_connections() succeeds. The caller is responsible for
    stopping the returned node.
    """
    # this node is *not* parented to our self.sparent, so we can shut it
    # down separately from the rest, to exercise the connection-lost code
    def _write_file(path, contents):
        # close the file explicitly instead of relying on garbage
        # collection to flush and release it
        f = open(path, "w")
        try:
            f.write(contents)
        finally:
            f.close()

    basedir = self.getdir("client%d" % client_num)
    if not os.path.isdir(basedir):
        fileutil.make_dirs(basedir)
    _write_file(os.path.join(basedir, "introducer.furl"),
                self.introducer_furl)
    _write_file(os.path.join(basedir, "vdrive.furl"), self.vdrive_furl)
    c = client.Client(basedir=basedir)
    self.clients.append(c)
    self.numclients += 1
    c.startService()
    d = self.wait_for_connections()
    d.addCallback(lambda res: c)
    return d
2006-12-03 07:56:27 +00:00
def wait_for_connections(self, ignored=None):
    """Poll until every client in self.clients sees self.numclients peers.

    If any client has no introducer_client yet, or reports a number of
    peer ids different from self.numclients, schedule another check in
    0.05 seconds and return the Deferred for it. Otherwise return an
    already-fired Deferred. `ignored` lets this method be used directly
    as a Deferred callback.
    """
    def _still_connecting(node):
        # same short-circuit order as a plain "or": only ask for the
        # peer ids when the introducer client exists
        if not node.introducer_client:
            return True
        return len(list(node.get_all_peerids())) != self.numclients

    for node in self.clients:
        if _still_connecting(node):
            retry = defer.Deferred()
            retry.addCallback(self.wait_for_connections)
            reactor.callLater(0.05, retry.callback, None)
            return retry
    return defer.succeed(None)
def test_connections(self):
    """Start five clients plus one extra node and check everyone sees six.

    The extra node is started outside self.sparent, so it is stopped
    explicitly at the end of the chain whether or not the check passed.
    """
    self.basedir = "test_system/SystemTest/test_connections"
    d = self.set_up_nodes()
    self.extra_node = None
    d.addCallback(lambda res: self.add_extra_node(5))
    def _check(extra_node):
        self.extra_node = extra_node
        for c in self.clients:
            self.failUnlessEqual(len(list(c.get_all_peerids())), 6)
    d.addCallback(_check)
    def _shutdown_extra_node(res):
        if self.extra_node:
            # This runs via addBoth, so `res` may be a Failure from
            # _check. Pass it through after the node has stopped;
            # returning stopService()'s own result here would replace
            # the Failure with a success and hide the test failure.
            d1 = defer.maybeDeferred(self.extra_node.stopService)
            d1.addCallback(lambda ignored: res)
            return d1
        return res
    d.addBoth(_shutdown_extra_node)
    return d
test_connections.timeout = 300
# test_connections is subsumed by test_upload_and_download, and takes
# quite a while to run on a slow machine (because of all the TLS
# connections that must be established). If we ever rework the introducer
# code to such an extent that we're not sure if it works anymore, we can
# reinstate this test until it does.
del test_connections
def test_upload_and_download(self):
    """Upload data from client 0, then download it several ways.

    The chain uploads DATA twice through client 0's "uploader" service,
    downloads it through client 1's "downloader" service to memory, to a
    named file, and to an open filehandle (checking each copy against
    DATA), and finally checks that a mangled URI fails with
    NotEnoughPeersError.
    """
    self.basedir = "test_system/SystemTest/test_upload_and_download"
    # we use 4000 bytes of data, which will result in about 400k written
    # to disk among all our simulated nodes
    DATA = "Some data to upload\n" * 200
    d = self.set_up_nodes()

    def _read_file(path):
        # read the whole file and close it explicitly
        f = open(path, "rb")
        try:
            return f.read()
        finally:
            f.close()

    def _do_upload(res):
        log.msg("UPLOADING")
        u = self.clients[0].getServiceNamed("uploader")
        self.uploader = u
        # we crank the max segsize down to 1024b for the duration of this
        # test, so we can exercise multiple segments. It is important
        # that the file size is not a multiple of the segment size, so
        # that the tail segment is not the same length as the others.
        # The segment size actually gets rounded up to 1025 to be a
        # multiple of the number of required shares (since we use 25 out
        # of 100 FEC).
        options = {"max_segment_size": 1024}
        d1 = u.upload_data(DATA, options)
        return d1
    d.addCallback(_do_upload)
    def _upload_done(new_uri):
        log.msg("upload finished: uri is %s" % (new_uri,))
        self.uri = new_uri
        dl = self.clients[1].getServiceNamed("downloader")
        self.downloader = dl
    d.addCallback(_upload_done)
    def _upload_again(res):
        # upload again. This ought to be short-circuited, however with
        # the way we currently generate URIs (i.e. because they include
        # the roothash), we have to do all of the encoding work, and only
        # get to save on the upload part.
        log.msg("UPLOADING AGAIN")
        options = {"max_segment_size": 1024}
        d1 = self.uploader.upload_data(DATA, options)
        # return the Deferred so the chain waits for the second upload
        # and a failure in it fails the test instead of being dropped
        return d1
    d.addCallback(_upload_again)
    def _download_to_data(res):
        log.msg("DOWNLOADING")
        return self.downloader.download_to_data(self.uri)
    d.addCallback(_download_to_data)
    def _download_to_data_done(data):
        log.msg("download finished")
        self.failUnlessEqual(data, DATA)
    d.addCallback(_download_to_data_done)
    target_filename = os.path.join(self.basedir, "download.target")
    def _download_to_filename(res):
        return self.downloader.download_to_filename(self.uri,
                                                    target_filename)
    d.addCallback(_download_to_filename)
    def _download_to_filename_done(res):
        newdata = _read_file(target_filename)
        self.failUnlessEqual(newdata, DATA)
    d.addCallback(_download_to_filename_done)
    target_filename2 = os.path.join(self.basedir, "download.target2")
    def _download_to_filehandle(res):
        fh = open(target_filename2, "wb")
        return self.downloader.download_to_filehandle(self.uri, fh)
    d.addCallback(_download_to_filehandle)
    def _download_to_filehandle_done(fh):
        # close the handle before reading the file back
        fh.close()
        newdata = _read_file(target_filename2)
        self.failUnlessEqual(newdata, DATA)
    d.addCallback(_download_to_filehandle_done)
    def _download_nonexistent_uri(res):
        baduri = self.mangle_uri(self.uri)
        d1 = self.downloader.download_to_data(baduri)
        def _baduri_should_fail(res):
            # attached with addBoth: a successful download arrives here
            # as a non-Failure and trips the first assertion
            self.failUnless(isinstance(res, Failure))
            self.failUnless(res.check(download.NotEnoughPeersError),
                            "expected NotEnoughPeersError, got %s" % res)
            # TODO: files that have zero peers should get a special kind
            # of NotEnoughPeersError, which can be used to suggest that
            # the URI might be wrong or that they've never uploaded the
            # file in the first place.
        d1.addBoth(_baduri_should_fail)
        return d1
    d.addCallback(_download_nonexistent_uri)
    return d
test_upload_and_download.timeout = 4800
2006-12-03 07:56:27 +00:00
def flip_bit(self, good):
    """Return `good` with the lowest bit of its final character inverted."""
    head, tail = good[:-1], good[-1]
    return head + chr(ord(tail) ^ 0x01)
def mangle_uri(self, gooduri):
    """Return a copy of `gooduri` whose storage index has one bit flipped."""
    # change the storage index, which means we'll be asking about the
    # wrong file, so nobody will have any shares
    fields = uri.unpack_uri(gooduri)
    storage_index = fields['storage_index']
    assert len(storage_index) == 32
    fields['storage_index'] = self.flip_bit(storage_index)
    return uri.pack_uri(**fields)
2007-06-08 22:59:16 +00:00
# TODO: add a test which mangles the uri_extension_hash instead, and
# should fail due to not being able to get a valid uri_extension block.
# Also a test which sneakily mangles the uri_extension block to change
# some of the validation data, so it will fail in the post-download phase
# when the file's crypttext integrity check fails. Do the same thing for
# the key, which should cause the download to fail the post-download
# plaintext_hash check.
def test_vdrive(self):
    """Publish a file into the vdrive from client 0 and read it from client 1.

    After the round trip succeeds, the same grid is reused by _test_web
    and _test_runner, which are chained onto the returned Deferred.
    """
    self.basedir = "test_system/SystemTest/test_vdrive"
    DATA = "Some data to publish to the virtual drive\n"
    self.data = DATA
    d = self.set_up_nodes()

    def _do_publish(res):
        log.msg("PUBLISHING")
        uploadable = upload.Data(DATA)
        publisher = self.clients[0]

        def _add_file(subdir1_node):
            return subdir1_node.add_file("mydata567", uploadable)

        def _stash_uri(filenode):
            # remember the URI so _test_web can download by URI later
            self.uri = filenode.get_uri()
            return filenode

        publishing = publisher._vdrive_root.create_empty_directory("subdir1")
        publishing.addCallback(_add_file)
        publishing.addCallback(_stash_uri)
        return publishing
    d.addCallback(_do_publish)

    def _publish_done(filenode):
        log.msg("publish finished")
        reader = self.clients[1]

        def _get_file(subdir1):
            return subdir1.get("mydata567")

        def _download(filenode):
            return filenode.download_to_data()

        fetching = reader._vdrive_root.get("subdir1")
        fetching.addCallback(_get_file)
        fetching.addCallback(_download)
        return fetching
    d.addCallback(_publish_done)

    def _get_done(data):
        log.msg("get finished")
        self.failUnlessEqual(data, DATA)
    d.addCallback(_get_done)

    for followup in (self._test_web, self._test_runner):
        d.addCallback(followup)
    return d
test_vdrive.timeout = 1100
2006-12-07 19:48:06 +00:00
def _test_web(self, res):
    """Exercise client 0's web interface at self.webish_url.

    Checks the welcome page, the vdrive directory listing for subdir1,
    a file download by path, two forms of download-by-URI, and the
    redirect produced by the download form. Relies on self.data and
    self.uri having been set by test_vdrive. Returns a Deferred.
    """
    base = self.webish_url
    d = getPage(base)
    def _got_welcome(page):
        expected = "Connected Peers: <span>%d</span>" % (self.numclients)
        self.failUnless(expected in page,
                        "I didn't see the right 'connected peers' message "
                        "in: %s" % page
                        )
        expected = "My nodeid: <span>%s</span>" % idlib.b2a(self.clients[0].nodeid)
        self.failUnless(expected in page,
                        "I didn't see the right 'My nodeid' message "
                        "in: %s" % page)
    d.addCallback(_got_welcome)
    d.addCallback(lambda res: getPage(base + "global_vdrive"))
    d.addCallback(lambda res: getPage(base + "global_vdrive/subdir1"))
    def _got_subdir1(page):
        # there ought to be an href for our file
        self.failUnless(("<td>%d</td>" % len(self.data)) in page)
        self.failUnless(">mydata567</a>" in page)
    d.addCallback(_got_subdir1)
    d.addCallback(lambda res:
                  getPage(base + "global_vdrive/subdir1/mydata567"))
    def _got_data(page):
        self.failUnlessEqual(page, self.data)
    d.addCallback(_got_data)

    # download from a URI embedded in a URL
    def _get_from_uri(res):
        return getPage(base + "download_uri/%s?filename=%s"
                       % (self.uri, "mydata567"))
    d.addCallback(_get_from_uri)
    def _got_from_uri(page):
        self.failUnlessEqual(page, self.data)
    d.addCallback(_got_from_uri)

    # download from a URI embedded in a URL, second form
    def _get_from_uri2(res):
        return getPage(base + "download_uri?uri=%s" % (self.uri,))
    d.addCallback(_get_from_uri2)
    def _got_from_uri2(page):
        self.failUnlessEqual(page, self.data)
    d.addCallback(_got_from_uri2)

    # download from a URI pasted into a form. Use POST, build a
    # multipart/form-data, submit it. This actually redirects us to a
    # /download_uri?uri=%s URL, and twisted.web.client doesn't seem to
    # handle POST redirects very well (it does a second POST instead of
    # the GET that a browser seems to do), so we just verify that we get
    # the right redirect response.
    def _get_from_form(res):
        url = base + "welcome/freeform_post!!download"
        # In multipart bodies each delimiter line is "--" followed by the
        # boundary named in the Content-Type header, so the header must
        # carry the boundary *without* that leading "--". The delimiter
        # lines sent in the body are the same 40 dashes + "boogabooga"
        # as before; only the declared boundary is two dashes shorter.
        boundary = "-"*38 + "boogabooga"
        sep = "--" + boundary
        form = [sep,
                "Content-Disposition: form-data; name=\"_charset_\"",
                "",
                "UTF-8",
                sep,
                "Content-Disposition: form-data; name=\"uri\"",
                "",
                self.uri,
                sep,
                "Content-Disposition: form-data; name=\"filename\"",
                "",
                "foo.txt",
                sep,
                "Content-Disposition: form-data; name=\"download\"",
                "",
                "Download",
                sep + "--",
                ]
        body = "\r\n".join(form)
        headers = {"content-type":
                   "multipart/form-data; boundary=%s" % boundary,
                   }
        return getPage(url, None, "POST", body, headers=headers,
                       followRedirect=False)
    d.addCallback(_get_from_form)
    def _got_from_form_worked_unexpectedly(page):
        self.fail("we weren't supposed to get an actual page: %s" %
                  (page,))
    def _got_from_form_redirect(f):
        f.trap(PageRedirect)
        # the PageRedirect does not seem to capture the uri= query arg
        # properly, so we can't check for it.
        # NOTE(review): that may have been a symptom of the form fields
        # not being parsed when the boundary was mis-declared -- confirm
        # before tightening this assertion.
        self.failUnless(f.value.location.startswith(base+"download_uri?"))
    d.addCallbacks(_got_from_form_worked_unexpectedly,
                   _got_from_form_redirect)

    # TODO: create a directory by using a form

    # TODO: upload by using a form on the directory page
    #    url = base + "global_vdrive/subdir1/freeform_post!!upload"

    # TODO: delete a file by using a button on the directory page

    return d
def _test_runner(self, res):
    """Run runner.dump_uri_extension on a share file and check its output.

    Walks self.basedir for the first directory containing a file named
    "uri_extension", dumps it into a StringIO, and asserts on the return
    code and on the fields that appear in the text.
    """
    # exercise some of the diagnostic tools in runner.py

    # find a uri_extension file
    share_dir = None
    for (dirpath, dirnames, filenames) in os.walk(self.basedir):
        if "uri_extension" in filenames:
            share_dir = dirpath
            break
    if share_dir is None:
        self.fail("unable to find any uri_extension files in %s"
                  % self.basedir)
    log.msg("test_system.SystemTest._test_runner using %s" % share_dir)

    out = StringIO()
    rc = runner.dump_uri_extension(
        {'filename': os.path.join(share_dir, "uri_extension")}, out)
    output = out.getvalue()
    self.failUnlessEqual(rc, 0)

    # we only upload a single file, so we can assert some things about
    # its size and shares
    fixed_lines = ("size: %d\n" % len(self.data),
                   "num_segments: 1\n",
                   # segment_size is always a multiple of needed_shares
                   "segment_size: 50\n",
                   "total_shares: 100\n",
                   )
    for line in fixed_lines:
        self.failUnless(line in output)

    # keys which are supposed to be present
    required_keys = ("size", "num_segments", "segment_size",
                     "needed_shares", "total_shares",
                     "codec_name", "codec_params", "tail_codec_params",
                     "plaintext_hash", "plaintext_root_hash",
                     "crypttext_hash", "crypttext_root_hash",
                     "share_root_hash",
                     )
    for key in required_keys:
        self.failUnless("%s: " % key in output, key)