2009-02-23 14:19:43 -07:00
|
|
|
|
2017-01-19 15:39:53 -07:00
|
|
|
import json
|
2012-04-01 01:55:19 -04:00
|
|
|
import os.path, shutil
|
2020-07-10 08:00:04 -04:00
|
|
|
|
|
|
|
from bs4 import BeautifulSoup
|
|
|
|
|
2009-02-23 14:19:43 -07:00
|
|
|
from twisted.trial import unittest
|
2011-08-01 23:37:03 -07:00
|
|
|
from twisted.internet import defer
|
2020-06-11 12:44:48 -04:00
|
|
|
|
|
|
|
from nevow.inevow import IRequest
|
|
|
|
from zope.interface import implementer
|
|
|
|
from twisted.web.server import Request
|
|
|
|
from twisted.web.test.requesthelper import DummyChannel
|
|
|
|
from twisted.web.template import flattenString
|
|
|
|
|
2009-02-23 14:19:43 -07:00
|
|
|
from allmydata import check_results, uri
|
2012-04-01 01:55:19 -04:00
|
|
|
from allmydata import uri as tahoe_uri
|
2020-07-14 21:44:41 -04:00
|
|
|
from allmydata.interfaces import (
|
2020-07-15 10:35:56 -04:00
|
|
|
IServer,
|
2020-07-14 21:44:41 -04:00
|
|
|
ICheckResults,
|
2020-07-15 16:58:39 -04:00
|
|
|
ICheckAndRepairResults,
|
2020-07-14 21:44:41 -04:00
|
|
|
)
|
2012-05-17 10:50:16 -07:00
|
|
|
from allmydata.util import base32
|
2009-02-23 14:19:43 -07:00
|
|
|
from allmydata.web import check_results as web_check_results
|
2011-02-20 17:58:04 -08:00
|
|
|
from allmydata.storage_client import StorageFarmBroker, NativeStorageServer
|
2012-04-01 01:55:19 -04:00
|
|
|
from allmydata.storage.server import storage_index_to_dir
|
checker: don't let failures in add-lease affect checker results. Closes #875.
Mutable servermap updates and the immutable checker, when run with
add_lease=True, send both the do-you-have-block and add-lease commands in
parallel, to avoid an extra round trip time. Many older servers have problems
with add-lease and raise various exceptions, which don't generally matter.
The client-side code was catching+ignoring some of them, but unrecognized
exceptions were passed through to the DYHB code, concealing the DYHB results
from the checker, making it think the server had no shares.
The fix is to separate the code paths. Both commands are sent at the same
time, but the errback path from add-lease is handled separately. Known
exceptions are ignored, the others (both unknown-remote and all-local) are
logged (log.WEIRD, which will trigger an Incident), but neither will affect
the DYHB results.
The add-lease message is sent first, and we know that the server handles them
synchronously. So when the checker is done, we can be sure that all the
add-lease messages have been retired. This makes life easier for unit tests.
2009-12-29 15:01:08 -08:00
|
|
|
from allmydata.monitor import Monitor
|
|
|
|
from allmydata.test.no_network import GridTestMixin
|
|
|
|
from allmydata.immutable.upload import Data
|
2011-08-06 17:44:59 -07:00
|
|
|
from allmydata.mutable.publish import MutableData
|
2009-02-23 14:19:43 -07:00
|
|
|
|
2019-08-19 16:09:26 -04:00
|
|
|
from .common import (
|
|
|
|
EMPTY_CLIENT_CONFIG,
|
|
|
|
)
|
|
|
|
|
2020-07-10 08:00:04 -04:00
|
|
|
from .web.common import (
|
|
|
|
assert_soup_has_favicon,
|
|
|
|
assert_soup_has_tag_with_content,
|
|
|
|
)
|
|
|
|
|
2019-05-15 08:17:44 +02:00
|
|
|
class FakeClient(object):
|
2009-06-01 19:25:11 -07:00
|
|
|
def get_storage_broker(self):
|
|
|
|
return self.storage_broker
|
2009-02-23 14:19:43 -07:00
|
|
|
|
2020-06-11 12:44:48 -04:00
|
|
|
@implementer(IRequest)
|
2020-07-28 06:27:40 -04:00
|
|
|
class TestRequest(Request, object):
|
2020-07-28 07:15:39 -04:00
|
|
|
"""
|
|
|
|
A minimal Request class to use in tests.
|
|
|
|
|
|
|
|
XXX: We have to have this class because `common.get_arg()` expects
|
|
|
|
a `nevow.inevow.IRequest`, which `twisted.web.server.Request`
|
|
|
|
isn't. The request needs to have `args`, `fields`, `prepath`, and
|
|
|
|
`postpath` properties so that `allmydata.web.common.get_arg()`
|
|
|
|
won't complain.
|
|
|
|
"""
|
2020-06-11 12:44:48 -04:00
|
|
|
def __init__(self, args=None, fields=None):
|
2020-07-28 06:27:40 -04:00
|
|
|
super(TestRequest, self).__init__(DummyChannel())
|
2020-06-11 12:44:48 -04:00
|
|
|
self.args = args or {}
|
|
|
|
self.fields = fields or {}
|
2020-07-10 08:00:04 -04:00
|
|
|
self.prepath = [b""]
|
2020-07-14 21:44:41 -04:00
|
|
|
self.postpath = [b""]
|
|
|
|
|
|
|
|
|
2020-07-15 10:35:56 -04:00
|
|
|
@implementer(IServer)
|
|
|
|
class FakeServer(object):
|
|
|
|
|
|
|
|
def get_name(self):
|
|
|
|
return "fake name"
|
|
|
|
|
|
|
|
def get_longname(self):
|
|
|
|
return "fake longname"
|
|
|
|
|
|
|
|
def get_nickname(self):
|
|
|
|
return "fake nickname"
|
|
|
|
|
|
|
|
|
2020-07-14 21:44:41 -04:00
|
|
|
@implementer(ICheckResults)
|
2020-07-15 18:43:52 -04:00
|
|
|
class FakeCheckResults(object):
|
2020-07-14 21:44:41 -04:00
|
|
|
|
2020-07-15 18:43:52 -04:00
|
|
|
def __init__(self, si=None,
|
|
|
|
healthy=False, recoverable=False,
|
|
|
|
summary="fake summary"):
|
|
|
|
self._storage_index = si
|
|
|
|
self._is_healthy = healthy
|
|
|
|
self._is_recoverable = recoverable
|
|
|
|
self._summary = summary
|
2020-07-14 21:44:41 -04:00
|
|
|
|
|
|
|
def get_storage_index(self):
|
|
|
|
return self._storage_index
|
|
|
|
|
|
|
|
def get_storage_index_string(self):
|
2020-07-15 18:43:52 -04:00
|
|
|
return base32.b2a_or_none(self._storage_index)
|
2020-07-14 21:44:41 -04:00
|
|
|
|
|
|
|
def is_healthy(self):
|
2020-07-15 18:43:52 -04:00
|
|
|
return self._is_healthy
|
2020-07-14 21:44:41 -04:00
|
|
|
|
|
|
|
def is_recoverable(self):
|
2020-07-15 18:43:52 -04:00
|
|
|
return self._is_recoverable
|
2020-07-14 21:44:41 -04:00
|
|
|
|
|
|
|
def get_summary(self):
|
2020-07-15 18:43:52 -04:00
|
|
|
return self._summary
|
2020-07-14 21:44:41 -04:00
|
|
|
|
2020-07-15 10:35:56 -04:00
|
|
|
def get_corrupt_shares(self):
|
2020-07-15 18:43:52 -04:00
|
|
|
# returns a list of (IServer, storage_index, sharenum)
|
|
|
|
return [(FakeServer(), "<fake-si>", 0)]
|
2020-07-14 21:44:41 -04:00
|
|
|
|
2020-06-11 12:44:48 -04:00
|
|
|
|
2020-07-15 16:58:39 -04:00
|
|
|
@implementer(ICheckAndRepairResults)
|
2020-07-15 18:43:52 -04:00
|
|
|
class FakeCheckAndRepairResults(object):
|
|
|
|
|
|
|
|
def __init__(self, si=None,
|
|
|
|
repair_attempted=False,
|
|
|
|
repair_success=False):
|
|
|
|
self._storage_index = si
|
|
|
|
self._repair_attempted = repair_attempted
|
|
|
|
self._repair_success = repair_success
|
2020-07-15 16:58:39 -04:00
|
|
|
|
|
|
|
def get_storage_index(self):
|
2020-07-15 18:43:52 -04:00
|
|
|
return self._storage_index
|
2020-07-15 16:58:39 -04:00
|
|
|
|
|
|
|
def get_pre_repair_results(self):
|
2020-07-15 18:43:52 -04:00
|
|
|
return FakeCheckResults()
|
2020-07-15 16:58:39 -04:00
|
|
|
|
|
|
|
def get_post_repair_results(self):
|
2020-07-15 18:43:52 -04:00
|
|
|
return FakeCheckResults()
|
2020-07-15 16:58:39 -04:00
|
|
|
|
|
|
|
def get_repair_attempted(self):
|
2020-07-15 18:43:52 -04:00
|
|
|
return self._repair_attempted
|
2020-07-15 16:58:39 -04:00
|
|
|
|
|
|
|
def get_repair_successful(self):
|
2020-07-15 18:43:52 -04:00
|
|
|
return self._repair_success
|
2020-07-15 16:58:39 -04:00
|
|
|
|
|
|
|
|
2020-06-11 15:51:39 -04:00
|
|
|
class WebResultsRendering(unittest.TestCase):
|
|
|
|
|
2020-07-28 06:53:52 -04:00
|
|
|
@staticmethod
|
|
|
|
def remove_tags(html):
|
2020-07-28 07:10:44 -04:00
|
|
|
return BeautifulSoup(html).get_text(separator=" ")
|
2009-02-23 14:19:43 -07:00
|
|
|
|
2009-06-01 14:06:04 -07:00
|
|
|
def create_fake_client(self):
|
2019-08-19 16:09:26 -04:00
|
|
|
sb = StorageFarmBroker(True, None, EMPTY_CLIENT_CONFIG)
|
2012-05-17 10:50:16 -07:00
|
|
|
# s.get_name() (the "short description") will be "v0-00000000".
|
|
|
|
# s.get_longname() will include the -long suffix.
|
|
|
|
servers = [("v0-00000000-long", "\x00"*20, "peer-0"),
|
|
|
|
("v0-ffffffff-long", "\xff"*20, "peer-f"),
|
|
|
|
("v0-11111111-long", "\x11"*20, "peer-11")]
|
2016-08-26 17:29:39 -07:00
|
|
|
for (key_s, binary_tubid, nickname) in servers:
|
|
|
|
server_id = key_s
|
|
|
|
tubid_b32 = base32.b2a(binary_tubid)
|
2012-05-17 10:50:16 -07:00
|
|
|
furl = "pb://%s@nowhere/fake" % tubid_b32
|
new introducer: signed extensible dictionary-based messages! refs #466
This introduces new client and server halves to the Introducer (renaming the
old one with a _V1 suffix). Both have fallbacks to accomodate talking to a
different version: the publishing client switches on whether the server's
.get_version() advertises V2 support, the server switches on which
subscription method was invoked by the subscribing client.
The V2 protocol sends a three-tuple of (serialized announcement dictionary,
signature, pubkey) for each announcement. The V2 server dispatches messages
to subscribers according to the service-name, and throws errors for invalid
signatures, but does not otherwise examine the messages. The V2 receiver's
subscription callback will receive a (serverid, ann_dict) pair. The
'serverid' will be equal to the pubkey if all of the following are true:
the originating client is V2, and was told a privkey to use
the announcement went through a V2 server
the signature is valid
If not, 'serverid' will be equal to the tubid portion of the announced FURL,
as was the case for V1 receivers.
Servers will create a keypair if one does not exist yet, stored in
private/server.privkey .
The signed announcement dictionary puts the server FURL in a key named
"anonymous-storage-FURL", which anticipates upcoming Accounting-related
changes in the server advertisements. It also provides a key named
"permutation-seed-base32" to tell clients what permutation seed to use. This
is computed at startup, using tubid if there are existing shares, otherwise
the pubkey, to retain share-order compatibility for existing servers.
2011-11-20 02:21:32 -08:00
|
|
|
ann = { "version": 0,
|
|
|
|
"service-name": "storage",
|
2012-05-17 10:50:16 -07:00
|
|
|
"anonymous-storage-FURL": furl,
|
new introducer: signed extensible dictionary-based messages! refs #466
This introduces new client and server halves to the Introducer (renaming the
old one with a _V1 suffix). Both have fallbacks to accomodate talking to a
different version: the publishing client switches on whether the server's
.get_version() advertises V2 support, the server switches on which
subscription method was invoked by the subscribing client.
The V2 protocol sends a three-tuple of (serialized announcement dictionary,
signature, pubkey) for each announcement. The V2 server dispatches messages
to subscribers according to the service-name, and throws errors for invalid
signatures, but does not otherwise examine the messages. The V2 receiver's
subscription callback will receive a (serverid, ann_dict) pair. The
'serverid' will be equal to the pubkey if all of the following are true:
the originating client is V2, and was told a privkey to use
the announcement went through a V2 server
the signature is valid
If not, 'serverid' will be equal to the tubid portion of the announced FURL,
as was the case for V1 receivers.
Servers will create a keypair if one does not exist yet, stored in
private/server.privkey .
The signed announcement dictionary puts the server FURL in a key named
"anonymous-storage-FURL", which anticipates upcoming Accounting-related
changes in the server advertisements. It also provides a key named
"permutation-seed-base32" to tell clients what permutation seed to use. This
is computed at startup, using tubid if there are existing shares, otherwise
the pubkey, to retain share-order compatibility for existing servers.
2011-11-20 02:21:32 -08:00
|
|
|
"permutation-seed-base32": "",
|
|
|
|
"nickname": unicode(nickname),
|
|
|
|
"app-versions": {}, # need #466 and v2 introducer
|
|
|
|
"my-version": "ver",
|
|
|
|
"oldest-supported": "oldest",
|
|
|
|
}
|
2019-08-19 16:09:26 -04:00
|
|
|
s = NativeStorageServer(server_id, ann, None, None, None)
|
2016-08-26 17:29:39 -07:00
|
|
|
sb.test_add_server(server_id, s)
|
2009-06-01 14:06:04 -07:00
|
|
|
c = FakeClient()
|
|
|
|
c.storage_broker = sb
|
|
|
|
return c
|
|
|
|
|
2020-06-11 12:44:48 -04:00
|
|
|
def render_json(self, resource):
|
|
|
|
return resource.render(TestRequest(args={"output": ["json"]}))
|
|
|
|
|
|
|
|
def render_element(self, element, args=None):
|
|
|
|
d = flattenString(TestRequest(args), element)
|
|
|
|
return unittest.TestCase().successResultOf(d)
|
2009-02-23 14:19:43 -07:00
|
|
|
|
|
|
|
def test_literal(self):
|
2020-06-17 21:32:49 -04:00
|
|
|
lcr = web_check_results.LiteralCheckResultsRendererElement()
|
2009-02-23 14:19:43 -07:00
|
|
|
|
2020-06-11 15:48:44 -04:00
|
|
|
html = self.render_element(lcr)
|
2020-07-28 07:18:01 -04:00
|
|
|
self.failUnlessIn("Literal files are always healthy", html)
|
2020-06-11 15:48:44 -04:00
|
|
|
|
|
|
|
html = self.render_element(lcr, args={"return_to": ["FOOURL"]})
|
2020-07-28 07:18:01 -04:00
|
|
|
self.failUnlessIn("Literal files are always healthy", html)
|
2020-06-11 15:48:44 -04:00
|
|
|
self.failUnlessIn('<a href="FOOURL">Return to file.</a>', html)
|
2020-06-11 12:44:48 -04:00
|
|
|
|
|
|
|
c = self.create_fake_client()
|
|
|
|
lcr = web_check_results.LiteralCheckResultsRenderer(c)
|
|
|
|
|
2020-06-11 15:48:44 -04:00
|
|
|
js = self.render_json(lcr)
|
|
|
|
j = json.loads(js)
|
|
|
|
self.failUnlessEqual(j["storage-index"], "")
|
|
|
|
self.failUnlessEqual(j["results"]["healthy"], True)
|
|
|
|
|
2009-02-23 14:19:43 -07:00
|
|
|
|
|
|
|
def test_check(self):
|
2009-06-01 14:06:04 -07:00
|
|
|
c = self.create_fake_client()
|
2012-05-25 12:56:03 -07:00
|
|
|
sb = c.storage_broker
|
2009-02-23 14:19:43 -07:00
|
|
|
serverid_1 = "\x00"*20
|
|
|
|
serverid_f = "\xff"*20
|
2012-05-25 12:57:53 -07:00
|
|
|
server_1 = sb.get_stub_server(serverid_1)
|
|
|
|
server_f = sb.get_stub_server(serverid_f)
|
2009-02-23 14:19:43 -07:00
|
|
|
u = uri.CHKFileURI("\x00"*16, "\x00"*32, 3, 10, 1234)
|
2014-03-20 16:13:57 +00:00
|
|
|
data = { "count_happiness": 8,
|
|
|
|
"count_shares_needed": 3,
|
2012-05-25 00:13:23 -07:00
|
|
|
"count_shares_expected": 9,
|
|
|
|
"count_shares_good": 10,
|
|
|
|
"count_good_share_hosts": 11,
|
|
|
|
"count_recoverable_versions": 1,
|
|
|
|
"count_unrecoverable_versions": 0,
|
|
|
|
"servers_responding": [],
|
2012-05-25 12:57:53 -07:00
|
|
|
"sharemap": {"shareid1": [server_1, server_f]},
|
2012-05-25 00:13:23 -07:00
|
|
|
"count_wrong_shares": 0,
|
|
|
|
"list_corrupt_shares": [],
|
|
|
|
"count_corrupt_shares": 0,
|
|
|
|
"list_incompatible_shares": [],
|
|
|
|
"count_incompatible_shares": 0,
|
2012-05-25 00:14:46 -07:00
|
|
|
"report": [], "share_problems": [], "servermap": None,
|
2009-02-23 14:19:43 -07:00
|
|
|
}
|
2012-05-25 00:14:46 -07:00
|
|
|
cr = check_results.CheckResults(u, u.get_storage_index(),
|
|
|
|
healthy=True, recoverable=True,
|
|
|
|
summary="groovy",
|
|
|
|
**data)
|
2020-06-11 12:44:48 -04:00
|
|
|
w = web_check_results.CheckResultsRendererElement(c, cr)
|
|
|
|
html = self.render_element(w)
|
2009-02-23 14:19:43 -07:00
|
|
|
s = self.remove_tags(html)
|
|
|
|
self.failUnlessIn("File Check Results for SI=2k6avp", s) # abbreviated
|
|
|
|
self.failUnlessIn("Healthy : groovy", s)
|
|
|
|
self.failUnlessIn("Share Counts: need 3-of-9, have 10", s)
|
2014-03-20 16:13:57 +00:00
|
|
|
self.failUnlessIn("Happiness Level: 8", s)
|
2009-02-23 14:19:43 -07:00
|
|
|
self.failUnlessIn("Hosts with good shares: 11", s)
|
|
|
|
self.failUnlessIn("Corrupt shares: none", s)
|
|
|
|
self.failUnlessIn("Wrong Shares: 0", s)
|
|
|
|
self.failUnlessIn("Recoverable Versions: 1", s)
|
|
|
|
self.failUnlessIn("Unrecoverable Versions: 0", s)
|
2020-07-28 07:10:44 -04:00
|
|
|
self.failUnlessIn("Good Shares (sorted in share order): Share ID Nickname Node ID shareid1 peer-0 00000000 peer-f ffffffff", s)
|
2009-02-23 14:19:43 -07:00
|
|
|
|
2012-05-25 00:14:46 -07:00
|
|
|
cr = check_results.CheckResults(u, u.get_storage_index(),
|
|
|
|
healthy=False, recoverable=True,
|
|
|
|
summary="ungroovy",
|
|
|
|
**data)
|
2020-06-11 12:44:48 -04:00
|
|
|
w = web_check_results.CheckResultsRendererElement(c, cr)
|
|
|
|
html = self.render_element(w)
|
2009-02-23 14:19:43 -07:00
|
|
|
s = self.remove_tags(html)
|
|
|
|
self.failUnlessIn("File Check Results for SI=2k6avp", s) # abbreviated
|
|
|
|
self.failUnlessIn("Not Healthy! : ungroovy", s)
|
|
|
|
|
2012-05-25 00:13:23 -07:00
|
|
|
data["count_corrupt_shares"] = 1
|
2012-05-25 12:57:53 -07:00
|
|
|
data["list_corrupt_shares"] = [(server_1, u.get_storage_index(), 2)]
|
2012-05-25 00:14:46 -07:00
|
|
|
cr = check_results.CheckResults(u, u.get_storage_index(),
|
|
|
|
healthy=False, recoverable=False,
|
|
|
|
summary="rather dead",
|
|
|
|
**data)
|
2020-06-11 12:44:48 -04:00
|
|
|
w = web_check_results.CheckResultsRendererElement(c, cr)
|
|
|
|
html = self.render_element(w)
|
2009-02-23 14:19:43 -07:00
|
|
|
s = self.remove_tags(html)
|
|
|
|
self.failUnlessIn("File Check Results for SI=2k6avp", s) # abbreviated
|
|
|
|
self.failUnlessIn("Not Recoverable! : rather dead", s)
|
2020-07-28 07:10:44 -04:00
|
|
|
self.failUnlessIn("Corrupt shares: Share ID Nickname Node ID sh#2 peer-0 00000000", s)
|
2009-02-23 14:19:43 -07:00
|
|
|
|
2020-06-11 12:44:48 -04:00
|
|
|
html = self.render_element(w)
|
2009-02-23 14:19:43 -07:00
|
|
|
s = self.remove_tags(html)
|
|
|
|
self.failUnlessIn("File Check Results for SI=2k6avp", s) # abbreviated
|
|
|
|
self.failUnlessIn("Not Recoverable! : rather dead", s)
|
|
|
|
|
2020-06-11 12:44:48 -04:00
|
|
|
html = self.render_element(w, args={"return_to": ["FOOURL"]})
|
2009-04-07 11:54:59 -07:00
|
|
|
self.failUnlessIn('<a href="FOOURL">Return to file/directory.</a>',
|
2009-02-23 14:19:43 -07:00
|
|
|
html)
|
|
|
|
|
2020-06-11 12:44:48 -04:00
|
|
|
w = web_check_results.CheckResultsRenderer(c, cr)
|
2009-02-23 14:19:43 -07:00
|
|
|
d = self.render_json(w)
|
|
|
|
def _check_json(jdata):
|
2017-01-19 15:39:53 -07:00
|
|
|
j = json.loads(jdata)
|
2009-02-23 14:19:43 -07:00
|
|
|
self.failUnlessEqual(j["summary"], "rather dead")
|
|
|
|
self.failUnlessEqual(j["storage-index"],
|
|
|
|
"2k6avpjga3dho3zsjo6nnkt7n4")
|
2014-03-20 16:13:57 +00:00
|
|
|
expected = {'count-happiness': 8,
|
2009-02-23 14:19:43 -07:00
|
|
|
'count-shares-expected': 9,
|
|
|
|
'healthy': False,
|
|
|
|
'count-unrecoverable-versions': 0,
|
|
|
|
'count-shares-needed': 3,
|
|
|
|
'sharemap': {"shareid1":
|
2012-05-25 12:58:02 -07:00
|
|
|
["v0-00000000-long", "v0-ffffffff-long"]},
|
2009-02-23 14:19:43 -07:00
|
|
|
'count-recoverable-versions': 1,
|
|
|
|
'list-corrupt-shares':
|
2012-05-25 12:58:28 -07:00
|
|
|
[["v0-00000000-long", "2k6avpjga3dho3zsjo6nnkt7n4", 2]],
|
2009-02-23 14:19:43 -07:00
|
|
|
'count-good-share-hosts': 11,
|
|
|
|
'count-wrong-shares': 0,
|
|
|
|
'count-shares-good': 10,
|
2012-05-25 00:13:13 -07:00
|
|
|
'count-corrupt-shares': 1,
|
2009-02-23 14:19:43 -07:00
|
|
|
'servers-responding': [],
|
|
|
|
'recoverable': False,
|
|
|
|
}
|
|
|
|
self.failUnlessEqual(j["results"], expected)
|
2020-06-11 12:44:48 -04:00
|
|
|
_check_json(d)
|
|
|
|
|
|
|
|
w = web_check_results.CheckResultsRendererElement(c, cr)
|
|
|
|
d = self.render_element(w)
|
2009-02-23 14:19:43 -07:00
|
|
|
def _check(html):
|
|
|
|
s = self.remove_tags(html)
|
|
|
|
self.failUnlessIn("File Check Results for SI=2k6avp", s)
|
|
|
|
self.failUnlessIn("Not Recoverable! : rather dead", s)
|
2020-06-11 12:44:48 -04:00
|
|
|
_check(html)
|
2009-02-23 14:19:43 -07:00
|
|
|
|
|
|
|
def test_check_and_repair(self):
|
2009-06-01 14:06:04 -07:00
|
|
|
c = self.create_fake_client()
|
2012-05-25 12:56:03 -07:00
|
|
|
sb = c.storage_broker
|
2009-02-23 14:19:43 -07:00
|
|
|
serverid_1 = "\x00"*20
|
|
|
|
serverid_f = "\xff"*20
|
|
|
|
u = uri.CHKFileURI("\x00"*16, "\x00"*32, 3, 10, 1234)
|
|
|
|
|
2014-03-20 16:13:57 +00:00
|
|
|
data = { "count_happiness": 5,
|
|
|
|
"count_shares_needed": 3,
|
2012-05-25 00:13:23 -07:00
|
|
|
"count_shares_expected": 10,
|
|
|
|
"count_shares_good": 6,
|
|
|
|
"count_good_share_hosts": 7,
|
|
|
|
"count_recoverable_versions": 1,
|
|
|
|
"count_unrecoverable_versions": 0,
|
|
|
|
"servers_responding": [],
|
2012-05-25 12:56:03 -07:00
|
|
|
"sharemap": {"shareid1": [sb.get_stub_server(serverid_1),
|
|
|
|
sb.get_stub_server(serverid_f)]},
|
2012-05-25 00:13:23 -07:00
|
|
|
"count_wrong_shares": 0,
|
|
|
|
"list_corrupt_shares": [],
|
|
|
|
"count_corrupt_shares": 0,
|
|
|
|
"list_incompatible_shares": [],
|
|
|
|
"count_incompatible_shares": 0,
|
2012-05-25 00:14:46 -07:00
|
|
|
"report": [], "share_problems": [], "servermap": None,
|
2009-02-23 14:19:43 -07:00
|
|
|
}
|
2012-05-25 00:14:46 -07:00
|
|
|
pre_cr = check_results.CheckResults(u, u.get_storage_index(),
|
|
|
|
healthy=False, recoverable=True,
|
|
|
|
summary="illing",
|
|
|
|
**data)
|
2009-02-23 14:19:43 -07:00
|
|
|
|
2014-03-20 16:13:57 +00:00
|
|
|
data = { "count_happiness": 9,
|
|
|
|
"count_shares_needed": 3,
|
2012-05-25 00:13:23 -07:00
|
|
|
"count_shares_expected": 10,
|
|
|
|
"count_shares_good": 10,
|
|
|
|
"count_good_share_hosts": 11,
|
|
|
|
"count_recoverable_versions": 1,
|
|
|
|
"count_unrecoverable_versions": 0,
|
|
|
|
"servers_responding": [],
|
2012-05-25 12:56:03 -07:00
|
|
|
"sharemap": {"shareid1": [sb.get_stub_server(serverid_1),
|
|
|
|
sb.get_stub_server(serverid_f)]},
|
2012-05-25 00:13:23 -07:00
|
|
|
"count_wrong_shares": 0,
|
|
|
|
"count_corrupt_shares": 0,
|
|
|
|
"list_corrupt_shares": [],
|
|
|
|
"list_incompatible_shares": [],
|
|
|
|
"count_incompatible_shares": 0,
|
2012-05-25 00:14:46 -07:00
|
|
|
"report": [], "share_problems": [], "servermap": None,
|
2009-02-23 14:19:43 -07:00
|
|
|
}
|
2012-05-25 00:14:46 -07:00
|
|
|
post_cr = check_results.CheckResults(u, u.get_storage_index(),
|
|
|
|
healthy=True, recoverable=True,
|
|
|
|
summary="groovy",
|
|
|
|
**data)
|
2009-02-23 14:19:43 -07:00
|
|
|
|
2010-02-21 18:45:04 -08:00
|
|
|
crr = check_results.CheckAndRepairResults(u.get_storage_index())
|
2009-02-23 14:19:43 -07:00
|
|
|
crr.pre_repair_results = pre_cr
|
|
|
|
crr.post_repair_results = post_cr
|
|
|
|
crr.repair_attempted = False
|
|
|
|
|
2020-06-11 12:44:48 -04:00
|
|
|
w = web_check_results.CheckAndRepairResultsRendererElement(c, crr)
|
|
|
|
html = self.render_element(w)
|
2009-02-23 14:19:43 -07:00
|
|
|
s = self.remove_tags(html)
|
|
|
|
|
|
|
|
self.failUnlessIn("File Check-And-Repair Results for SI=2k6avp", s)
|
|
|
|
self.failUnlessIn("Healthy : groovy", s)
|
|
|
|
self.failUnlessIn("No repair necessary", s)
|
|
|
|
self.failUnlessIn("Post-Repair Checker Results:", s)
|
|
|
|
self.failUnlessIn("Share Counts: need 3-of-10, have 10", s)
|
|
|
|
|
|
|
|
crr.repair_attempted = True
|
|
|
|
crr.repair_successful = True
|
2020-06-11 12:44:48 -04:00
|
|
|
html = self.render_element(w)
|
2009-02-23 14:19:43 -07:00
|
|
|
s = self.remove_tags(html)
|
|
|
|
|
|
|
|
self.failUnlessIn("File Check-And-Repair Results for SI=2k6avp", s)
|
|
|
|
self.failUnlessIn("Healthy : groovy", s)
|
|
|
|
self.failUnlessIn("Repair successful", s)
|
|
|
|
self.failUnlessIn("Post-Repair Checker Results:", s)
|
|
|
|
|
|
|
|
crr.repair_attempted = True
|
|
|
|
crr.repair_successful = False
|
2012-05-25 00:14:46 -07:00
|
|
|
post_cr = check_results.CheckResults(u, u.get_storage_index(),
|
|
|
|
healthy=False, recoverable=True,
|
|
|
|
summary="better",
|
|
|
|
**data)
|
|
|
|
crr.post_repair_results = post_cr
|
2020-06-11 12:44:48 -04:00
|
|
|
html = self.render_element(w)
|
2009-02-23 14:19:43 -07:00
|
|
|
s = self.remove_tags(html)
|
|
|
|
|
|
|
|
self.failUnlessIn("File Check-And-Repair Results for SI=2k6avp", s)
|
|
|
|
self.failUnlessIn("Not Healthy! : better", s)
|
|
|
|
self.failUnlessIn("Repair unsuccessful", s)
|
|
|
|
self.failUnlessIn("Post-Repair Checker Results:", s)
|
|
|
|
|
|
|
|
crr.repair_attempted = True
|
|
|
|
crr.repair_successful = False
|
2012-05-25 00:14:46 -07:00
|
|
|
post_cr = check_results.CheckResults(u, u.get_storage_index(),
|
|
|
|
healthy=False, recoverable=False,
|
|
|
|
summary="worse",
|
|
|
|
**data)
|
|
|
|
crr.post_repair_results = post_cr
|
2020-06-11 12:44:48 -04:00
|
|
|
html = self.render_element(w)
|
2009-02-23 14:19:43 -07:00
|
|
|
s = self.remove_tags(html)
|
|
|
|
|
|
|
|
self.failUnlessIn("File Check-And-Repair Results for SI=2k6avp", s)
|
|
|
|
self.failUnlessIn("Not Recoverable! : worse", s)
|
|
|
|
self.failUnlessIn("Repair unsuccessful", s)
|
|
|
|
self.failUnlessIn("Post-Repair Checker Results:", s)
|
|
|
|
|
2020-07-28 07:26:11 -04:00
|
|
|
w = web_check_results.CheckAndRepairResultsRenderer(c, crr)
|
|
|
|
j = json.loads(self.render_json(w))
|
|
|
|
self.failUnlessEqual(j["repair-attempted"], True)
|
|
|
|
self.failUnlessEqual(j["storage-index"],
|
|
|
|
"2k6avpjga3dho3zsjo6nnkt7n4")
|
|
|
|
self.failUnlessEqual(j["pre-repair-results"]["summary"], "illing")
|
|
|
|
self.failUnlessEqual(j["post-repair-results"]["summary"], "worse")
|
|
|
|
|
|
|
|
w = web_check_results.CheckAndRepairResultsRenderer(c, None)
|
|
|
|
j = json.loads(self.render_json(w))
|
|
|
|
self.failUnlessEqual(j["repair-attempted"], False)
|
|
|
|
self.failUnlessEqual(j["storage-index"], "")
|
2009-02-23 14:19:43 -07:00
|
|
|
|
2020-07-14 21:44:41 -04:00
|
|
|
|
2020-07-11 07:59:28 -04:00
|
|
|
def test_deep_check_renderer(self):
|
2020-07-15 18:43:52 -04:00
|
|
|
status = check_results.DeepCheckResults("fake-root-si")
|
|
|
|
status.add_check(
|
|
|
|
FakeCheckResults("<unhealthy/unrecoverable>", False, False),
|
|
|
|
(u"fake", u"unhealthy", u"unrecoverable")
|
|
|
|
)
|
|
|
|
status.add_check(
|
|
|
|
FakeCheckResults("<healthy/recoverable>", True, True),
|
|
|
|
(u"fake", u"healthy", u"recoverable")
|
|
|
|
)
|
|
|
|
status.add_check(
|
|
|
|
FakeCheckResults("<healthy/unrecoverable>", True, False),
|
|
|
|
(u"fake", u"healthy", u"unrecoverable")
|
|
|
|
)
|
|
|
|
status.add_check(
|
|
|
|
FakeCheckResults("<unhealthy/unrecoverable>", False, True),
|
|
|
|
(u"fake", u"unhealthy", u"recoverable")
|
|
|
|
)
|
|
|
|
|
2020-07-11 07:59:28 -04:00
|
|
|
monitor = Monitor()
|
2020-07-15 18:43:52 -04:00
|
|
|
monitor.set_status(status)
|
2020-07-11 07:59:28 -04:00
|
|
|
|
|
|
|
elem = web_check_results.DeepCheckResultsRendererElement(monitor)
|
|
|
|
doc = self.render_element(elem)
|
|
|
|
soup = BeautifulSoup(doc, 'html5lib')
|
|
|
|
|
|
|
|
assert_soup_has_favicon(self, soup)
|
|
|
|
|
|
|
|
assert_soup_has_tag_with_content(
|
|
|
|
self, soup, u"title",
|
|
|
|
u"Tahoe-LAFS - Deep Check Results"
|
|
|
|
)
|
|
|
|
|
|
|
|
assert_soup_has_tag_with_content(
|
|
|
|
self, soup, u"h1",
|
|
|
|
"Deep-Check Results for root SI="
|
|
|
|
)
|
|
|
|
|
|
|
|
assert_soup_has_tag_with_content(
|
|
|
|
self, soup, u"li",
|
2020-07-14 21:44:41 -04:00
|
|
|
u"Objects Checked: 4"
|
2020-07-11 07:59:28 -04:00
|
|
|
)
|
|
|
|
|
|
|
|
assert_soup_has_tag_with_content(
|
|
|
|
self, soup, u"li",
|
2020-07-15 18:43:52 -04:00
|
|
|
u"Objects Healthy: 2"
|
2020-07-11 07:59:28 -04:00
|
|
|
)
|
|
|
|
|
|
|
|
assert_soup_has_tag_with_content(
|
|
|
|
self, soup, u"li",
|
2020-07-15 18:43:52 -04:00
|
|
|
u"Objects Unhealthy: 2"
|
2020-07-11 07:59:28 -04:00
|
|
|
)
|
|
|
|
|
|
|
|
assert_soup_has_tag_with_content(
|
|
|
|
self, soup, u"li",
|
2020-07-15 18:43:52 -04:00
|
|
|
u"Objects Unrecoverable: 2"
|
2020-07-11 07:59:28 -04:00
|
|
|
)
|
|
|
|
|
|
|
|
assert_soup_has_tag_with_content(
|
|
|
|
self, soup, u"li",
|
2020-07-15 18:43:52 -04:00
|
|
|
u"Corrupt Shares: 4"
|
2020-07-11 07:59:28 -04:00
|
|
|
)
|
|
|
|
|
2020-07-15 13:35:22 -04:00
|
|
|
assert_soup_has_tag_with_content(
|
|
|
|
self, soup, u"h2",
|
|
|
|
u"Files/Directories That Had Problems:"
|
|
|
|
)
|
|
|
|
|
2020-07-15 16:38:30 -04:00
|
|
|
assert_soup_has_tag_with_content(
|
|
|
|
self, soup, u"li",
|
2020-07-15 18:43:52 -04:00
|
|
|
u"fake/unhealthy/recoverable: fake summary"
|
|
|
|
)
|
|
|
|
|
|
|
|
assert_soup_has_tag_with_content(
|
|
|
|
self, soup, u"li",
|
|
|
|
u"fake/unhealthy/unrecoverable: fake summary"
|
2020-07-15 16:38:30 -04:00
|
|
|
)
|
|
|
|
|
2020-07-15 13:35:22 -04:00
|
|
|
assert_soup_has_tag_with_content(
|
|
|
|
self, soup, u"h2",
|
|
|
|
u"Servers on which corrupt shares were found"
|
|
|
|
)
|
|
|
|
|
|
|
|
assert_soup_has_tag_with_content(
|
|
|
|
self, soup, u"h2",
|
|
|
|
u"Corrupt Shares"
|
|
|
|
)
|
|
|
|
|
|
|
|
assert_soup_has_tag_with_content(
|
|
|
|
self, soup, u"h2",
|
|
|
|
u"All Results"
|
|
|
|
)
|
|
|
|
|
2020-07-10 08:00:04 -04:00
|
|
|
def test_deep_check_and_repair_renderer(self):
|
|
|
|
status = check_results.DeepCheckAndRepairResults("")
|
2020-07-15 18:43:52 -04:00
|
|
|
|
2020-07-15 16:58:39 -04:00
|
|
|
status.add_check_and_repair(
|
2020-07-15 18:43:52 -04:00
|
|
|
FakeCheckAndRepairResults("attempted/success", True, True),
|
|
|
|
(u"attempted", u"success")
|
|
|
|
)
|
|
|
|
status.add_check_and_repair(
|
|
|
|
FakeCheckAndRepairResults("attempted/failure", True, False),
|
|
|
|
(u"attempted", u"failure")
|
|
|
|
)
|
|
|
|
status.add_check_and_repair(
|
|
|
|
FakeCheckAndRepairResults("unattempted/failure", False, False),
|
|
|
|
(u"unattempted", u"failure")
|
2020-07-15 16:58:39 -04:00
|
|
|
)
|
|
|
|
|
2020-07-15 18:43:52 -04:00
|
|
|
monitor = Monitor()
|
2020-07-10 08:00:04 -04:00
|
|
|
monitor.set_status(status)
|
2020-07-15 16:58:39 -04:00
|
|
|
|
2020-07-10 08:00:04 -04:00
|
|
|
elem = web_check_results.DeepCheckAndRepairResultsRendererElement(monitor)
|
|
|
|
doc = self.render_element(elem)
|
|
|
|
soup = BeautifulSoup(doc, 'html5lib')
|
|
|
|
|
|
|
|
assert_soup_has_favicon(self, soup)
|
|
|
|
|
|
|
|
assert_soup_has_tag_with_content(
|
|
|
|
self, soup, u"title",
|
|
|
|
u"Tahoe-LAFS - Deep Check Results"
|
|
|
|
)
|
|
|
|
|
|
|
|
assert_soup_has_tag_with_content(
|
|
|
|
self, soup, u"h1",
|
|
|
|
u"Deep-Check-And-Repair Results for root SI="
|
|
|
|
)
|
|
|
|
|
|
|
|
assert_soup_has_tag_with_content(
|
|
|
|
self, soup, u"li",
|
2020-07-15 18:43:52 -04:00
|
|
|
u"Objects Checked: 3"
|
2020-07-10 08:00:04 -04:00
|
|
|
)
|
|
|
|
|
|
|
|
assert_soup_has_tag_with_content(
|
|
|
|
self, soup, u"li",
|
|
|
|
u"Objects Healthy (before repair): 0"
|
|
|
|
)
|
|
|
|
|
|
|
|
assert_soup_has_tag_with_content(
|
|
|
|
self, soup, u"li",
|
2020-07-15 18:43:52 -04:00
|
|
|
u"Objects Unhealthy (before repair): 3"
|
2020-07-10 08:00:04 -04:00
|
|
|
)
|
|
|
|
|
|
|
|
assert_soup_has_tag_with_content(
|
|
|
|
self, soup, u"li",
|
2020-07-15 17:09:53 -04:00
|
|
|
u"Corrupt Shares (before repair): 3"
|
2020-07-10 08:00:04 -04:00
|
|
|
)
|
|
|
|
|
|
|
|
assert_soup_has_tag_with_content(
|
|
|
|
self, soup, u"li",
|
2020-07-15 18:43:52 -04:00
|
|
|
u"Repairs Attempted: 2"
|
2020-07-10 08:00:04 -04:00
|
|
|
)
|
|
|
|
|
|
|
|
assert_soup_has_tag_with_content(
|
|
|
|
self, soup, u"li",
|
2020-07-15 18:43:52 -04:00
|
|
|
u"Repairs Successful: 1"
|
2020-07-10 08:00:04 -04:00
|
|
|
)
|
|
|
|
|
|
|
|
assert_soup_has_tag_with_content(
|
|
|
|
self, soup, u"li",
|
2020-07-15 17:09:53 -04:00
|
|
|
"Repairs Unsuccessful: 1"
|
2020-07-10 08:00:04 -04:00
|
|
|
)
|
|
|
|
|
|
|
|
assert_soup_has_tag_with_content(
|
|
|
|
self, soup, u"li",
|
|
|
|
u"Objects Healthy (after repair): 0"
|
|
|
|
)
|
|
|
|
|
|
|
|
assert_soup_has_tag_with_content(
|
|
|
|
self, soup, u"li",
|
2020-07-15 18:43:52 -04:00
|
|
|
u"Objects Unhealthy (after repair): 3"
|
2020-07-10 08:00:04 -04:00
|
|
|
)
|
|
|
|
|
|
|
|
assert_soup_has_tag_with_content(
|
|
|
|
self, soup, u"li",
|
2020-07-15 17:09:53 -04:00
|
|
|
u"Corrupt Shares (after repair): 3"
|
2020-07-10 08:00:04 -04:00
|
|
|
)
|
|
|
|
|
|
|
|
assert_soup_has_tag_with_content(
|
|
|
|
self, soup, u"h2",
|
|
|
|
u"Files/Directories That Had Problems:"
|
|
|
|
)
|
|
|
|
|
|
|
|
assert_soup_has_tag_with_content(
|
|
|
|
self, soup, u"h2",
|
|
|
|
u"Files/Directories That Still Have Problems:"
|
|
|
|
)
|
|
|
|
|
|
|
|
assert_soup_has_tag_with_content(
|
|
|
|
self, soup, u"h2",
|
|
|
|
u"Servers on which corrupt shares were found"
|
|
|
|
)
|
|
|
|
|
|
|
|
assert_soup_has_tag_with_content(
|
|
|
|
self, soup, u"h2",
|
|
|
|
u"Remaining Corrupt Shares"
|
|
|
|
)
|
|
|
|
|
|
|
|
|
2012-04-01 01:55:19 -04:00
|
|
|
class BalancingAct(GridTestMixin, unittest.TestCase):
|
|
|
|
# test for #1115 regarding the 'count-good-share-hosts' metric
|
|
|
|
|
|
|
|
|
|
|
|
def add_server(self, server_number, readonly=False):
|
|
|
|
assert self.g, "I tried to find a grid at self.g, but failed"
|
|
|
|
ss = self.g.make_server(server_number, readonly)
|
|
|
|
#log.msg("just created a server, number: %s => %s" % (server_number, ss,))
|
|
|
|
self.g.add_server(server_number, ss)
|
|
|
|
|
|
|
|
def add_server_with_share(self, server_number, uri, share_number=None,
|
2012-05-13 01:12:22 -07:00
|
|
|
readonly=False):
|
2012-04-01 01:55:19 -04:00
|
|
|
self.add_server(server_number, readonly)
|
|
|
|
if share_number is not None:
|
|
|
|
self.copy_share_to_server(uri, share_number, server_number)
|
|
|
|
|
|
|
|
def copy_share_to_server(self, uri, share_number, server_number):
|
|
|
|
ss = self.g.servers_by_number[server_number]
|
|
|
|
# Copy share i from the directory associated with the first
|
|
|
|
# storage server to the directory associated with this one.
|
|
|
|
assert self.g, "I tried to find a grid at self.g, but failed"
|
|
|
|
assert self.shares, "I tried to find shares at self.shares, but failed"
|
|
|
|
old_share_location = self.shares[share_number][2]
|
|
|
|
new_share_location = os.path.join(ss.storedir, "shares")
|
|
|
|
si = tahoe_uri.from_string(self.uri).get_storage_index()
|
|
|
|
new_share_location = os.path.join(new_share_location,
|
|
|
|
storage_index_to_dir(si))
|
|
|
|
if not os.path.exists(new_share_location):
|
|
|
|
os.makedirs(new_share_location)
|
|
|
|
new_share_location = os.path.join(new_share_location,
|
|
|
|
str(share_number))
|
|
|
|
if old_share_location != new_share_location:
|
|
|
|
shutil.copy(old_share_location, new_share_location)
|
|
|
|
shares = self.find_uri_shares(uri)
|
|
|
|
# Make sure that the storage server has the share.
|
|
|
|
self.failUnless((share_number, ss.my_nodeid, new_share_location)
|
|
|
|
in shares)
|
|
|
|
|
|
|
|
def _pretty_shares_chart(self, uri):
|
|
|
|
# Servers are labeled A-Z, shares are labeled 0-9
|
|
|
|
letters = 'ABCDEFGHIJKLMNOPQRSTUVWXYZ'
|
|
|
|
assert len(self.g.servers_by_number) < len(letters), \
|
|
|
|
"This little printing function is only meant for < 26 servers"
|
|
|
|
shares_chart = {}
|
2012-05-13 01:12:22 -07:00
|
|
|
names = dict(zip([ss.my_nodeid
|
|
|
|
for _,ss in self.g.servers_by_number.iteritems()],
|
|
|
|
letters))
|
2012-04-01 01:55:19 -04:00
|
|
|
for shnum, serverid, _ in self.find_uri_shares(uri):
|
|
|
|
shares_chart.setdefault(shnum, []).append(names[serverid])
|
|
|
|
return shares_chart
|
|
|
|
|
2017-02-14 16:36:57 -07:00
|
|
|
def test_good_share_hosts(self):
|
2012-04-01 01:55:19 -04:00
|
|
|
self.basedir = "checker/BalancingAct/1115"
|
|
|
|
self.set_up_grid(num_servers=1)
|
|
|
|
c0 = self.g.clients[0]
|
2014-04-21 22:40:28 +01:00
|
|
|
c0.encoding_params['happy'] = 1
|
|
|
|
c0.encoding_params['n'] = 4
|
|
|
|
c0.encoding_params['k'] = 3
|
2012-04-01 01:55:19 -04:00
|
|
|
|
|
|
|
DATA = "data" * 100
|
|
|
|
d = c0.upload(Data(DATA, convergence=""))
|
|
|
|
def _stash_immutable(ur):
|
2012-05-21 21:14:44 -07:00
|
|
|
self.imm = c0.create_node_from_uri(ur.get_uri())
|
2012-04-01 01:55:19 -04:00
|
|
|
self.uri = self.imm.get_uri()
|
|
|
|
d.addCallback(_stash_immutable)
|
|
|
|
d.addCallback(lambda ign:
|
|
|
|
self.find_uri_shares(self.uri))
|
|
|
|
def _store_shares(shares):
|
|
|
|
self.shares = shares
|
|
|
|
d.addCallback(_store_shares)
|
|
|
|
|
|
|
|
def add_three(_, i):
|
|
|
|
# Add a new server with just share 3
|
|
|
|
self.add_server_with_share(i, self.uri, 3)
|
2012-04-01 19:31:53 -04:00
|
|
|
#print self._pretty_shares_chart(self.uri)
|
2012-04-01 01:55:19 -04:00
|
|
|
for i in range(1,5):
|
|
|
|
d.addCallback(add_three, i)
|
2012-05-13 01:12:22 -07:00
|
|
|
|
2012-04-01 01:55:19 -04:00
|
|
|
def _check_and_repair(_):
|
|
|
|
return self.imm.check_and_repair(Monitor())
|
2012-04-01 19:31:53 -04:00
|
|
|
def _check_counts(crr, shares_good, good_share_hosts):
|
2012-05-25 00:13:48 -07:00
|
|
|
prr = crr.get_post_repair_results()
|
|
|
|
self.failUnlessEqual(prr.get_share_counter_good(), shares_good)
|
|
|
|
self.failUnlessEqual(prr.get_host_counter_good_shares(),
|
2012-05-13 01:12:22 -07:00
|
|
|
good_share_hosts)
|
2012-04-01 01:55:19 -04:00
|
|
|
|
|
|
|
"""
|
2012-05-13 01:12:22 -07:00
|
|
|
Initial sharemap:
|
2012-04-01 01:55:19 -04:00
|
|
|
0:[A] 1:[A] 2:[A] 3:[A,B,C,D,E]
|
|
|
|
4 good shares, but 5 good hosts
|
|
|
|
After deleting all instances of share #3 and repairing:
|
2013-06-17 13:38:49 -04:00
|
|
|
0:[A], 1:[A,B], 2:[C,A], 3:[E]
|
2017-02-06 14:16:18 -07:00
|
|
|
# actually: {0: ['E', 'A'], 1: ['C', 'A'], 2: ['A', 'B'], 3: ['D']}
|
2013-06-17 13:38:49 -04:00
|
|
|
Still 4 good shares but now 4 good hosts
|
2012-04-01 01:55:19 -04:00
|
|
|
"""
|
|
|
|
d.addCallback(_check_and_repair)
|
2012-04-01 19:31:53 -04:00
|
|
|
d.addCallback(_check_counts, 4, 5)
|
2012-04-01 01:55:19 -04:00
|
|
|
d.addCallback(lambda _: self.delete_shares_numbered(self.uri, [3]))
|
|
|
|
d.addCallback(_check_and_repair)
|
2017-02-14 16:36:57 -07:00
|
|
|
|
|
|
|
# it can happen that our uploader will choose, e.g., to upload
|
|
|
|
# to servers B, C, D, E .. which will mean that all 5 serves
|
|
|
|
# now contain our shares (and thus "respond").
|
|
|
|
|
|
|
|
def _check_happy(crr):
|
|
|
|
prr = crr.get_post_repair_results()
|
|
|
|
self.assertTrue(prr.get_host_counter_good_shares() >= 4)
|
|
|
|
return crr
|
|
|
|
d.addCallback(_check_happy)
|
2017-02-06 14:16:18 -07:00
|
|
|
d.addCallback(lambda _: all([self.g.break_server(sid)
|
|
|
|
for sid in self.g.get_all_serverids()]))
|
2012-04-01 19:31:53 -04:00
|
|
|
d.addCallback(_check_and_repair)
|
|
|
|
d.addCallback(_check_counts, 0, 0)
|
2012-04-01 01:55:19 -04:00
|
|
|
return d
|
|
|
|
|
checker: don't let failures in add-lease affect checker results. Closes #875.
Mutable servermap updates and the immutable checker, when run with
add_lease=True, send both the do-you-have-block and add-lease commands in
parallel, to avoid an extra round trip time. Many older servers have problems
with add-lease and raise various exceptions, which don't generally matter.
The client-side code was catching+ignoring some of them, but unrecognized
exceptions were passed through to the DYHB code, concealing the DYHB results
from the checker, making it think the server had no shares.
The fix is to separate the code paths. Both commands are sent at the same
time, but the errback path from add-lease is handled separately. Known
exceptions are ignored, the others (both unknown-remote and all-local) are
logged (log.WEIRD, which will trigger an Incident), but neither will affect
the DYHB results.
The add-lease message is sent first, and we know that the server handles them
synchronously. So when the checker is done, we can be sure that all the
add-lease messages have been retired. This makes life easier for unit tests.
2009-12-29 15:01:08 -08:00
|
|
|
class AddLease(GridTestMixin, unittest.TestCase):
|
|
|
|
# test for #875, in which failures in the add-lease call cause
|
|
|
|
# false-negatives in the checker
|
|
|
|
|
|
|
|
def test_875(self):
|
|
|
|
self.basedir = "checker/AddLease/875"
|
|
|
|
self.set_up_grid(num_servers=1)
|
|
|
|
c0 = self.g.clients[0]
|
2014-04-21 22:40:28 +01:00
|
|
|
c0.encoding_params['happy'] = 1
|
checker: don't let failures in add-lease affect checker results. Closes #875.
Mutable servermap updates and the immutable checker, when run with
add_lease=True, send both the do-you-have-block and add-lease commands in
parallel, to avoid an extra round trip time. Many older servers have problems
with add-lease and raise various exceptions, which don't generally matter.
The client-side code was catching+ignoring some of them, but unrecognized
exceptions were passed through to the DYHB code, concealing the DYHB results
from the checker, making it think the server had no shares.
The fix is to separate the code paths. Both commands are sent at the same
time, but the errback path from add-lease is handled separately. Known
exceptions are ignored, the others (both unknown-remote and all-local) are
logged (log.WEIRD, which will trigger an Incident), but neither will affect
the DYHB results.
The add-lease message is sent first, and we know that the server handles them
synchronously. So when the checker is done, we can be sure that all the
add-lease messages have been retired. This makes life easier for unit tests.
2009-12-29 15:01:08 -08:00
|
|
|
self.uris = {}
|
|
|
|
DATA = "data" * 100
|
|
|
|
d = c0.upload(Data(DATA, convergence=""))
|
|
|
|
def _stash_immutable(ur):
|
2012-05-21 21:14:44 -07:00
|
|
|
self.imm = c0.create_node_from_uri(ur.get_uri())
|
checker: don't let failures in add-lease affect checker results. Closes #875.
Mutable servermap updates and the immutable checker, when run with
add_lease=True, send both the do-you-have-block and add-lease commands in
parallel, to avoid an extra round trip time. Many older servers have problems
with add-lease and raise various exceptions, which don't generally matter.
The client-side code was catching+ignoring some of them, but unrecognized
exceptions were passed through to the DYHB code, concealing the DYHB results
from the checker, making it think the server had no shares.
The fix is to separate the code paths. Both commands are sent at the same
time, but the errback path from add-lease is handled separately. Known
exceptions are ignored, the others (both unknown-remote and all-local) are
logged (log.WEIRD, which will trigger an Incident), but neither will affect
the DYHB results.
The add-lease message is sent first, and we know that the server handles them
synchronously. So when the checker is done, we can be sure that all the
add-lease messages have been retired. This makes life easier for unit tests.
2009-12-29 15:01:08 -08:00
|
|
|
d.addCallback(_stash_immutable)
|
2011-08-06 17:44:59 -07:00
|
|
|
d.addCallback(lambda ign:
|
|
|
|
c0.create_mutable_file(MutableData("contents")))
|
checker: don't let failures in add-lease affect checker results. Closes #875.
Mutable servermap updates and the immutable checker, when run with
add_lease=True, send both the do-you-have-block and add-lease commands in
parallel, to avoid an extra round trip time. Many older servers have problems
with add-lease and raise various exceptions, which don't generally matter.
The client-side code was catching+ignoring some of them, but unrecognized
exceptions were passed through to the DYHB code, concealing the DYHB results
from the checker, making it think the server had no shares.
The fix is to separate the code paths. Both commands are sent at the same
time, but the errback path from add-lease is handled separately. Known
exceptions are ignored, the others (both unknown-remote and all-local) are
logged (log.WEIRD, which will trigger an Incident), but neither will affect
the DYHB results.
The add-lease message is sent first, and we know that the server handles them
synchronously. So when the checker is done, we can be sure that all the
add-lease messages have been retired. This makes life easier for unit tests.
2009-12-29 15:01:08 -08:00
|
|
|
def _stash_mutable(node):
|
|
|
|
self.mut = node
|
|
|
|
d.addCallback(_stash_mutable)
|
|
|
|
|
|
|
|
def _check_cr(cr, which):
|
|
|
|
self.failUnless(cr.is_healthy(), which)
|
|
|
|
|
|
|
|
# these two should work normally
|
|
|
|
d.addCallback(lambda ign: self.imm.check(Monitor(), add_lease=True))
|
|
|
|
d.addCallback(_check_cr, "immutable-normal")
|
|
|
|
d.addCallback(lambda ign: self.mut.check(Monitor(), add_lease=True))
|
|
|
|
d.addCallback(_check_cr, "mutable-normal")
|
|
|
|
|
|
|
|
really_did_break = []
|
|
|
|
# now break the server's remote_add_lease call
|
|
|
|
def _break_add_lease(ign):
|
|
|
|
def broken_add_lease(*args, **kwargs):
|
|
|
|
really_did_break.append(1)
|
|
|
|
raise KeyError("intentional failure, should be ignored")
|
|
|
|
assert self.g.servers_by_number[0].remote_add_lease
|
|
|
|
self.g.servers_by_number[0].remote_add_lease = broken_add_lease
|
|
|
|
d.addCallback(_break_add_lease)
|
|
|
|
|
|
|
|
# and confirm that the files still look healthy
|
|
|
|
d.addCallback(lambda ign: self.mut.check(Monitor(), add_lease=True))
|
|
|
|
d.addCallback(_check_cr, "mutable-broken")
|
|
|
|
d.addCallback(lambda ign: self.imm.check(Monitor(), add_lease=True))
|
|
|
|
d.addCallback(_check_cr, "immutable-broken")
|
|
|
|
|
|
|
|
d.addCallback(lambda ign: self.failUnless(really_did_break))
|
|
|
|
return d
|
2011-08-01 23:37:03 -07:00
|
|
|
|
|
|
|
class CounterHolder(object):
|
|
|
|
def __init__(self):
|
|
|
|
self._num_active_block_fetches = 0
|
|
|
|
self._max_active_block_fetches = 0
|
|
|
|
|
|
|
|
from allmydata.immutable.checker import ValidatedReadBucketProxy
|
|
|
|
class MockVRBP(ValidatedReadBucketProxy):
|
|
|
|
def __init__(self, sharenum, bucket, share_hash_tree, num_blocks, block_size, share_size, counterholder):
|
|
|
|
ValidatedReadBucketProxy.__init__(self, sharenum, bucket,
|
|
|
|
share_hash_tree, num_blocks,
|
|
|
|
block_size, share_size)
|
|
|
|
self.counterholder = counterholder
|
|
|
|
|
|
|
|
def get_block(self, blocknum):
|
|
|
|
self.counterholder._num_active_block_fetches += 1
|
|
|
|
if self.counterholder._num_active_block_fetches > self.counterholder._max_active_block_fetches:
|
|
|
|
self.counterholder._max_active_block_fetches = self.counterholder._num_active_block_fetches
|
|
|
|
d = ValidatedReadBucketProxy.get_block(self, blocknum)
|
|
|
|
def _mark_no_longer_active(res):
|
|
|
|
self.counterholder._num_active_block_fetches -= 1
|
|
|
|
return res
|
|
|
|
d.addBoth(_mark_no_longer_active)
|
|
|
|
return d
|
|
|
|
|
|
|
|
class TooParallel(GridTestMixin, unittest.TestCase):
|
|
|
|
# bug #1395: immutable verifier was aggressively parallized, checking all
|
|
|
|
# blocks of all shares at the same time, blowing our memory budget and
|
|
|
|
# crashing with MemoryErrors on >1GB files.
|
|
|
|
|
|
|
|
def test_immutable(self):
|
|
|
|
import allmydata.immutable.checker
|
|
|
|
origVRBP = allmydata.immutable.checker.ValidatedReadBucketProxy
|
|
|
|
|
|
|
|
self.basedir = "checker/TooParallel/immutable"
|
|
|
|
|
|
|
|
# If any code asks to instantiate a ValidatedReadBucketProxy,
|
|
|
|
# we give them a MockVRBP which is configured to use our
|
|
|
|
# CounterHolder.
|
|
|
|
counterholder = CounterHolder()
|
|
|
|
def make_mock_VRBP(*args, **kwargs):
|
|
|
|
return MockVRBP(counterholder=counterholder, *args, **kwargs)
|
|
|
|
allmydata.immutable.checker.ValidatedReadBucketProxy = make_mock_VRBP
|
|
|
|
|
|
|
|
d = defer.succeed(None)
|
|
|
|
def _start(ign):
|
|
|
|
self.set_up_grid(num_servers=4)
|
|
|
|
self.c0 = self.g.clients[0]
|
2014-04-21 22:40:28 +01:00
|
|
|
self.c0.encoding_params = { "k": 1,
|
|
|
|
"happy": 4,
|
|
|
|
"n": 4,
|
|
|
|
"max_segment_size": 5,
|
|
|
|
}
|
2011-08-01 23:37:03 -07:00
|
|
|
self.uris = {}
|
|
|
|
DATA = "data" * 100 # 400/5 = 80 blocks
|
|
|
|
return self.c0.upload(Data(DATA, convergence=""))
|
|
|
|
d.addCallback(_start)
|
|
|
|
def _do_check(ur):
|
2012-05-21 21:14:44 -07:00
|
|
|
n = self.c0.create_node_from_uri(ur.get_uri())
|
2011-08-01 23:37:03 -07:00
|
|
|
return n.check(Monitor(), verify=True)
|
|
|
|
d.addCallback(_do_check)
|
|
|
|
def _check(cr):
|
|
|
|
# the verifier works on all 4 shares in parallel, but only
|
|
|
|
# fetches one block from each share at a time, so we expect to
|
|
|
|
# see 4 parallel fetches
|
|
|
|
self.failUnlessEqual(counterholder._max_active_block_fetches, 4)
|
|
|
|
d.addCallback(_check)
|
|
|
|
def _clean_up(res):
|
|
|
|
allmydata.immutable.checker.ValidatedReadBucketProxy = origVRBP
|
|
|
|
return res
|
|
|
|
d.addBoth(_clean_up)
|
|
|
|
return d
|