2008-11-18 19:12:10 -07:00
|
|
|
|
|
|
|
import urllib
|
|
|
|
import simplejson
|
2009-02-17 17:15:11 -07:00
|
|
|
from twisted.protocols.basic import LineOnlyReceiver
|
2010-02-10 18:43:18 -08:00
|
|
|
from allmydata.scripts.common import get_alias, DEFAULT_ALIAS, escape_path, \
|
|
|
|
UnknownAliasError
|
2010-06-06 18:02:15 -07:00
|
|
|
from allmydata.scripts.common_http import do_http, format_http_error
|
2010-07-11 17:30:15 -07:00
|
|
|
from allmydata.util.encodingutil import quote_output, quote_path
|
2008-11-18 19:12:10 -07:00
|
|
|
|
|
|
|
class Checker:
    """Empty placeholder class; it defines no attributes or methods."""
|
|
|
|
|
2010-06-08 22:54:48 -07:00
|
|
|
def _quote_serverid_index_share(serverid, storage_index, sharenum):
    """Format one share location as a single human-readable string.

    The server id and storage index are passed through quote_output()
    without quote marks; the share number is rendered with %r.
    """
    quoted_server = quote_output(serverid, quotemarks=False)
    quoted_index = quote_output(storage_index, quotemarks=False)
    return "server %s, SI %s, shnum %r" % (quoted_server, quoted_index, sharenum)
|
|
|
|
|
2008-11-18 19:12:10 -07:00
|
|
|
def check(options):
    """Run a single-object check through the node's web API and report it.

    Builds a "?t=check&output=JSON" URL for the object named by
    options.where, appending verify/repair/add-lease flags as requested,
    POSTs it, and writes either the raw JSON (when the "raw" option is set)
    or a short text summary to options.stdout.

    Returns 0 on success. Returns 1 when the alias in options.where is
    unknown or when the HTTP response status is not 200; in both cases the
    error is written to options.stderr.
    """
    stdout = options.stdout
    stderr = options.stderr
    nodeurl = options['node-url']
    if not nodeurl.endswith("/"):
        nodeurl += "/"
    where = options.where
    try:
        rootcap, path = get_alias(options.aliases, where, DEFAULT_ALIAS)
    except UnknownAliasError as e:
        e.display(stderr)
        return 1
    if path == '/':
        path = ''
    url = nodeurl + "uri/%s" % urllib.quote(rootcap)
    if path:
        url += "/" + escape_path(path)
    # todo: should it end with a slash?
    url += "?t=check&output=JSON"
    if options["verify"]:
        url += "&verify=true"
    if options["repair"]:
        url += "&repair=true"
    if options["add-lease"]:
        url += "&add-lease=true"

    resp = do_http("POST", url)
    if resp.status != 200:
        print >>stderr, format_http_error("ERROR", resp)
        return 1
    jdata = resp.read()
    if options.get("raw"):
        # Raw mode: pass the response body through untouched.
        stdout.write(jdata)
        stdout.write("\n")
        return 0
    data = simplejson.loads(jdata)

    if options["repair"]:
        # show repair status
        cr = data["pre-repair-results"]["results"]
        if cr["healthy"]:
            summary = "healthy"
        else:
            summary = "not healthy"
        stdout.write("Summary: %s\n" % summary)
        # The detail lines use the same guards as the non-repair branch, so
        # results that omit the share counts or the corrupt-share list no
        # longer raise KeyError here.
        _write_check_details(stdout, data, cr)
        if data["repair-attempted"]:
            if data["repair-successful"]:
                stdout.write(" repair successful\n")
            else:
                stdout.write(" repair failed\n")
    else:
        # LIT files and directories do not have a "summary" field.
        summary = data.get("summary", "Healthy (LIT)")
        stdout.write("Summary: %s\n" % quote_output(summary, quotemarks=False))
        cr = data["results"]
        _write_check_details(stdout, data, cr)
    return 0


def _write_check_details(stdout, data, cr):
    """Write the storage index, share counts and corrupt shares for a result.

    `data` is the decoded JSON response (its "storage-index" entry is
    printed) and `cr` is the "results" dictionary being reported. The two
    share-count lines are written only when all four count fields are
    present in `cr`; a missing "list-corrupt-shares" entry is treated as an
    empty list.
    """
    stdout.write(" storage index: %s\n" % quote_output(data["storage-index"], quotemarks=False))
    count_fields = ("count-shares-good", "count-shares-needed",
                    "count-shares-expected", "count-wrong-shares")
    if all([field in cr for field in count_fields]):
        stdout.write(" good-shares: %r (encoding is %r-of-%r)\n"
                     % (cr["count-shares-good"],
                        cr["count-shares-needed"],
                        cr["count-shares-expected"]))
        stdout.write(" wrong-shares: %r\n" % cr["count-wrong-shares"])
    corrupt = cr.get("list-corrupt-shares", [])
    if corrupt:
        stdout.write(" corrupt shares:\n")
        for (serverid, storage_index, sharenum) in corrupt:
            stdout.write(" %s\n" % _quote_serverid_index_share(serverid, storage_index, sharenum))
|
|
|
|
|
|
|
|
|
2009-02-17 17:15:11 -07:00
|
|
|
class FakeTransport:
    """Minimal stand-in assigned as the `transport` of the output receivers.

    It carries only the `disconnecting` flag, fixed at False.
    NOTE(review): presumably LineOnlyReceiver consults
    `transport.disconnecting` while splitting data into lines -- confirm
    against the Twisted version in use.
    """

    disconnecting = False
|
|
|
|
|
|
|
|
class DeepCheckOutput(LineOnlyReceiver):
    """Turn the newline-delimited stream of a deep-check into text output.

    Each received line is either an "ERROR:" marker (after which every
    further line is copied to stderr) or a JSON unit. Units of type "file"
    or "directory" are counted and tallied as healthy or unhealthy.
    """

    delimiter = "\n"

    def __init__(self, streamer, options):
        """Remember the owning streamer and the output settings.

        `streamer` has its `rc` attribute set to 1 when an error line is
        seen. `options` supplies "verbose", `stdout` and `stderr`.
        """
        # There is no real connection behind this receiver.
        self.transport = FakeTransport()
        self.streamer = streamer
        self.stdout = options.stdout
        self.stderr = options.stderr
        self.verbose = bool(options["verbose"])
        self.in_error = False
        self.num_objects = 0
        self.files_healthy = 0
        self.files_unhealthy = 0

    def lineReceived(self, line):
        """Handle one line of the stream: an error line or one JSON unit."""
        if not self.in_error and line.startswith("ERROR:"):
            # First error line: switch to error mode and flag the failure.
            self.in_error = True
            self.streamer.rc = 1
        if self.in_error:
            # From the error marker on, lines are only echoed to stderr.
            print >>self.stderr, quote_output(line, quotemarks=False)
            return

        unit = simplejson.loads(line)
        if unit["type"] not in ("file", "directory"):
            return
        out = self.stdout
        self.num_objects += 1
        # non-verbose means print a progress marker every 100 files
        if not self.num_objects % 100:
            print >>out, "%d objects checked.." % self.num_objects

        check_results = unit["check-results"]
        results = check_results["results"]
        if results["healthy"]:
            self.files_healthy += 1
        else:
            self.files_unhealthy += 1

        if self.verbose:
            # verbose means also print one line per file
            path = unit["path"] or ["<root>"]
            # LIT files and directories do not have a "summary" field.
            summary = check_results.get("summary", "Healthy (LIT)")
            print >>out, "%s: %s" % (quote_path(path), quote_output(summary, quotemarks=False))

        # always print out corrupt shares
        for (serverid, storage_index, sharenum) in results.get("list-corrupt-shares", []):
            print >>out, " corrupt: %s" % _quote_serverid_index_share(serverid, storage_index, sharenum)

    def done(self):
        """Print the final tally, unless the stream ended in an error."""
        if not self.in_error:
            totals = (self.num_objects, self.files_healthy, self.files_unhealthy)
            print >>self.stdout, "done: %d objects checked, %d healthy, %d unhealthy" % totals
|
|
|
|
|
|
|
|
class DeepCheckAndRepairOutput(LineOnlyReceiver):
    """Turn the newline-delimited stream of a deep-check with repair into text.

    Each received line is either an "ERROR:" marker (after which every
    further line is copied to stderr) or a JSON unit. Units of type "file"
    or "directory" are counted, with separate pre-repair and post-repair
    health tallies and counts of attempted and successful repairs.
    """

    delimiter = "\n"

    def __init__(self, streamer, options):
        """Remember the owning streamer and the output settings.

        `streamer` has its `rc` attribute set to 1 when an error line is
        seen. `options` supplies "verbose", `stdout` and `stderr`.
        """
        # There is no real connection behind this receiver.
        self.transport = FakeTransport()
        self.streamer = streamer
        self.stdout = options.stdout
        self.stderr = options.stderr
        self.verbose = bool(options["verbose"])
        self.in_error = False
        self.num_objects = 0
        self.pre_repair_files_healthy = 0
        self.pre_repair_files_unhealthy = 0
        self.repairs_attempted = 0
        self.repairs_successful = 0
        self.post_repair_files_healthy = 0
        self.post_repair_files_unhealthy = 0

    def lineReceived(self, line):
        """Handle one line of the stream: an error line or one JSON unit."""
        if not self.in_error and line.startswith("ERROR:"):
            # First error line: switch to error mode and flag the failure.
            self.in_error = True
            self.streamer.rc = 1
        if self.in_error:
            # From the error marker on, lines are only echoed to stderr.
            print >>self.stderr, quote_output(line, quotemarks=False)
            return

        unit = simplejson.loads(line)
        if unit["type"] not in ("file", "directory"):
            return
        out = self.stdout
        self.num_objects += 1
        # non-verbose means print a progress marker every 100 files
        if not self.num_objects % 100:
            print >>out, "%d objects checked.." % self.num_objects

        crr = unit["check-and-repair-results"]
        if unit["storage-index"]:
            was_healthy = bool(crr["pre-repair-results"]["results"]["healthy"])
            if was_healthy:
                self.pre_repair_files_healthy += 1
            else:
                self.pre_repair_files_unhealthy += 1
            if crr["post-repair-results"]["results"]["healthy"]:
                self.post_repair_files_healthy += 1
            else:
                self.post_repair_files_unhealthy += 1
        else:
            # LIT file
            was_healthy = True
            self.pre_repair_files_healthy += 1
            self.post_repair_files_healthy += 1

        # "repair-successful" is only looked at when a repair was attempted.
        attempted = crr["repair-attempted"]
        succeeded = attempted and crr["repair-successful"]
        if attempted:
            self.repairs_attempted += 1
            if succeeded:
                self.repairs_successful += 1

        if self.verbose:
            # verbose means also print one line per file
            path = unit["path"] or ["<root>"]
            # we don't seem to have a summary available, so build one
            summary = "healthy" if was_healthy else "not healthy"
            print >>out, "%s: %s" % (quote_path(path), summary)

        # always print out corrupt shares
        pre_repair = crr.get("pre-repair-results", {})
        corrupt_shares = pre_repair.get("results", {}).get("list-corrupt-shares", [])
        for (serverid, storage_index, sharenum) in corrupt_shares:
            print >>out, " corrupt: %s" % _quote_serverid_index_share(serverid, storage_index, sharenum)

        # always print out repairs
        if attempted:
            if succeeded:
                print >>out, " repair successful"
            else:
                print >>out, " repair failed"

    def done(self):
        """Print the final tallies, unless the stream ended in an error."""
        if self.in_error:
            return
        out = self.stdout
        repairs_failed = self.repairs_attempted - self.repairs_successful
        print >>out, "done: %d objects checked" % self.num_objects
        print >>out, " pre-repair: %d healthy, %d unhealthy" % (
            self.pre_repair_files_healthy, self.pre_repair_files_unhealthy)
        print >>out, " %d repairs attempted, %d successful, %d failed" % (
            self.repairs_attempted, self.repairs_successful, repairs_failed)
        print >>out, " post-repair: %d healthy, %d unhealthy" % (
            self.post_repair_files_healthy, self.post_repair_files_unhealthy)
|
|
|
|
|
|
|
|
class DeepCheckStreamer(LineOnlyReceiver):
    """Issue a streaming deep-check request and feed the reply to a renderer."""

    def run(self, options):
        """Perform the deep-check described by `options`.

        Builds a "?t=stream-deep-check" URL for the object named by
        options.where, appending verify/repair/add-lease flags as requested,
        and POSTs it. The response is read in small chunks and either copied
        to options.stdout unchanged (when the "raw" option is set) or passed
        to a DeepCheckOutput / DeepCheckAndRepairOutput instance, which
        splits it into lines and prints a report.

        Returns 1 when the alias is unknown or the HTTP status is neither
        200 nor 302. Otherwise returns self.rc, which starts at 0 and is set
        to 1 by the output object when the stream contains an error line.
        """
        stdout = options.stdout
        stderr = options.stderr
        self.rc = 0
        self.options = options
        nodeurl = options['node-url']
        if not nodeurl.endswith("/"):
            nodeurl += "/"
        self.nodeurl = nodeurl
        where = options.where
        try:
            rootcap, path = get_alias(options.aliases, where, DEFAULT_ALIAS)
        except UnknownAliasError as e:
            e.display(stderr)
            return 1
        if path == '/':
            path = ''
        url = nodeurl + "uri/%s" % urllib.quote(rootcap)
        if path:
            url += "/" + escape_path(path)
        # todo: should it end with a slash?
        url += "?t=stream-deep-check"
        if options["verify"]:
            url += "&verify=true"
        if options["repair"]:
            url += "&repair=true"
            output = DeepCheckAndRepairOutput(self, options)
        else:
            output = DeepCheckOutput(self, options)
        if options["add-lease"]:
            url += "&add-lease=true"
        resp = do_http("POST", url)
        if resp.status not in (200, 302):
            print >>stderr, format_http_error("ERROR", resp)
            return 1

        # Read the flag once, the same way check() does: a missing "raw"
        # option is treated as "not raw" instead of raising KeyError.
        raw = options.get("raw")

        # use Twisted to split this into lines
        while True:
            chunk = resp.read(100)
            if not chunk:
                break
            if raw:
                stdout.write(chunk)
            else:
                output.dataReceived(chunk)
        if not raw:
            output.done()
        return self.rc
|
2008-11-18 19:12:10 -07:00
|
|
|
|
|
|
|
def deepcheck(options):
    """Run a deep-check with a fresh DeepCheckStreamer and return its result."""
    streamer = DeepCheckStreamer()
    return streamer.run(options)
|