import time
import simplejson
from nevow import rend, tags as T, inevow
from allmydata.web.common import getxmlfile, abbreviate_time, get_arg
from allmydata.util.abbreviate import abbreviate_space


def remove_prefix(s, prefix):
    """Return 's' with the leading 'prefix' stripped off.

    Returns None (rather than 's' itself) when 's' does not start with
    'prefix'.
    """
    if not s.startswith(prefix):
        return None
    return s[len(prefix):]


def _maybe_count(d):
    """Format 'd' with "%d", or return "?" when it is None."""
    if d is None:
        return "?"
    return "%d" % d


class StorageStatus(rend.Page):
    """Nevow page showing the status of a storage server.

    The page is rendered from the "storage_status.xhtml" template. When the
    request carries t=json, a JSON dump of the server's stats and crawler
    states is returned instead of the HTML page.
    """

    docFactory = getxmlfile("storage_status.xhtml")
    # the default 'data' argument is the StorageServer instance

    def __init__(self, storage):
        """Remember 'storage' and hand it to rend.Page as the page data."""
        rend.Page.__init__(self, storage)
        self.storage = storage

    def renderHTTP(self, ctx):
        """Dispatch to render_JSON() for t=json, else render the template."""
        req = inevow.IRequest(ctx)
        t = get_arg(req, "t")
        if t == "json":
            return self.render_JSON(req)
        return rend.Page.renderHTTP(self, ctx)

    def render_JSON(self, req):
        """Return the stats and both crawler states as a JSON string.

        The response content-type header is set to text/plain, and the
        returned text ends with a newline.
        """
        req.setHeader("content-type", "text/plain")
        d = {"stats": self.storage.get_stats(),
             "bucket-counter": self.storage.bucket_counter.get_state(),
             "lease-checker": self.storage.lease_checker.get_state(),
             }
        return simplejson.dumps(d, indent=1) + "\n"

    def render_storage_running(self, ctx, storage):
        """Return the template tag as-is if 'storage' is true, otherwise an
        <h1> saying that no storage server is running."""
        if storage:
            return ctx.tag
        return T.h1["No Storage Server Running"]

    def render_bool(self, ctx, data):
        """Render the truth value of 'data' as "Yes" or "No"."""
        return {True: "Yes", False: "No"}[bool(data)]

    def render_abbrev_space(self, ctx, size):
        """Render 'size' through abbreviate_space(), or "?" if it is None."""
        if size is None:
            return "?"
        return abbreviate_space(size)

    def render_space(self, ctx, size):
        """Render 'size' as a plain integer, or "?" if it is None."""
        return _maybe_count(size)

    def data_stats(self, ctx, data):
        """Return the server stats as a dict keyed without the
        "storage_server." prefix.

        The disk-space keys the template looks up are always present; they
        are set to None when the server did not report them.
        """
        # FYI: 'data' appears to be self, rather than the StorageServer
        # object in self.original that gets passed to render_* methods. I
        # still don't understand Nevow.

        # Nevow has nevow.accessors.DictionaryContainer: Any data= directive
        # that appears in a context in which the current data is a dictionary
        # will be looked up as keys in that dictionary. So if data_stats()
        # returns a dictionary, then a template element nested inside the one
        # bound to "stats" can name a key such as "disk_total" in its own
        # data= directive to use get_stats()["storage_server.disk_total"] .
        # However, DictionaryContainer does a raw d[] instead of d.get(), so
        # any missing keys will cause an error, even if the renderer can
        # tolerate None values. To overcome this, we either need a dict-like
        # object that always returns None for unknown keys, or we must
        # pre-populate our dict with those missing keys, or we should get rid
        # of data_ methods that return dicts (or find some way to override
        # Nevow's handling of dictionaries).

        d = {}
        for k, v in self.storage.get_stats().items():
            short = remove_prefix(k, "storage_server.")
            # Keys without the prefix would all collapse onto the single key
            # None (last one wins); skip them instead.
            if short is not None:
                d[short] = v
        for name in ("disk_total",
                     "disk_used",
                     "disk_free_for_root",
                     "disk_free_for_nonroot",
                     "reserved_space",
                     "disk_avail"):
            d.setdefault(name, None)
        return d

    def data_last_complete_bucket_count(self, ctx, data):
        """Return the bucket counter's "last-complete-bucket-count" state
        value, or "Not computed yet" when it is absent or None."""
        s = self.storage.bucket_counter.get_state()
        count = s.get("last-complete-bucket-count")
        if count is None:
            return "Not computed yet"
        return count

    def render_count_crawler_status(self, ctx, storage):
        """Fill the tag with the bucket counter's crawl progress."""
        p = self.storage.bucket_counter.get_progress()
        return ctx.tag[self.format_crawler_progress(p)]

    def format_crawler_progress(self, p):
        """Turn a crawler progress dict into a list of display strings.

        'p' must contain "estimated-time-per-cycle" and "cycle-in-progress".
        When a cycle is in progress it must also contain
        "cycle-complete-percentage", "remaining-sleep-time" and
        "estimated-cycle-complete-time-left"; otherwise it must contain
        "remaining-wait-time". Estimates that are None are left out of the
        output.
        """
        cycletime = p["estimated-time-per-cycle"]
        cycletime_s = ""
        if cycletime is not None:
            cycletime_s = (" (estimated cycle time %s)"
                           % abbreviate_time(cycletime))

        if p["cycle-in-progress"]:
            pct = p["cycle-complete-percentage"]
            soon = p["remaining-sleep-time"]

            eta = p["estimated-cycle-complete-time-left"]
            eta_s = ""
            if eta is not None:
                eta_s = " (ETA %ds)" % eta

            return ["Current crawl %.1f%% complete" % pct,
                    eta_s,
                    " (next work in %s)" % abbreviate_time(soon),
                    cycletime_s,
                    ]
        else:
            soon = p["remaining-wait-time"]
            return ["Next crawl in %s" % abbreviate_time(soon),
                    cycletime_s]

    def render_lease_expiration_enabled(self, ctx, data):
        """Fill the tag with whether the lease checker removes expired
        leases or only scans."""
        lc = self.storage.lease_checker
        if lc.expiration_enabled:
            return ctx.tag["Enabled: expired leases will be removed"]
        else:
            return ctx.tag["Disabled: scan-only mode, no leases will be removed"]

    def render_lease_expiration_mode(self, ctx, data):
        """Fill the tag with a description of the lease checker's mode.

        lease_checker.mode is indexed as a pair: mode[0] is either "age"
        (mode[1] is formatted with abbreviate_time()) or "date-cutoff"
        (mode[1] is passed to time.gmtime() and shown as a UTC date).
        """
        mode = self.storage.lease_checker.mode
        if mode[0] == "age":
            return ctx.tag["leases created or last renewed more than %s ago "
                           "will be considered expired"
                           % abbreviate_time(mode[1])]
        else:
            # internal invariant: only two modes are handled here
            assert mode[0] == "date-cutoff"
            date = time.strftime("%d-%b-%Y", time.gmtime(mode[1]))
            return ctx.tag["leases created or last renewed before %s "
                           "will be considered expired" % date]

    def format_recovered(self, sr, a):
        """Summarize one category of a space-recovered dict as a string.

        'sr' is indexed with "<a>-diskbytes", "<a>-numshares" and
        "<a>-numbuckets". Share and bucket counts that are None are shown
        as "?".
        """
        space = abbreviate_space(sr["%s-diskbytes" % a])
        return "%s shares, %s buckets, %s" % (
            _maybe_count(sr["%s-numshares" % a]),
            _maybe_count(sr["%s-numbuckets" % a]),
            space)

    def _format_corrupt_shares(self, corrupt_shares):
        """Return a <ul> holding one <li> per corrupt share.

        Each entry is a two-element sequence formatted with
        "SI %s shnum %d"; tuple() lets list-typed entries be formatted too.
        """
        return T.ul[[T.li["SI %s shnum %d" % tuple(corrupt_share)]
                     for corrupt_share in corrupt_shares]]

    def render_lease_current_cycle_progress(self, ctx, data):
        """Fill the tag with the lease checker's crawl progress."""
        lc = self.storage.lease_checker
        p = lc.get_progress()
        return ctx.tag[self.format_crawler_progress(p)]

    def render_lease_current_cycle_results(self, ctx, data):
        """Fill the tag with a bullet list describing the lease-checker
        cycle that is currently running.

        Returns "" when no cycle is in progress.
        """
        lc = self.storage.lease_checker
        progress = lc.get_progress()
        if not progress["cycle-in-progress"]:
            return ""
        s = lc.get_state()
        so_far = s["cycle-to-date"]
        sr = so_far["space-recovered"]
        er = s["estimated-remaining-cycle"]
        esr = er["space-recovered"]
        ec = s["estimated-current-cycle"]
        ecr = ec["space-recovered"]

        items = []

        def add(*pieces):
            # each call becomes one bullet of the list
            items.append(T.li[pieces])

        add("So far, this cycle has examined %d shares in %d buckets"
            % (so_far["shares-examined"], so_far["buckets-examined"]))
        add("and has recovered: ", self.format_recovered(sr, "actual"))
        if so_far["expiration-enabled"]:
            add("The remainder of this cycle is expected to recover: ",
                self.format_recovered(esr, "actual"))
            add("The whole cycle is expected to examine %s shares in %s buckets"
                % (_maybe_count(ec["shares-examined"]),
                   _maybe_count(ec["buckets-examined"])))
            add("and to recover: ", self.format_recovered(ecr, "actual"))
        else:
            add("If expiration were enabled, we would have recovered: ",
                self.format_recovered(sr, "configured-leasetimer"), " by now")
            add("and the remainder of this cycle would probably recover: ",
                self.format_recovered(esr, "configured-leasetimer"))
            add("and the whole cycle would probably recover: ",
                self.format_recovered(ecr, "configured-leasetimer"))

        add("if we were using each lease's default 31-day lease lifetime "
            "(instead of our configured node), "
            "this cycle would be expected to recover: ",
            self.format_recovered(ecr, "original-leasetimer"))

        if so_far["corrupt-shares"]:
            add("Corrupt shares:",
                self._format_corrupt_shares(so_far["corrupt-shares"]))

        return ctx.tag["Current cycle:", T.ul[items]]

    def render_lease_last_cycle_results(self, ctx, data):
        """Fill the tag with a summary of the most recent complete
        lease-checker cycle.

        Returns "" when the lease checker's history is empty. The most
        recent cycle is the history entry with the largest key.
        """
        lc = self.storage.lease_checker
        h = lc.get_state()["history"]
        if not h:
            return ""
        last = h[max(h.keys())]
        start, end = last["cycle-start-finish-times"]
        ctx.tag["Last complete cycle (which took %s and finished %s ago)"
                " recovered: " % (abbreviate_time(end-start),
                                  abbreviate_time(time.time() - end)),
                self.format_recovered(last["space-recovered"], "actual")
                ]

        items = []

        def add(*pieces):
            # each call becomes one bullet of the list
            items.append(T.li[pieces])

        if not last["expiration-enabled"]:
            rec = self.format_recovered(last["space-recovered"],
                                        "configured-leasetimer")
            add("but expiration was not enabled. If it had been, "
                "it would have recovered: ", rec)

        if last["corrupt-shares"]:
            add("Corrupt shares:",
                self._format_corrupt_shares(last["corrupt-shares"]))

        # Only attach the list when it has entries, so no empty <ul> is
        # emitted.
        if items:
            ctx.tag[T.ul[items]]
        return ctx.tag