tahoe-lafs/benchmarks/conftest.py


"""
pytest infrastructure for benchmarks.

The number of nodes is parameterized via a --number-of-nodes CLI option added
to pytest.
"""
import os
from shutil import which, rmtree
from tempfile import mkdtemp
from contextlib import contextmanager
from time import time

import pytest
import pytest_twisted

from twisted.internet import reactor
from twisted.internet.defer import DeferredList, succeed

from allmydata.util.iputil import allocate_tcp_port

from integration.grid import Client, create_grid, create_flog_gatherer


def pytest_addoption(parser):
    parser.addoption(
        "--number-of-nodes",
        action="append",
        default=[],
        type=int,
        help="list of number_of_nodes to benchmark against",
    )
    # Required to be compatible with integration.util code that we indirectly
    # depend on, but also might be useful.
    parser.addoption(
        "--force-foolscap",
        action="store_true",
        default=False,
        dest="force_foolscap",
        help=(
            "If set, force Foolscap only for the storage protocol. "
            + "Otherwise HTTP will be used."
        ),
    )
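
# Illustrative invocation (the paths and values here are examples, not taken
# from this file): because --number-of-nodes uses action="append", it can be
# passed several times to benchmark against grids of different sizes, e.g.
#
#     pytest benchmarks/ --number-of-nodes=3 --number-of-nodes=5
#
# which parameterizes each benchmark over a 3-node and a 5-node grid; adding
# --force-foolscap switches the storage protocol from HTTP to Foolscap.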


def pytest_generate_tests(metafunc):
    # Make number_of_nodes accessible as a parameterized fixture:
    if "number_of_nodes" in metafunc.fixturenames:
        metafunc.parametrize(
            "number_of_nodes",
            metafunc.config.getoption("number_of_nodes"),
            scope="session",
        )


def port_allocator():
    port = allocate_tcp_port()
    return succeed(port)


@pytest.fixture(scope="session")
def grid(request):
    """
    Provides a new Grid with a single Introducer and flog-gathering process.

    Notably does _not_ provide storage servers; use the storage_nodes
    fixture if your tests need a Grid that can be used for puts / gets.
    """
    tmp_path = mkdtemp(prefix="tahoe-benchmark")
    request.addfinalizer(lambda: rmtree(tmp_path))
    flog_binary = which("flogtool")
    flog_gatherer = pytest_twisted.blockon(
        create_flog_gatherer(reactor, request, tmp_path, flog_binary)
    )
    g = pytest_twisted.blockon(
        create_grid(reactor, request, tmp_path, flog_gatherer, port_allocator)
    )
    return g


@pytest.fixture(scope="session")
def storage_nodes(grid, number_of_nodes):
    nodes_d = []
    for _ in range(number_of_nodes):
        nodes_d.append(grid.add_storage_node())

    nodes_status = pytest_twisted.blockon(DeferredList(nodes_d))
    for ok, value in nodes_status:
        assert ok, "Storage node creation failed: {}".format(value)
    return grid.storage_servers


@pytest.fixture(scope="session")
def client_node(request, grid, storage_nodes, number_of_nodes) -> Client:
    """
    Create a grid client node with number of shares matching number of nodes.
    """
    client_node = pytest_twisted.blockon(
        grid.add_client(
            "client_node",
            needed=number_of_nodes,
            happy=number_of_nodes,
            total=number_of_nodes,
        )
    )
    print(f"Client node pid: {client_node.process.transport.pid}")
    return client_node
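
# Note on the parameters above (background knowledge, not stated in this file):
# needed/happy/total correspond to Tahoe's erasure-coding settings, i.e. the
# client produces `total` shares, needs `needed` of them to reconstruct a file,
# and requires placement on at least `happy` distinct servers. Setting all
# three to number_of_nodes means every storage node must end up holding a share.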


def get_cpu_time_for_cgroup():
    """
    Get how many CPU seconds have been used in current cgroup so far.

    Assumes we're running in a v2 cgroup.
    """
    with open("/proc/self/cgroup") as f:
        cgroup = f.read().strip().split(":")[-1]
    assert cgroup.startswith("/")
    cgroup = cgroup[1:]
    cpu_stat = os.path.join("/sys/fs/cgroup", cgroup, "cpu.stat")
    with open(cpu_stat) as f:
        for line in f.read().splitlines():
            if line.startswith("usage_usec"):
                return int(line.split()[1]) / 1_000_000
    raise ValueError("Failed to find usage_usec")
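
# Worked example (values are hypothetical, for illustration only): on a
# cgroup-v2 host, /proc/self/cgroup usually contains a single line such as
#
#     0::/system.slice/benchmark.scope
#
# so the function above reads
# /sys/fs/cgroup/system.slice/benchmark.scope/cpu.stat, and a
# "usage_usec 2500000" entry there is reported as 2.5 CPU-seconds.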


class Benchmarker:
    """Keep track of benchmarking results."""

    @contextmanager
    def record(self, capsys: pytest.CaptureFixture[str], name, **parameters):
        """Record the timing of running some code, if it succeeds."""
        start_cpu = get_cpu_time_for_cgroup()
        start = time()
        yield
        elapsed = time() - start
        end_cpu = get_cpu_time_for_cgroup()
        elapsed_cpu = end_cpu - start_cpu
        # For now we just print the outcome:
        parameters = " ".join(f"{k}={v}" for (k, v) in parameters.items())
        with capsys.disabled():
            print(
                f"\nBENCHMARK RESULT: {name} {parameters} elapsed={elapsed:.3} (secs) CPU={elapsed_cpu:.3} (secs)\n"
            )


@pytest.fixture(scope="session")
def tahoe_benchmarker():
    return Benchmarker()
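

# Hypothetical usage sketch (not part of this conftest): a benchmark module in
# this directory could combine the fixtures above roughly like this, where
# upload_some_data() stands in for whatever operation is being measured:
#
#     def test_upload(client_node, tahoe_benchmarker, capsys, number_of_nodes):
#         with tahoe_benchmarker.record(capsys, "upload", nodes=number_of_nodes):
#             upload_some_data(client_node)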