Move parameter definitions to their own module, away from test implementation

2025-06-19 07:48:11 +00:00 · 2023-01-17 10:59:00 -05:00
parent f6555381a9
commit e53f68f4d7
2 changed files with 99 additions and 75 deletions
--- a/integration/test_vectors.py
+++ b/integration/test_vectors.py
@ -5,7 +5,6 @@ Verify certain results against test vectors with well-known results.
 from __future__ import annotations
 from typing import AsyncGenerator, Iterator
 from hashlib import sha256
 from itertools import starmap, product
 from yaml import safe_dump
@ -17,76 +16,10 @@ from pytest_twisted import ensureDeferred
 from twisted.python.filepath import FilePath
 from . import vectors
-from .util import CHK, SSK, reconfigure, upload, TahoeProcess
+from .vectors import parameters
 from .util import reconfigure, upload, TahoeProcess
-def digest(bs: bytes) -> bytes:
+@mark.parametrize('convergence', parameters.CONVERGENCE_SECRETS)
    """
    Digest bytes to bytes.
    """
    return sha256(bs).digest()
 def hexdigest(bs: bytes) -> str:
    """
    Digest bytes to text.
    """
    return sha256(bs).hexdigest()
 # Just a couple convergence secrets.  The only thing we do with this value is
 # feed it into a tagged hash.  It certainly makes a difference to the output
 # but the hash should destroy any structure in the input so it doesn't seem
 # like there's a reason to test a lot of different values.
 CONVERGENCE_SECRETS = [
    b"aaaaaaaaaaaaaaaa",
    digest(b"Hello world")[:16],
 ]
 # Exercise at least a handful of different sizes, trying to cover:
 #
 #  1. Some cases smaller than one "segment" (128k).
 #     This covers shrinking of some parameters to match data size.
 #     This includes one case of the smallest possible CHK.
 #
 #  2. Some cases right on the edges of integer segment multiples.
 #     Because boundaries are tricky.
 #
 #  4. Some cases that involve quite a few segments.
 #     This exercises merkle tree construction more thoroughly.
 #
 # See ``stretch`` for construction of the actual test data.
 SEGMENT_SIZE = 128 * 1024
 OBJECT_DESCRIPTIONS = [
    # The smallest possible.  55 bytes and smaller are LIT.
    vectors.Sample(b"a", 56),
    vectors.Sample(b"a", 1024),
    vectors.Sample(b"c", 4096),
    vectors.Sample(digest(b"foo"), SEGMENT_SIZE - 1),
    vectors.Sample(digest(b"bar"), SEGMENT_SIZE + 1),
    vectors.Sample(digest(b"baz"), SEGMENT_SIZE * 16 - 1),
    vectors.Sample(digest(b"quux"), SEGMENT_SIZE * 16 + 1),
    vectors.Sample(digest(b"foobar"), SEGMENT_SIZE * 64 - 1),
    vectors.Sample(digest(b"barbaz"), SEGMENT_SIZE * 64 + 1),
 ]
 ZFEC_PARAMS = [
    vectors.SeedParam(1, 1),
    vectors.SeedParam(1, 3),
    vectors.SeedParam(2, 3),
    vectors.SeedParam(3, 10),
    vectors.SeedParam(71, 255),
    vectors.SeedParam(101, vectors.MAX_SHARES),
 ]
 FORMATS = [
    CHK(),
    # These start out unaware of a key but various keys will be supplied
    # during generation.
    SSK(name="sdmf", key=None),
    SSK(name="mdmf", key=None),
 ]
@mark.parametrize('convergence', CONVERGENCE_SECRETS)
 def test_convergence(convergence):
    """
    Convergence secrets are 16 bytes.
@ -126,10 +59,10 @@ async def skiptest_generate(reactor, request, alice):
    ever-changing set of outputs.
    """
    space = starmap(vectors.Case, product(
-        ZFEC_PARAMS,
+        parameters.ZFEC_PARAMS,
-        CONVERGENCE_SECRETS,
+        parameters.CONVERGENCE_SECRETS,
-        OBJECT_DESCRIPTIONS,
+        parameters.OBJECT_DESCRIPTIONS,
-        FORMATS,
+        parameters.FORMATS,
    ))
    iterresults = generate(reactor, request, alice, space)
@ -157,7 +90,7 @@ def write_results(path: FilePath, results: list[tuple[vectors.Case, str]]) -> No
                    "length": case.seed_data.length,
                },
                "zfec": {
-                    "segmentSize": SEGMENT_SIZE,
+                    "segmentSize": parameters.SEGMENT_SIZE,
                    "required": case.params.required,
                    "total": case.params.total,
                },
--- a/integration/vectors/parameters.py
+++ b/integration/vectors/parameters.py
@ -0,0 +1,91 @@
 """
 Define input parameters for test vector generation.
 :ivar CONVERGENCE_SECRETS: Convergence secrets.
 :ivar SEGMENT_SIZE: The single segment size that the Python implementation
    currently supports without a lot of refactoring.
 :ivar OBJECT_DESCRIPTIONS: Small objects with instructions which can be
    expanded into a possibly large byte string.  These are intended to be used
    as plaintext inputs.
 :ivar ZFEC_PARAMS: Input parameters to ZFEC.
 :ivar FORMATS: Encoding/encryption formats.
 """
 from __future__ import annotations
 from hashlib import sha256
 from . import MAX_SHARES, Sample, SeedParam
 from ..util import CHK, SSK
 def digest(bs: bytes) -> bytes:
    """
    Hash ``bs`` with SHA-256 and return the raw (binary) digest.
    """
    hasher = sha256()
    hasher.update(bs)
    return hasher.digest()
 def hexdigest(bs: bytes) -> str:
    """
    Hash ``bs`` with SHA-256 and return the digest as hexadecimal text.
    """
    raw = sha256(bs).digest()
    return raw.hex()
 # Just a couple of convergence secrets.  The only thing we do with this value
 # is feed it into a tagged hash.  It certainly makes a difference to the
 # output, but the hash should destroy any structure in the input, so there
 # doesn't seem to be a reason to test a lot of different values.
 CONVERGENCE_SECRETS: list[bytes] = [
    # A highly structured value: sixteen identical bytes.
    b"aaaaaaaaaaaaaaaa",
    # An unstructured value: the first 16 bytes of a SHA-256 digest.
    digest(b"Hello world")[:16],
 ]
 # 128 KiB, expressed in bytes.  The object sizes below are chosen relative to
 # this value so that they land on and around segment boundaries.
 SEGMENT_SIZE: int = 128 * 1024
 # Exercise at least a handful of different sizes, trying to cover:
 #
 #  1. Some cases smaller than one "segment" (128k).
 #     This covers shrinking of some parameters to match data size.
 #     This includes one case of the smallest possible CHK.
 #
 #  2. Some cases right on the edges of integer segment multiples.
 #     Because boundaries are tricky.
 #
 #  3. Some cases that involve quite a few segments.
 #     This exercises merkle tree construction more thoroughly.
 #
 # See ``stretch`` for construction of the actual test data.
 #
 # NOTE(review): each entry looks like ``Sample(seed, length)`` -- a short
 # seed plus the size in bytes it is expanded to.  Confirm against the
 # definition of ``Sample``.
 OBJECT_DESCRIPTIONS: list[Sample] = [
    # The smallest possible.  55 bytes and smaller are LIT.
    Sample(b"a", 56),
    # Two more sizes well below a single segment.
    Sample(b"a", 1024),
    Sample(b"c", 4096),
    # One byte short of, and one byte past, exactly one segment.
    Sample(digest(b"foo"), SEGMENT_SIZE - 1),
    Sample(digest(b"bar"), SEGMENT_SIZE + 1),
    # One byte either side of the 16-segment boundary.
    Sample(digest(b"baz"), SEGMENT_SIZE * 16 - 1),
    Sample(digest(b"quux"), SEGMENT_SIZE * 16 + 1),
    # One byte either side of the 64-segment boundary.
    Sample(digest(b"foobar"), SEGMENT_SIZE * 64 - 1),
    Sample(digest(b"barbaz"), SEGMENT_SIZE * 64 + 1),
 ]
 # Input parameters to ZFEC.
 # NOTE(review): the two positional arguments are presumably
 # ``(required, total)`` share counts -- confirm against the definition of
 # ``SeedParam``.
 ZFEC_PARAMS: list[SeedParam] = [
    SeedParam(1, 1),
    SeedParam(1, 3),
    SeedParam(2, 3),
    SeedParam(3, 10),
    SeedParam(71, 255),
    # Uses the package-level ``MAX_SHARES`` constant as the second value.
    SeedParam(101, MAX_SHARES),
 ]
 # Encoding/encryption formats: one CHK entry and two SSK entries, the latter
 # distinguished by name ("sdmf" and "mdmf").
 FORMATS: list[CHK | SSK] = [
    CHK(),
    # These start out unaware of a key but various keys will be supplied
    # during generation.
    SSK(name="sdmf", key=None),
    SSK(name="mdmf", key=None),
 ]