# 94 lines
# 3.1 KiB
# Python

import random
from itertools import islice
from typing import List, cast
from pydantic import Field
from pydantic_core import Url
from urllib3.util import parse_url
from benchmarks.codex.agent.codex_agent_client import CodexAgentClient
from benchmarks.codex.client.common import Cid
from benchmarks.codex.codex_node import CodexMeta, CodexNode
from benchmarks.core.experiments.experiments import (
ExperimentBuilder,
ExperimentEnvironment,
ExperimentComponent,
)
from benchmarks.core.experiments.iterated_experiment import IteratedExperiment
from benchmarks.core.experiments.static_experiment import StaticDisseminationExperiment
from benchmarks.core.pydantic import SnakeCaseModel, Host
from benchmarks.core.utils.random import sample
class CodexNodeConfig(SnakeCaseModel):
    """Static description of one Codex node taking part in an experiment."""

    # Label for the node; not read anywhere in this module.
    name: str
    # Host part of the node's API URL (combined with ``api_port`` when building).
    address: Host
    # NOTE(review): presumably the node's discovery port; not read in this module -- confirm.
    disc_port: int
    # Port part of the node's API URL (``http://<address>:<api_port>``).
    api_port: int
    # URL handed to ``CodexAgentClient`` to reach the agent paired with this node.
    agent_url: Url
# Type alias: an iterated experiment whose individual runs are static
# dissemination experiments parameterized by ``Cid`` and ``CodexMeta``.
CodexDisseminationExperiment = IteratedExperiment[
StaticDisseminationExperiment[Cid, CodexMeta]
]
class CodexExperimentConfig(ExperimentBuilder[CodexDisseminationExperiment]):
    """Declarative configuration for a set of Codex static dissemination experiments.

    The configuration lists the participating nodes and the experiment
    parameters; :meth:`build` turns it into a runnable
    ``IteratedExperiment`` with ``seeder_sets * repetitions`` runs.
    """

    experiment_set_id: str = Field(
        description="Identifies the group of experiment repetitions", default="unnamed"
    )
    seeder_sets: int = Field(
        gt=0, default=1, description="Number of distinct seeder sets to experiment with"
    )
    seeders: int = Field(gt=0, description="Number of seeders per seeder set")
    file_size: int = Field(gt=0, description="File size, in bytes")
    repetitions: int = Field(
        gt=0, description="How many experiment repetitions to run for each seeder set"
    )
    # ``ge=0`` (not ``gt=0``): the default of 0 must itself satisfy the
    # constraint, otherwise an explicit 0 or a dump/validate round-trip of a
    # default-constructed config is rejected.
    logging_cooldown: int = Field(
        ge=0,
        default=0,
        description="Time to wait after the last download completes before tearing down the experiment.",
    )
    nodes: List[CodexNodeConfig]

    def build(self) -> CodexDisseminationExperiment:
        """Create the iterated dissemination experiment described by this config.

        One ``CodexAgentClient`` and one ``CodexNode`` are created per entry
        in ``nodes``; all of them are registered as components of a shared
        ``ExperimentEnvironment``. Individual runs are produced lazily by a
        generator, so nothing beyond client/node construction happens here.

        Returns:
            An ``IteratedExperiment`` tagged with ``experiment_set_id`` that
            yields ``seeder_sets * repetitions`` environment-bound
            ``StaticDisseminationExperiment`` instances.
        """
        agents = [
            CodexAgentClient(parse_url(str(node.agent_url))) for node in self.nodes
        ]
        # Agents are built in node order, so zipping pairs each node with its own agent.
        network = [
            CodexNode(
                codex_api_url=parse_url(f"http://{str(node.address)}:{node.api_port}"),
                agent=agent,
            )
            for node, agent in zip(self.nodes, agents)
        ]

        env = ExperimentEnvironment(
            components=cast(List[ExperimentComponent], network + agents),
            ping_max=10,
            polling_interval=0.5,
        )

        # Named differently from the ``repetitions`` field to avoid confusion.
        def experiment_runs():
            for seeder_set in range(self.seeder_sets):
                # Seeders are drawn once per seeder set and reused for all of
                # its repetitions.
                # NOTE(review): ``seeders`` is not checked against the number
                # of nodes; if ``sample`` is exhausted early, fewer seeders
                # than requested are used -- confirm against ``sample``.
                seeders = list(islice(sample(len(network)), self.seeders))
                for experiment_run in range(self.repetitions):
                    yield env.bind(
                        StaticDisseminationExperiment(
                            network=network,
                            seeders=seeders,
                            file_size=self.file_size,
                            # A fresh random seed for every run.
                            seed=random.randint(0, 2**16),
                            meta=CodexMeta(f"dataset-{seeder_set}-{experiment_run}"),
                            logging_cooldown=self.logging_cooldown,
                        )
                    )

        return IteratedExperiment(
            experiment_runs(), experiment_set_id=self.experiment_set_id
        )