research/waku_scalability/waku_scaling.py

# !!! THIS IS WIP (analyze the code structure at your own risk ^.^')
# the scope of this is still undefined; we want to avoid premature generalization
# - todo: separate the part on latency
# based on ../whisper_scalability/whisper.py

import matplotlib.pyplot as plt
import numpy as np
import math
from pathlib import Path

import sys
import json, ast, csv
import typer
import logging as log

from scipy.stats import truncnorm
from enum import Enum, EnumMeta


# we currently support the following two network types
class networkType(Enum):
    NEWMANWATTSSTROGATZ = "newmanwattsstrogatz"  # mesh, small-world
    REGULAR = "regular"  # d-regular


#JSON/YAML keys: for consistency and avoid stupid bugs
class Keys:
    GENNET  =   "gennet"
    GENLOAD =   "wls"
    JSON    =   "json"
    YAML    =   "yaml"
    BATCH   =   "batch"
    RUNS    =   "runs"
    EXPLORE =   "explore"
    PER_NODE =  "per_node"
    BMARK   =   "benchmark"
    OPREFIX =   "out"
    STATUS  =   "status"
    MSGS    =   "messages"
    MBPHR   =   "MBphr"
    SECS    =   "Secs"
    CASES   =   "cases"
#    SIZE    =   "size"


class caseType(Enum):
    CASE1 = "case1"
    CASE2 = "case2"
    CASE2POINT1 = "case2point1"
    CASE3 = "case3"
    CASE4 = "case4"
    CASE5 = "case5"
    SHARDINGCASE1 =  "sharding_case1"
    SHARDINGCASE2 = "sharding_case2"
    SHARDINGCASE3  =       "sharding_case3"

# WakuConfig holds the data for the individual runs. Every analysis instance is a Config instance
class WakuConfig:
    # We need 12 params to fully instantiate Libp2pConfig. Set the defaults for the missing
    def __init__(self,
            num_nodes=4, fanout=6,
            network_type=networkType.REGULAR.value,
            messages={"topic1":{"size":0.002,"msgpsec":0.001389}},
            #_size=0.002, msgpsec=0.00139,
            per_hop_delay=0.001,
            gossip_msg_size=0.002, gossip_window_size=3, gossip2reply_ratio=0.01,
            nodes_per_shard=10000, shards_per_node=3):
        # set the current Config values
        self.num_nodes = num_nodes                      # number of wakunodes
        self.fanout = fanout                            # generative fanout
        self.network_type = network_type                # regular, small world etc

        '''
        self.msg_size = msg_size                        # avg message size in MBytes
        self.msgpsec = msgpsec                          # avg # of messages per user per sec
        '''
        self.messages = messages

        self.per_hop_delay = per_hop_delay              # per-hop delay = 0.01 sec
        self.gossip_msg_size = gossip_msg_size          # avg gossip msg size in MBytes
        self.gossip_window_size = gossip_window_size    # max gossip history window size
        self.gossip2reply_ratio = gossip2reply_ratio    # fraction of replies/hits to a gossip msg
        self.nodes_per_shard = nodes_per_shard          # max number of nodes per shard
        self.shards_per_node = shards_per_node          # avg number of shards a node is part of

        # secondary parameters, derived from primary
        msg_size_sum, self.peruser_message_load, self.total_msgphr = 0, 0, 0
        for k, v in self.messages.items():
            m = self.messages[k]
            m["msgphr"] = m["msgpsec"]*60*60
            msg_size_sum += m["size"]
            self.peruser_message_load += m["msgphr"]*m["size"]
            self.total_msgphr += m["msgphr"]
        self.avg_msg_size = msg_size_sum / len(self.messages)

        '''
        self.msgphr = msgpsec*60*60                     # msgs per hour from msgpsec
        '''
        self.d = 1.5 * self.fanout if network_type == networkType.NEWMANWATTSSTROGATZ.value else self.fanout
        self.d_lazy = self.d - 6  if self.d > 6 else 0 # avg degree for gossip
        if self.d > 6:
            self.d = 6
        self.base_assumptions = ["a1", "a2", "a3", "a4"]
        # Assumption strings (general/topology)
        self.Assumptions = {
           # "a1"  :  "- A01. Message size (static): " + self.pretty_print.sizeof_fmt_kb(self.msg_size),
            "a1"  :  "- A01. Message size (static): " +  str(self.avg_msg_size),
            #"a2"  : "- A02. Messages sent per node per hour (static) (assuming no spam; but also no rate limiting.): " + str(self.msgphr),
            "a2"  : "- A02. Messages sent per node per hour (static) (assuming no spam; but also no rate limiting.): " +  str(self.total_msgphr),
            "a3"  : "- A03. The network topology is a d-regular graph of degree (static): " + str(int(self.d)),
            "a4"  : "- A04. Messages outside of Waku Relay are not considered, e.g. store messages.",
            "a5"  : "- A05. Messages are only sent once along an edge. (requires delays before sending)",
            "a6"  : "- A06. Messages are sent to all d-1 neighbours as soon as receiving a message (current operation)", # Thanks @Mmenduist
            "a7"  : "- A07. Single shard (i.e. single pubsub mesh)",
            "a8"  : "- A08. Multiple shards; mapping of content topic (multicast group) to shard is 1 to 1",
            "a9"  : "- A09. Max number of nodes per shard (static) " + str(self.nodes_per_shard),
            "a10" : "- A10. Number of shards a given node is part of (static) " + str(self.shards_per_node),
            "a11" : "- A11. Number of nodes in the network is variable.\n\
                    These nodes are distributed evenly over " + str(self.shards_per_node) + " shards.\n\
                    Once all of these shards have " + str(self.nodes_per_shard) + " nodes, new shards are spawned.\n\
                    These new shards have no influcene on this model, because the nodes we look at are not part of these new shards.",
            "a12" : "- A12. Including 1:1 chat. Messages sent to a given user are sent into a 1:1 shard associated with that user's node.\n\
                    Effectively, 1:1 chat adds a receive load corresponding to one additional shard a given node has to be part of.",
            #"a13" : "- A13. 1:1 chat messages sent per node per hour (static): " + str(self.msgphr), # could introduce a separate variable here
            "a13" : "- A13. 1:1 chat messages sent per node per hour (static): " + str(self.messages), # could introduce a separate variable here
            "a14" : "- A14. 1:1 chat shards are filled one by one (not evenly distributed over the shards).\n\
                    This acts as an upper bound and overestimates the 1:1 load for lower node counts.",
            "a15" : "- A15. Naive light node. Requests all messages in shards that have (large) 1:1 mapped multicast groups the light node is interested in.",

            # Assumption strings (store)
            "a21" : "- A21. Store nodes do not store duplicate messages.",

            # Assumption strings (gossip)
            "a31" : "- A21. Gossip is not considered.",
            "a32" : "- A32. Gossip message size (IHAVE/IWANT) (static):" + str(self.gossip_msg_size),
            "a33" : "- A33. Ratio of IHAVEs followed-up by an IWANT (incl. the actual requested message):" + str(self.gossip2reply_ratio),

            # Assumption strings (delay)
            "a41" : "- A41. Delay is calculated based on an upper bound of the expected distance.",
            "a42" : "- A42. Average delay per hop (static): " + str(self.per_hop_delay) + "s."
        }
        self.load = -1
        self.latency = -1
        self.case = ""
        #self.display_config()

    # display the Config
    def display_config(self):
        print(f'WakuConfig(Config = {self.num_nodes}, {self.fanout},  {self.d}, '
              f'{self.d_lazy}, {self.network_type}, messages={str(self.messages)}, '
              f'{self.gossip_msg_size} MBytes, {self.gossip_window_size}, '
              f' {self.gossip2reply_ratio}, {self.nodes_per_shard}, {self.shards_per_node}, '
              f' {self.per_hop_delay} secs), {self.case}, {self.latency} secs, {self.load} MBytes')
        """
        print(f'Config = {self.num_nodes}, {self.fanout} -> {(self.d, self.d_lazy)}, {self.network_type}, '
              #f'{self.msg_size}MBytes, {self.msgpsec}/sec({self.msgphr}/hr), '
              f'messages={str(self.messages)}, '
              f'{self.gossip_msg_size}MBytes, {self.gossip_window_size}, {self.gossip2reply_ratio}, '
              f'{self.nodes_per_shard}, {self.shards_per_node}, {self.per_hop_delay}secs, '
              f'{self.case}, {self.latency}, {self.load}')
        """


    # Print assumptions : with a base set
    def print_assumptions1(self, xs):
        print("Assumptions/Simplifications:")
        alist = self.base_assumptions + xs
        for a in alist:
            if a in self.Assumptions:
                print(self.Assumptions[a])
            else:
                log.error(f'Unknown assumption: ' + a)
                sys.exit(0)
        print("")


    # Print assumptions: all
    def print_assumptions(self, xs):
        print("Assumptions/Simplifications:")
        for a in xs:
            if a in self.Assumptions:
                print(self.Assumptions[a])
            else:
                log.error(f'Unknown assumption: ' + a)
                sys.exit(0)
        print("")

    def __repr__(self):
        return (f'WakuConfig(Config = {self.num_nodes}, {self.fanout},  {self.d}, '
              f'{self.d_lazy}, {self.network_type}, messages={str(self.messages)}, '
              f'{self.gossip_msg_size} MBytes, {self.gossip_window_size}, '
              f' {self.gossip2reply_ratio}, {self.nodes_per_shard}, {self.shards_per_node}, '
              f' {self.per_hop_delay} secs), {self.case}, {self.latency} secs, {self.load} MBytes')
              #f'{self.msg_size}MBytes, {self.msgpsec}/sec({self.msgphr}/hr), '

    def __iter__(self):
        return iter([self.num_nodes, self.fanout, self.d, self.d_lazy, self.network_type,
                        str(self.messages), self.gossip_msg_size, self.gossip_window_size,
                        self.gossip2reply_ratio, self.nodes_per_shard, self.shards_per_node,
                        self.per_hop_delay, self.case, self.load, self.latency])


def num_edges(config, network_type, fanout):
    # we assume and even d; d-regular graphs with both where both n and d are odd don't exist
    num_edges = config.num_nodes * config.fanout/2
    if config.network_type == networkType.REGULAR.value:
        return num_edges
    elif config.network_type == networkType.NEWMANWATTSSTROGATZ.value:
        # NEWMANWATTSSTROGATZ starts as a regular graph
        #   0. rewire random edged
        #   1. add additional ~ \beta * num_nodes*degree/2 edges to shorten the paths
        #       # \beta used = 0.5
        # this is a relatively tight estimate
        return num_edges + 0.5 * config.num_nodes * config.fanout/2
    else:
        log.error(f'num_edges: Unknown network type {config.network_type}')
        sys.exit(0)


def avg_node_distance_upper_bound(config):
    if config.network_type == networkType.REGULAR.value:
        return math.log(config.num_nodes, config.fanout)
    elif config.network_type == networkType.NEWMANWATTSSTROGATZ.value:
        # NEWMANWATTSSTROGATZ is small world and random
        # a tighter estimate
        return 2*math.log(config.num_nodes/config.fanout, config.fanout)
    else:
        log.error(f'avg_node_distance: Unknown network type {config.network_type}')
        sys.exit(0)

def load_case1(config, n_users):
    return config.peruser_message_load * n_users

# Case 2 :: single shard, (n*d)/2 messages
def load_case2(config, n_users):
    return config.peruser_message_load * num_edges(config, config.network_type, config.fanout)

def load_case2point1(config, n_users):
    return config.peruser_message_load * n_users\
                * num_edges(config, config.network_type, config.fanout)

def load_case3(config, n_users):
    return config.peruser_message_load * n_users * (config.d-1)

# Case 4:single shard n*(d-1) messages, gossip
def load_case4(config, n_users):
    num_msgsphour =  config.total_msgphr * n_users * (config.d-1) # see case 3
    #messages_load =  self.msg_size * num_msgsphour
    messages_load =  config.peruser_message_load * n_users * (config.d-1)
    num_ihave = num_msgsphour * config.d_lazy * config.gossip_window_size
    ihave_load  = num_ihave * config.gossip_msg_size
    gossip_response_load  = (num_ihave * (config.gossip_msg_size + config.avg_msg_size)) * config.gossip2reply_ratio  # reply load contains both an IWANT (from requester to sender), and the actual wanted message (from sender to requester)
    gossip_total = ihave_load + gossip_response_load
    #print(f"bandwidth {(messages_load,  gossip_total,self.d, self.d_lazy)} = {messages_load + gossip_total}")
    return messages_load + gossip_total

def load_case5(config, n_users):
    nedges = num_edges(config, config.network_type, config.fanout)
    nedges_regular = num_edges(config, networkType.REGULAR.value, 6)
    edge_diff = nedges - nedges_regular

    eager_fraction = 1 if config.d_lazy <= 0 or edge_diff <= 0 else nedges_regular / nedges
    lazy_fraction = 1 - eager_fraction

    eager_edges, lazy_edges = nedges * eager_fraction , nedges * lazy_fraction

    #print(f"{(nedges, nedges_regular)} = {eager_fraction, lazy_fraction} {self.gossip2reply_ratio}")
    total_load =  eager_edges * n_users * config.peruser_message_load \
                      + lazy_edges * 60 * config.gossip_window_size \
                            * (config.gossip_msg_size + config.gossip2reply_ratio * config.avg_msg_size)
        #print(f"{n_users} users = {total_load}, {eager_edges * self.msgphr * n_users * self.msg_size}")
    return total_load


def load_sharding_case1(config, n_users):
    load_per_node_per_shard = load_case4(config, np.minimum(n_users/3, config.nodes_per_shard))
    return config.shards_per_node * load_per_node_per_shard

def load_sharding_case2(config, n_users):
    load_per_node_per_shard = load_case4(config, np.minimum(n_users/3, config.nodes_per_shard))
    load_per_node_1to1_shard = load_case4(config, np.minimum(n_users, config.nodes_per_shard))
    return (config.shards_per_node * load_per_node_per_shard) + load_per_node_1to1_shard

def load_sharding_case3(config, n_users):
    load_per_node_per_shard = load_case1(config, np.minimum(n_users/3, config.nodes_per_shard))
    return config.shards_per_node * load_per_node_per_shard


def latency_case1(config, n_users, degree):
    return avg_node_distance_upper_bound(config) * config.per_hop_delay

# WakuAnalysis performs the runs. It creates a Config object and runs the analysis on it
class WakuAnalysis(WakuConfig):
    # accept variable number of parameters with missing values set to defaults
    def __init__(self, **kwargs):
        WakuConfig.__init__(self, **kwargs)
         # add  unit (mbps, sec etc), [good, bad, ugly]
        self.cases = {
                caseType.CASE1     :   (load_case1,        ["a7", "a21"], Keys.MBPHR),
                caseType.CASE2     :   (load_case2,        ["a5", "a7", "a31"], Keys.MBPHR),
                caseType.CASE2POINT1   :   (load_case2point1,  ["a5", "a7", "a31"], Keys.MBPHR),
                caseType.CASE3     :   (load_case3,        ["a6", "a7", "a31"], Keys.MBPHR),
                caseType.CASE4     :   (load_case4,        ["a6", "a7", "a32", "a33"], Keys.MBPHR),
                caseType.CASE5     :   (load_case5,        ["a6", "a7", "a32", "a33"], Keys.MBPHR),

                caseType.SHARDINGCASE1 : (load_sharding_case1, ["a6", "a8", "a9", "a10", "a11", "a32", "a33"], Keys.MBPHR),
                caseType.SHARDINGCASE2 : (load_sharding_case2, ["a6", "a8", "a9", "a10", "a11", "a12", "a13", "a14", "a32", "a33"], Keys.MBPHR),
                caseType.SHARDINGCASE3 : (load_sharding_case3, ["a6", "a8", "a9", "a10", "a15", "a32", "a33"]),

#                "latency_case1" : (latency_case1,   ["a3", "a41", "a42"], Keys.SECS)
                }

    def conditional_display(self, num_nodes, output, writer):
        if output:
            tmp = self.num_nodes
            self.num_nodes = num_nodes
            self.display_config()
            self.num_nodes = tmp
            writer.writerow(self)

    def print_load(self, num_nodes, case, writer, output=True):
        self.load = self.cases[caseType(case)][0](self, num_nodes)
        self.conditional_display(num_nodes, output, writer)

    def print_latency(self, num_nodes, average_node_degree, writer, output=False):
        self.latency = latency_case1(self, num_nodes, average_node_degree)
        self.conditional_display(num_nodes, output, writer)

    def compute_latency(self, average_node_degree, explore, writer):
        if explore:
            self.print_latency(100, average_node_degree, writer)
            self.print_latency(1000, average_node_degree, writer)
            self.print_latency(1000 * 10, average_node_degree, writer)
        else:
            self.print_latency(self.num_nodes, average_node_degree, writer)

    def compute_load(self, case, explore, writer):
        if explore :
            for case in self.cases:
                self.print_load(100, case, writer)
                self.print_load(1000, case, writer)
                self.print_load(1000 * 10, case, writer)
        else:
            self.print_load(self.num_nodes, case, writer)

    def run(self, writer, explore=False, cases=[caseType.CASE2POINT1.value]):
        for case in cases:
            self.case = case
            self.compute_latency(self.fanout, explore, writer)
            self.compute_load(case, explore, writer)

    def plot_load(self):
        plt.clf() # clear current plot

        n_users = np.logspace(2, 6, num=5)
        print(n_users)

        plt.xlim(100, 10**4)
        plt.ylim(1, 10**4)

        plt.plot(n_users, load_case1(n_users), label='case 1', linewidth=4, linestyle='dashed')
        plt.plot(n_users, load_case2(n_users), label='case 2', linewidth=4, linestyle='dashed')
        plt.plot(n_users, load_case3(n_users), label='case 3', linewidth=4, linestyle='dashed')
        plt.plot(n_users, load_case4(n_users), label='case 4', linewidth=4, linestyle='dashed')

        case1 = "Case 1. top: 6-regular;  store load (also: naive light node)"
        case2 = "Case 2. top: 6-regular;  receive load per node, send delay to reduce duplicates"
        case3 = "Case 3. top: 6-regular;  receive load per node, current operation"
        case4 = "Case 4. top: 6-regular;  receive load per node, current operation, incl. gossip"

        plt.xlabel('number of users (log)')
        plt.ylabel('mb/hour (log)')
        plt.legend([case1, case2, case3, case4], loc='upper left')
        plt.xscale('log')
        plt.yscale('log')

        plt.axhspan(0, 10, facecolor='0.2', alpha=0.2, color='blue')
        plt.axhspan(10, 100, facecolor='0.2', alpha=0.2, color='green')
        plt.axhspan(100, 3000, facecolor='0.2', alpha=0.2, color='orange') # desktop nodes can handle this; load comparable to streaming (but both upload and download, and with spikes)
        plt.axhspan(3000, 10**6, facecolor='0.2', alpha=0.2, color='red')

        caption = "Plot 1: single shard."
        plt.figtext(0.5, 0.01, caption, wrap=True, horizontalalignment='center', fontsize=12)

        plt.show()

        figure = plt.gcf() # get current figure
        figure.set_size_inches(16, 9)
        # plt.savefig("waku_scaling_plot.svg")
        #plt.savefig("waku_scaling_single_shard_plot.png", dpi=300, orientation="landscape")

    def plot_load_sharding(self):
        plt.clf() # clear current plot

        n_users = np.logspace(2, 6, num=5)
        print(n_users)

        plt.xlim(100, 10**6)
        plt.ylim(1, 10**5)

        plt.plot(n_users, load_case1(n_users), label='sharding store', linewidth=4, linestyle='dashed') # same as without shardinig, has to store *all* messages
        plt.plot(n_users, load_sharding_case1(n_users), label='case 1', linewidth=4, linestyle='dashed')
        plt.plot(n_users, load_sharding_case2(n_users), label='case 2', linewidth=4, linestyle='dashed')
        plt.plot(n_users, load_sharding_case3(n_users), label='case 3', linewidth=4, linestyle='dashed')

        case_store = "Sharding store load; participate in all shards; top: 6-regular"
        case1 = "Sharding case 1. sharding: top: 6-regular;  receive load per node, incl gossip"
        case2 = "Sharding case 2. sharding: top: 6-regular;  receive load per node, incl gossip and 1:1 chat"
        case3 = "Sharding case 3. sharding: top: 6-regular;  regular load for naive light node"

        plt.xlabel('number of users (log)')
        plt.ylabel('mb/hour (log)')
        plt.legend([case_store, case1, case2, case3], loc='upper left')
        plt.xscale('log')
        plt.yscale('log')

        plt.axhspan(0, 10, facecolor='0.2', alpha=0.2, color='blue')
        plt.axhspan(10, 100, facecolor='0.2', alpha=0.2, color='green')
        plt.axhspan(100, 3000, facecolor='0.2', alpha=0.2, color='orange') # desktop nodes can handle this; load comparable to streaming (but both upload and download, and with spikes)
        plt.axhspan(3000, 10**6, facecolor='0.2', alpha=0.2, color='red')

        caption = "Plot 2: multi shard."
        plt.figtext(0.5, 0.01, caption, wrap=True, horizontalalignment='center', fontsize=12)

        plt.show()

        figure = plt.gcf() # get current figure
        figure.set_size_inches(16, 9)
        # plt.savefig("waku_scaling_plot.svg")
        #plt.savefig("waku_scaling_multi_shard_plot.png", dpi=300, orientation="landscape")

    def plot(self):
        self.plot_load()
        self.plot_load_sharding()


def _sanity_check(fname, keys, ftype=Keys.JSON):
    if not fname.exists():
        log.error(f'The file "{fname}" does not exist')
        sys.exit(0)
    try:
        with open(fname, 'r') as f:     # Load config file
            if ftype == Keys.JSON:      # Both batch and kurtosis use json
                json_conf = json.load(f)
                for key in keys:
                    if key not in json_conf:
                        log.error(f'The json  key "{key}" not found in {fname}')
                        sys.exit(0)
                return json_conf
            elif ftype == "yaml":   # Shadow uses yaml
                log.error(f'YAML is not yet supported : {fname}')
                sys.exit(0)
                #yaml_conf = json.load(f)
                #return yaml_conf
    except Exception as ex:
        raise typer.BadParameter(str(ex))
    log.debug(f'Sanity check: All Ok')

app = typer.Typer()

@app.command()
def wakurtosis(ctx: typer.Context, config_file: Path,
                explore : bool = typer.Option(True,
                    help="Explore or not to explore")):
    wakurtosis_json = _sanity_check(config_file, [Keys.GENNET, Keys.GENLOAD], Keys.JSON)

    num_nodes = wakurtosis_json["gennet"]["num_nodes"]
    fanout = wakurtosis_json["gennet"]["fanout"]
    network_type = wakurtosis_json["gennet"]["network_type"]
    msg_size = 1.5 * (wakurtosis_json["wls"]["min_packet_size"] +
                                wakurtosis_json["wls"]["max_packet_size"])/(2*1024*1024)
    #msg_size = truncnorm.mean(wakurtosis_json["wls"]["min_packet_size"],
    #                            wakurtosis_json["wls"]["max_packet_size"])/(1024*1024)
    msgpsec = wakurtosis_json["wls"]["message_rate"]/wakurtosis_json["gennet"]["num_nodes"]

    messages = {}
    messages["topic1"] = {"size" : msg_size, "msgpsec" : msgpsec}
    analysis = WakuAnalysis(**{ "num_nodes" : num_nodes,
                            "fanout" : fanout,
                            "messages" : messages,
                            "network_type" : network_type,
                            "per_hop_delay" : 0.1 # TODO: pick from wakurtosis
                            })

    analysis.run(explore=explore, case="case2point1")
    print(f'kurtosis: done')

@app.command()
def batch(ctx: typer.Context,
        batch_file: Path,
        output_csv : Path = typer.Option("batch-output.csv",
        help="Set the output CSV file")):
    batch_json = _sanity_check(batch_file, [ Keys.BATCH ], Keys.JSON)
    explore  = batch_json[Keys.BATCH][Keys.EXPLORE]
    per_node = batch_json[Keys.BATCH][Keys.PER_NODE]
    runs = batch_json[Keys.BATCH][Keys.RUNS]
    cases = batch_json[Keys.BATCH][Keys.CASES]

    with open(output_csv, "w") as stream:
        writer = csv.writer(stream)
        for r in runs:
            run = runs[r]
            run["per_hop_delay"] = 0.010
            if not per_node:
                for topic, msg in run[Keys.MSGS].items():
                    run[Keys.MSGS][topic]["msgpsec"] = \
                            run[Keys.MSGS][topic]["msgpsec"] / run["num_nodes"]
            analysis = WakuAnalysis(**run)
            analysis.run(cases=cases, explore=explore, writer=writer)
    print(f'batch: done')

@app.command()
def shadow(ctx: typer.Context, config_file: Path):
    yaml = _sanity_check(config_file, [], Keys.YAML)
    print("shadow: done {yaml}")

@app.command()
def cli(ctx: typer.Context,
         num_nodes: int = typer.Option(4,
             help="Set the number of nodes"),
         fanout: float = typer.Option(6.0,
             help="Set the arity"),
         network_type: networkType = typer.Option(networkType.REGULAR.value,
             help="Set the network type"),
         messages: str = typer.Argument("{\"topic1\":{\"size\":0.002,\"msgpsec\":0.001389}}",
             callback=ast.literal_eval, help="Topics traffic spec"),
         case: caseType = typer.Option(caseType.CASE2POINT1.value,
             help="Set the case type"),
         gossip_msg_size: float = typer.Option(0.00005,
             help="Set gossip message size in MBytes"),
         gossip_window_size: int = typer.Option(3,
             help="Set gossip history window size"),
         gossip2reply_ratio: float = typer.Option(0.01,
             help="Set the Gossip to reply ratio"),
         nodes_per_shard: int = typer.Option(10000,
             help="Set the number of nodes per shard/topic"),
         shards_per_node: int = typer.Option(3,
             help="Set the number of shards a node is part of"),
         per_hop_delay: float = typer.Option(0.1,
             help="Set the delay per hop"),
         explore : bool = typer.Option(True,
             help="Explore or not to explore")):

    analysis = WakuAnalysis(**{ "num_nodes" : num_nodes,
                            "fanout" : fanout,
                            "network_type" : network_type.value,
                            "messages" : messages,
                            #"msgs" : f'{\"msg1\" : { \"msg_size\" : {msg_size}
                            #"msg_size" : msg_size,
                            #"msgpsec" : msgphr/(60*60),
                            "per_hop_delay" : 0.1, # TODO: pick from cli
                            "gossip_msg_size" : gossip_msg_size,
                            "gossip_window_size":gossip_window_size,
                            "gossip2reply_ratio":gossip2reply_ratio,
                            "nodes_per_shard":nodes_per_shard,
                            "shards_per_node":shards_per_node})
    analysis.run(explore=explore)
    print("cli: done")


@app.command()
def status(ctx: typer.Context,
            status_config: Path,
            output_csv : Path = typer.Option("status-output.csv",
             help="Set the output CSV file")):
    status_json = _sanity_check(status_config, [ Keys.STATUS ], Keys.JSON)
    sjson = status_json[Keys.STATUS]
    cases = status_json[Keys.STATUS][Keys.CASES]
    explore, per_node, run  = sjson[Keys.EXPLORE], sjson[Keys.PER_NODE], {}

    # override the defaults if set
    keys =  ["network_type", "per_hop_delay",  "gossip_msg_size", "gossip_window_size", "gossip2reply_ratio", "nodes_per_shard", "shards_per_node"]
    run = {k: sjson[k] for k in keys}

    # set the mandatory fields
    run["num_nodes"]  = sjson["num_nodes"]
    run["fanout"] = sjson["fanout"]

    # extract the control message size and frequency
    run["messages"] = {}
    for topic, msg in status_json[Keys.STATUS][Keys.MSGS].items():
        run["messages"][topic] = {}
        run["messages"][topic]["size"] = \
                                    sjson["communities"]["comm1"]["size"] * msg["varsize"] + \
                                    msg["fixedsize"]
        run["messages"][topic]["msgpsec"] = msg["msgpsec"]
    with open(output_csv, "w") as stream:
        writer = csv.writer(stream)
        analysis = WakuAnalysis(**run)
        analysis.run(cases=cases, explore=explore, writer=writer)
    print(f'status: done')


if __name__ == "__main__":
    app()

"""
# general / topology
average_node_degree = 6  # has to be even
message_size = 0.002 # in MB (Mega Bytes)
self.msgphr = 5 # on a a single pubsub topic / shard / per node

# gossip
self.gossip_msg_size = 0.00005 # 50Bytes in MB (see https://github.com/libp2p/specs/pull/413#discussion_r1018821589 )
d_lazy = 6 # gossip out degree
mcache_gossip = 3 # Number of history windows to use when emitting gossip (see https://github.com/libp2p/specs/blob/master/pubsub/gossipsub/gossipsub-v1.0.md)
avg_ratio_gossip_replys = 0.01 # -> this is a wild guess! (todo: investigate)

# multi shard
avg_nodes_per_shard = 10000 # average number of nodes that a part of a single shard
avg_shards_per_node = 3    # average number of shards a given node is part of

# latency
average_delay_per_hop = 0.1 #s
"""