mirror of
https://github.com/vacp2p/research.git
synced 2026-01-07 21:03:52 -05:00
refactor: waku_scaling
- Put each case in its own class in cases.py - Separate utility functions into utils.py - Separate assumptions into assumptions.py
This commit is contained in:
66
waku_scalability/assumptions.py
Normal file
66
waku_scalability/assumptions.py
Normal file
@@ -0,0 +1,66 @@
|
||||
# Assumptions
# -----------------------------------------------------------

# Users send messages at a constant rate.
# The network topology is a d-regular graph (gossipsub aims at achieving this).

from utils import sizeof_fmt_kb


# general / topology
average_node_degree = 6  # has to be even
message_size = 0.002  # in MB (Mega Bytes)
messages_sent_per_hour = 5  # on a single pubsub topic / shard

# gossip
gossip_message_size = (
    0.00005  # 50 Bytes in MB (see https://github.com/libp2p/specs/pull/413#discussion_r1018821589 )
)
d_lazy = 6  # gossip out degree
mcache_gossip = 3  # Number of history windows to use when emitting gossip (see https://github.com/libp2p/specs/blob/master/pubsub/gossipsub/gossipsub-v1.0.md)
avg_ratio_gossip_replys = 0.01  # -> this is a wild guess! (todo: investigate)

# multi shard
avg_nodes_per_shard = 10000  # average number of nodes that are part of a single shard
avg_shards_per_node = 3  # average number of shards a given node is part of

# latency
average_delay_per_hop = 0.1  # s

# TODO: load case for status control messages (note: this also introduces messages by currently online, but not active users.)
# TODO: spread in the latency distribution (the highest 10%ish of latencies might be too high)

# Assumption strings (general/topology)
a1 = "- A01. Message size (static): " + sizeof_fmt_kb(message_size)
a2 = "- A02. Messages sent per node per hour (static) (assuming no spam; but also no rate limiting.): " + str(messages_sent_per_hour)
a3 = "- A03. The network topology is a d-regular graph of degree (static): " + str(average_node_degree)
a4 = "- A04. Messages outside of Waku Relay are not considered, e.g. store messages."
a5 = "- A05. Messages are only sent once along an edge. (requires delays before sending)"
a6 = "- A06. Messages are sent to all d-1 neighbours as soon as receiving a message (current operation)"  # Thanks @Mmenduist
a7 = "- A07. Single shard (i.e. single pubsub mesh)"
a8 = "- A08. Multiple shards; mapping of content topic (multicast group) to shard is 1 to 1"
a9 = "- A09. Max number of nodes per shard (static) " + str(avg_nodes_per_shard)
a10 = "- A10. Number of shards a given node is part of (static) " + str(avg_shards_per_node)
a11 = "- A11. Number of nodes in the network is variable.\n\
These nodes are distributed evenly over " + str(avg_shards_per_node) + " shards.\n\
Once all of these shards have " + str(avg_nodes_per_shard) + " nodes, new shards are spawned.\n\
These new shards have no influence on this model, because the nodes we look at are not part of these new shards."
a12 = "- A12. Including 1:1 chat. Messages sent to a given user are sent into a 1:1 shard associated with that user's node.\n\
Effectively, 1:1 chat adds a receive load corresponding to one additional shard a given node has to be part of."
a13 = "- A13. 1:1 chat messages sent per node per hour (static): " + str(messages_sent_per_hour)  # could introduce a separate variable here
a14 = "- A14. 1:1 chat shards are filled one by one (not evenly distributed over the shards).\n\
This acts as an upper bound and overestimates the 1:1 load for lower node counts."
a15 = "- A15. Naive light node. Requests all messages in shards that have (large) 1:1 mapped multicast groups the light node is interested in."


# Assumption strings (store)
a21 = "- A21. Store nodes do not store duplicate messages."

# Assumption strings (gossip)
# Fix: a31 was mislabeled "- A21." in its display string; it is assumption A31.
a31 = "- A31. Gossip is not considered."
a32 = "- A32. Gossip message size (IHAVE/IWANT) (static):" + sizeof_fmt_kb(gossip_message_size)
a33 = "- A33. Ratio of IHAVEs followed-up by an IWANT (incl. the actual requested message):" + str(avg_ratio_gossip_replys)

# Assumption strings (delay)
a41 = "- A41. Delay is calculated based on an upper bound of the expected distance."
a42 = "- A42. Average delay per hop (static): " + str(average_delay_per_hop) + "s."
||||
333
waku_scalability/cases.py
Normal file
333
waku_scalability/cases.py
Normal file
@@ -0,0 +1,333 @@
|
||||
from abc import ABC, abstractmethod
|
||||
import io
|
||||
import math
|
||||
from typing import Any, Callable, List
|
||||
import numpy as np
|
||||
from pydantic import BaseModel, Field, PositiveInt
|
||||
|
||||
from assumptions import (
|
||||
a1,
|
||||
a2,
|
||||
a3,
|
||||
a4,
|
||||
a5,
|
||||
a6,
|
||||
a7,
|
||||
a8,
|
||||
a9,
|
||||
a10,
|
||||
a11,
|
||||
a12,
|
||||
a13,
|
||||
a14,
|
||||
a15,
|
||||
a21,
|
||||
a31,
|
||||
a32,
|
||||
a33,
|
||||
a41,
|
||||
a42,
|
||||
)
|
||||
|
||||
from assumptions import (
|
||||
message_size,
|
||||
messages_sent_per_hour,
|
||||
average_node_degree,
|
||||
d_lazy,
|
||||
mcache_gossip,
|
||||
gossip_message_size,
|
||||
avg_ratio_gossip_replys,
|
||||
avg_nodes_per_shard,
|
||||
avg_shards_per_node,
|
||||
average_delay_per_hop,
|
||||
)
|
||||
|
||||
from utils import load_color_fmt, magnitude_fmt, get_header, sizeof_fmt
|
||||
|
||||
|
||||
def get_assumptions_str(xs) -> str:
    """Return a header line followed by one line per assumption string in *xs*."""
    lines = ["Assumptions/Simplifications:"]
    lines.extend(str(x) for x in xs)
    return "\n".join(lines) + "\n"
|
||||
|
||||
|
||||
def usage_str(load_users_fn: Callable[[PositiveInt, Any], object], n_users: PositiveInt):
    """Return a color-coded one-line bandwidth summary for *n_users*.

    Fix: the original evaluated ``load_users_fn(n_users)`` twice (once for the
    color threshold, once for display); the single result is now reused.
    """
    load = load_users_fn(n_users)
    return load_color_fmt(
        load,
        "For "
        + magnitude_fmt(n_users)
        + " users, receiving bandwidth is "
        + sizeof_fmt(load)
        + "/hour",
    )
|
||||
|
||||
|
||||
def get_usages_str(load_users) -> str:
    """Render one bandwidth-usage line each for 100, 10k, and 1M users."""
    user_counts = (100, 10_000, 1_000_000)
    return "\n".join(usage_str(load_users, n) for n in user_counts)
|
||||
|
||||
|
||||
def latency_str(latency_users_fn, n_users, degree):
    """Return a color-coded one-line latency summary for *n_users* at *degree*.

    Fix: the original evaluated ``latency_users_fn(n_users, degree)`` twice;
    the single result is now reused for both the color and the display value.
    """
    latency = latency_users_fn(n_users, degree)
    return load_color_fmt(
        latency,
        "For "
        + magnitude_fmt(n_users)
        + " the average latency is "
        + ("%.3f" % latency)
        + " s",
    )
|
||||
|
||||
|
||||
def get_latency_str(latency_users):
    """Render latency lines for 100, 10k, and 1M users, ending with a newline."""
    user_counts = (100, 10_000, 1_000_000)
    lines = [
        latency_str(latency_users, n, average_node_degree) for n in user_counts
    ]
    return "\n".join(lines) + "\n"
|
||||
|
||||
|
||||
def num_edges_dregular(num_nodes, degree):
    """Number of edges in a d-regular graph: n * d / 2.

    Accepts scalars or iterables (e.g. numpy arrays). Both n and d are assumed
    even, since a d-regular graph cannot exist when n and d are both odd.
    """

    def _all_even(value):
        # Scalar ints are checked directly; anything else is treated as iterable.
        if isinstance(value, int):
            return value % 2 == 0
        return all(v % 2 == 0 for v in value)

    assert _all_even(
        num_nodes
    ), f"Broken assumption: Expected num_nodes to be even. Instead n = {num_nodes}"
    assert _all_even(
        degree
    ), f"Broken assumption: Expected degree should be even. Instead d = {degree}"

    return num_nodes * (degree / 2)
|
||||
|
||||
|
||||
def avg_node_distance_upper_bound(n_users, degree):
    """Upper bound on the expected node distance: log base *degree* of *n_users* hops."""
    return math.log(n_users, degree)
|
||||
|
||||
|
||||
# Cases Load Per Node
|
||||
# -----------------------------------------------------------
|
||||
|
||||
|
||||
class Case(ABC, BaseModel):
    """Base class for a load scenario: computes a per-node load and renders a report."""

    label: str = Field(description="String to use as label on plot.")
    legend: str = Field(description="String to use in legend of plot.")

    @abstractmethod
    def load(self, n_users, **kargs) -> object:
        """Return the modeled load for *n_users* users."""
        pass

    @property
    @abstractmethod
    def header(self) -> str:
        """Human-readable title line for this case's report."""
        pass

    @property
    @abstractmethod
    def assumptions(self) -> List[str]:
        """Assumption strings (from assumptions.py) that this case relies on."""
        pass

    @property
    def description(self) -> str:
        """Full printable report: header, assumptions, and usage lines."""
        parts = [
            "",
            get_header(self.header),
            get_assumptions_str(self.assumptions),
            get_usages_str(self.load),
            "",
            "------------------------------------------------------------",
        ]
        return "\n".join(parts)
|
||||
|
||||
|
||||
# Case 1 :: single shard, unique messages, store
class Case1(Case):
    """Store load: every unique message is stored exactly once."""

    label: str = "case 1"
    legend: str = "Case 1. top: 6-regular; store load (also: naive light node)"

    def load(self, n_users, **kwargs):
        # One copy per published message: size * rate * number of publishers.
        return message_size * messages_sent_per_hour * n_users

    @property
    def header(self) -> str:
        return "Load case 1 (store load; corresponds to received load per naive light node)"

    @property
    def assumptions(self) -> List[str]:
        return [a1, a2, a3, a4, a7, a21]
|
||||
|
||||
|
||||
# Case 2 :: single shard, (n*d)/2 messages
class Case2(Case):
    """Receive load when each message crosses every edge exactly once."""

    label: str = "case 2"
    legend: str = "Case 2. top: 6-regular; receive load per node, send delay to reduce duplicates"

    def load(self, n_users, **kwargs):
        # One transmission per edge: n*d/2 edges in a d-regular graph.
        edges = num_edges_dregular(n_users, average_node_degree)
        return message_size * messages_sent_per_hour * edges

    @property
    def header(self) -> str:
        return "Load case 2 (received load per node)"

    @property
    def assumptions(self):
        return [a1, a2, a3, a4, a5, a7, a31]
|
||||
|
||||
|
||||
# Case 3 :: single shard n*(d-1) messages
class Case3(Case):
    """Receive load under current operation: forward to all d-1 other neighbours."""

    label: str = "case 3"
    legend: str = "Case 3. top: 6-regular; receive load per node, current operation"

    def load(self, n_users, **kwargs):
        # No dedup delay: each message may arrive from up to d-1 neighbours.
        duplication_factor = average_node_degree - 1
        return message_size * messages_sent_per_hour * n_users * duplication_factor

    @property
    def header(self) -> str:
        return "Load case 3 (received load per node)"

    @property
    def assumptions(self):
        return [a1, a2, a3, a4, a6, a7, a31]
|
||||
|
||||
|
||||
# Case 4 :: single shard, n*(d-1) messages, gossip
class Case4(Case):
    """Receive load under current operation plus gossipsub IHAVE/IWANT overhead."""

    label: str = "case 4"
    legend: str = "Case 4. top: 6-regular; receive load per node, current operation, incl. gossip"

    def load(self, n_users, **kwargs):
        # Relay traffic as in case 3: messages arrive from up to d-1 neighbours.
        messages_received_per_hour = (
            messages_sent_per_hour * n_users * (average_node_degree - 1)
        )
        messages_load = message_size * messages_received_per_hour
        # Each received message is advertised (IHAVE) to d_lazy peers across
        # mcache_gossip history windows.
        num_ihave = messages_received_per_hour * d_lazy * mcache_gossip
        ihave_load = num_ihave * gossip_message_size
        # A fraction of IHAVEs triggers a reply: an IWANT plus the full message
        # (from requester to sender and back).
        gossip_response_load = (
            num_ihave * (gossip_message_size + message_size)
        ) * avg_ratio_gossip_replys
        gossip_total = ihave_load + gossip_response_load

        return messages_load + gossip_total

    @property
    def header(self) -> str:
        return "Load case 4 (received load per node incl. gossip)"

    @property
    def assumptions(self):
        return [a1, a2, a3, a4, a6, a7, a32, a33]
|
||||
|
||||
|
||||
# sharding case 1: multi shard, n*(d-1) messages, gossip
class ShardingCase1(Case):
    """Per-node receive load across multiple shards, including gossip."""

    label: str = "case 1"
    legend: str = "Sharding case 1. sharding: top: 6-regular; receive load per node, incl gossip"

    def load(self, n_users, **kwargs):
        """Sum the case-4 (relay + gossip) load over the shards a node follows.

        Fix: the per-shard user count divides by ``avg_shards_per_node`` instead
        of a hard-coded 3 (same value today, but keeps the code in sync with
        assumption A11: users are spread evenly over the shards), capped at
        ``avg_nodes_per_shard`` users per shard.
        """
        case_4 = Case4()
        users_per_shard = np.minimum(n_users / avg_shards_per_node, avg_nodes_per_shard)
        load_per_node_per_shard = case_4.load(users_per_shard)
        return avg_shards_per_node * load_per_node_per_shard

    @property
    def header(self) -> str:
        return "load sharding case 1 (received load per node incl. gossip)"

    @property
    def assumptions(self):
        return [a1, a2, a3, a4, a6, a8, a9, a10, a11, a32, a33]
|
||||
|
||||
|
||||
# sharding case 2: multi shard, n*(d-1) messages, gossip, 1:1 chat
class ShardingCase2(Case):
    """Per-node receive load across multiple shards plus a 1:1 chat shard."""

    label: str = "case 2"
    legend: str = (
        "Sharding case 2. sharding: top: 6-regular; receive load per node, incl gossip and 1:1 chat"
    )

    def load(self, n_users, **kwargs):
        """Case-4 load over the regular shards plus one 1:1 chat shard.

        Fix: per-shard users divide by ``avg_shards_per_node`` rather than a
        hard-coded 3 (same value today; matches assumption A11).
        """
        case_4 = Case4()
        users_per_shard = np.minimum(n_users / avg_shards_per_node, avg_nodes_per_shard)
        load_per_node_per_shard = case_4.load(users_per_shard)
        # 1:1 shards are filled one by one (A14), so a 1:1 shard can hold up to
        # avg_nodes_per_shard users regardless of how the regular shards split.
        load_per_node_1to1_shard = case_4.load(np.minimum(n_users, avg_nodes_per_shard))
        return (avg_shards_per_node * load_per_node_per_shard) + load_per_node_1to1_shard

    @property
    def header(self) -> str:
        return "load sharding case 2 (received load per node incl. gossip and 1:1 chat)"

    @property
    def assumptions(self):
        return [a1, a2, a3, a4, a6, a8, a9, a10, a11, a12, a13, a14, a32, a33]
|
||||
|
||||
|
||||
# sharding case 3: multi shard, naive light node
class ShardingCase3(Case):
    """Receive load of a naive light node that pulls full shards it is interested in."""

    label: str = "case 3"
    legend: str = "Sharding case 3. sharding: top: 6-regular; regular load for naive light node"

    def load(self, n_users, **kwargs):
        """Case-1 (store/full-shard) load summed over the followed shards.

        Fix: per-shard users divide by ``avg_shards_per_node`` rather than a
        hard-coded 3 (same value today; matches assumption A11).
        """
        case_1 = Case1()
        users_per_shard = np.minimum(n_users / avg_shards_per_node, avg_nodes_per_shard)
        load_per_node_per_shard = case_1.load(users_per_shard)
        return avg_shards_per_node * load_per_node_per_shard

    @property
    def header(self) -> str:
        return "load sharding case 3 (received load naive light node.)"

    @property
    def assumptions(self):
        return [a1, a2, a3, a4, a6, a8, a9, a10, a15, a32, a33]
|
||||
|
||||
|
||||
# Cases average latency
|
||||
# -----------------------------------------------------------
|
||||
|
||||
|
||||
class LatencyCase1(Case):
    """Average latency on a 6-regular topology, no gossip."""

    label: str = "latency case 1"
    legend: str = "Latency case 1. topology: 6-regular graph. No gossip"

    def load(self, n_users, degree):
        # Latency = expected hop count (upper bound) times the per-hop delay.
        return avg_node_distance_upper_bound(n_users, degree) * average_delay_per_hop

    @property
    def header(self) -> str:
        return (
            "Latency case 1 :: Topology: 6-regular graph. No gossip (note: gossip would help here)"
        )

    @property
    def description(self) -> str:
        # Latency cases override description: latency lines replace usage lines.
        parts = [
            "",
            get_header(self.header),
            get_assumptions_str(self.assumptions),
            get_latency_str(self.load),
            "------------------------------------------------------------",
        ]
        return "\n".join(parts)

    @property
    def assumptions(self):
        return [a3, a41, a42]
|
||||
@@ -1,2 +1,3 @@
|
||||
matplotlib==3.10.3
|
||||
numpy==2.3.0
|
||||
pydantic==2.11.7
|
||||
|
||||
50
waku_scalability/utils.py
Normal file
50
waku_scalability/utils.py
Normal file
@@ -0,0 +1,50 @@
|
||||
# Util and format functions
|
||||
# -----------------------------------------------------------
|
||||
|
||||
|
||||
class bcolors:
    """ANSI escape codes used to colorize terminal output."""

    HEADER = "\033[95m"  # bright magenta
    OKBLUE = "\033[94m"
    OKGREEN = "\033[92m"
    WARNING = "\033[93m"  # bright yellow
    FAIL = "\033[91m"  # bright red
    ENDC = "\033[0m"  # reset all attributes
    BOLD = "\033[1m"
    UNDERLINE = "\033[4m"
||||
|
||||
|
||||
def sizeof_fmt(num):
    """Format *num* (a size already expressed in MB) as e.g. '12.3MB'."""
    return f"{num:.1f}MB"
|
||||
|
||||
|
||||
def sizeof_fmt_kb(num):
    """Format *num* (a size expressed in MB) in kilobytes, e.g. 0.002 -> '2.05KB'."""
    return f"{num * 1024:.2f}KB"
|
||||
|
||||
|
||||
def magnitude_fmt(num):
    """Format a count with a metric suffix: 100 -> '100', 10000 -> '10k', 10**6 -> ' 1m'.

    Fix: the original fell off the end of the loop and returned None for
    num >= 10**9; such values now get a 'g' (giga) suffix.
    """
    for suffix in ("", "k", "m"):
        if num < 1000:
            return "%2d%s" % (num, suffix)
        num /= 1000
    # num has already been divided by 10**9 at this point.
    return "%2d%s" % (num, "g")
|
||||
|
||||
|
||||
# Color format based on daily bandwidth usage
|
||||
# <10mb/d = good, <30mb/d ok, <100mb/d bad, 100mb/d+ fail.
|
||||
def load_color_prefix(load):
    """Pick a color escape code for a bandwidth figure.

    Thresholds per the guideline above: <10 blue (good), <30 green (ok),
    <100 yellow (warning), otherwise red (fail).
    """
    thresholds = (
        (10, bcolors.OKBLUE),
        (30, bcolors.OKGREEN),
        (100, bcolors.WARNING),
    )
    for limit, color in thresholds:
        if load < limit:
            return color
    return bcolors.FAIL
|
||||
|
||||
|
||||
def load_color_fmt(load, string):
    """Wrap *string* in the color chosen for *load*, then reset the terminal color."""
    prefix = load_color_prefix(load)
    return f"{prefix}{string}{bcolors.ENDC}"
|
||||
|
||||
|
||||
def get_header(string) -> str:
    """Return *string* styled as a header line, followed by a trailing newline."""
    return f"{bcolors.HEADER}{string}{bcolors.ENDC}\n"
|
||||
@@ -3,368 +3,103 @@
|
||||
# - todo: separate the part on latency
|
||||
# based on ../whisper_scalability/whisper.py
|
||||
|
||||
from typing import List
|
||||
import matplotlib.pyplot as plt
|
||||
import numpy as np
|
||||
import math
|
||||
|
||||
# Util and format functions
|
||||
#-----------------------------------------------------------
|
||||
|
||||
class bcolors:
|
||||
HEADER = '\033[95m'
|
||||
OKBLUE = '\033[94m'
|
||||
OKGREEN = '\033[92m'
|
||||
WARNING = '\033[93m'
|
||||
FAIL = '\033[91m'
|
||||
ENDC = '\033[0m'
|
||||
BOLD = '\033[1m'
|
||||
UNDERLINE = '\033[4m'
|
||||
|
||||
def sizeof_fmt(num):
|
||||
return "%.1f%s" % (num, "MB")
|
||||
|
||||
def sizeof_fmt_kb(num):
|
||||
return "%.2f%s" % (num*1024, "KB")
|
||||
|
||||
def magnitude_fmt(num):
|
||||
for x in ['','k','m']:
|
||||
if num < 1000:
|
||||
return "%2d%s" % (num, x)
|
||||
num /= 1000
|
||||
|
||||
# Color format based on daily bandwidth usage
|
||||
# <10mb/d = good, <30mb/d ok, <100mb/d bad, 100mb/d+ fail.
|
||||
def load_color_prefix(load):
|
||||
if load < (10):
|
||||
color_level = bcolors.OKBLUE
|
||||
elif load < (30):
|
||||
color_level = bcolors.OKGREEN
|
||||
elif load < (100):
|
||||
color_level = bcolors.WARNING
|
||||
else:
|
||||
color_level = bcolors.FAIL
|
||||
return color_level
|
||||
|
||||
def load_color_fmt(load, string):
|
||||
return load_color_prefix(load) + string + bcolors.ENDC
|
||||
|
||||
def print_header(string):
|
||||
print(bcolors.HEADER + string + bcolors.ENDC + "\n")
|
||||
|
||||
def print_assumptions(xs):
|
||||
print("Assumptions/Simplifications:")
|
||||
for x in xs:
|
||||
print(x)
|
||||
print("")
|
||||
|
||||
def usage_str(load_users_fn, n_users):
|
||||
load = load_users_fn(n_users)
|
||||
return load_color_fmt(load, "For " + magnitude_fmt(n_users) + " users, receiving bandwidth is " + sizeof_fmt(load_users_fn(n_users)) + "/hour")
|
||||
|
||||
def print_usage(load_users):
|
||||
print(usage_str(load_users, 100))
|
||||
print(usage_str(load_users, 100 * 100))
|
||||
print(usage_str(load_users, 100 * 100 * 100))
|
||||
|
||||
def latency_str(latency_users_fn, n_users, degree):
|
||||
latency = latency_users_fn(n_users, degree)
|
||||
return load_color_fmt(latency, "For " + magnitude_fmt(n_users) + " the average latency is " + ("%.3f" % latency_users_fn(n_users, degree)) + " s")
|
||||
|
||||
def print_latency(latency_users):
|
||||
print(latency_str(latency_users, 100, average_node_degree))
|
||||
print(latency_str(latency_users, 100 * 100, average_node_degree))
|
||||
print(latency_str(latency_users, 100 * 100 * 100, average_node_degree))
|
||||
|
||||
def num_edges_dregular(num_nodes, degree):
|
||||
# we assume and even d; d-regular graphs with both where both n and d are odd don't exist
|
||||
return num_nodes * (degree/2)
|
||||
|
||||
def avg_node_distance_upper_bound(n_users, degree):
|
||||
return math.log(n_users, degree)
|
||||
|
||||
# Assumptions
|
||||
#-----------------------------------------------------------
|
||||
|
||||
# Users sent messages at a constant rate
|
||||
# The network topology is a d-regular graph (gossipsub aims at achieving this).
|
||||
|
||||
# general / topology
|
||||
average_node_degree = 6 # has to be even
|
||||
message_size = 0.002 # in MB (Mega Bytes)
|
||||
messages_sent_per_hour = 5 # ona a single pubsub topic / shard
|
||||
|
||||
# gossip
|
||||
gossip_message_size = 0.00005 # 50Bytes in MB (see https://github.com/libp2p/specs/pull/413#discussion_r1018821589 )
|
||||
d_lazy = 6 # gossip out degree
|
||||
mcache_gossip = 3 # Number of history windows to use when emitting gossip (see https://github.com/libp2p/specs/blob/master/pubsub/gossipsub/gossipsub-v1.0.md)
|
||||
avg_ratio_gossip_replys = 0.01 # -> this is a wild guess! (todo: investigate)
|
||||
|
||||
# multi shard
|
||||
avg_nodes_per_shard = 10000 # average number of nodes that a part of a single shard
|
||||
avg_shards_per_node = 3 # average number of shards a given node is part of
|
||||
|
||||
# latency
|
||||
average_delay_per_hop = 0.1 #s
|
||||
|
||||
# TODO: load case for status control messages (note: this also introduces messages by currently online, but not active users.)
|
||||
# TODO: spread in the latency distribution (the highest 10%ish of latencies might be too high)
|
||||
|
||||
# Assumption strings (general/topology)
|
||||
a1 = "- A01. Message size (static): " + sizeof_fmt_kb(message_size)
|
||||
a2 = "- A02. Messages sent per node per hour (static) (assuming no spam; but also no rate limiting.): " + str(messages_sent_per_hour)
|
||||
a3 = "- A03. The network topology is a d-regular graph of degree (static): " + str(average_node_degree)
|
||||
a4 = "- A04. Messages outside of Waku Relay are not considered, e.g. store messages."
|
||||
a5 = "- A05. Messages are only sent once along an edge. (requires delays before sending)"
|
||||
a6 = "- A06. Messages are sent to all d-1 neighbours as soon as receiving a message (current operation)" # Thanks @Mmenduist
|
||||
a7 = "- A07. Single shard (i.e. single pubsub mesh)"
|
||||
a8 = "- A08. Multiple shards; mapping of content topic (multicast group) to shard is 1 to 1"
|
||||
a9 = "- A09. Max number of nodes per shard (static) " + str(avg_nodes_per_shard)
|
||||
a10 = "- A10. Number of shards a given node is part of (static) " + str(avg_shards_per_node)
|
||||
a11 = "- A11. Number of nodes in the network is variable.\n\
|
||||
These nodes are distributed evenly over " + str(avg_shards_per_node) + " shards.\n\
|
||||
Once all of these shards have " + str(avg_nodes_per_shard) + " nodes, new shards are spawned.\n\
|
||||
These new shards have no influcene on this model, because the nodes we look at are not part of these new shards."
|
||||
a12 = "- A12. Including 1:1 chat. Messages sent to a given user are sent into a 1:1 shard associated with that user's node.\n\
|
||||
Effectively, 1:1 chat adds a receive load corresponding to one additional shard a given node has to be part of."
|
||||
a13 = "- A13. 1:1 chat messages sent per node per hour (static): " + str(messages_sent_per_hour) # could introduce a separate variable here
|
||||
a14 = "- A14. 1:1 chat shards are filled one by one (not evenly distributed over the shards).\n\
|
||||
This acts as an upper bound and overestimates the 1:1 load for lower node counts."
|
||||
a15 = "- A15. Naive light node. Requests all messages in shards that have (large) 1:1 mapped multicast groups the light node is interested in."
|
||||
|
||||
|
||||
# Assumption strings (store)
|
||||
a21 = "- A21. Store nodes do not store duplicate messages."
|
||||
|
||||
# Assumption strings (gossip)
|
||||
a31 = "- A21. Gossip is not considered."
|
||||
a32 = "- A32. Gossip message size (IHAVE/IWANT) (static):" + sizeof_fmt_kb(gossip_message_size)
|
||||
a33 = "- A33. Ratio of IHAVEs followed-up by an IWANT (incl. the actual requested message):" + str(avg_ratio_gossip_replys)
|
||||
|
||||
# Assumption strings (delay)
|
||||
a41 = "- A41. Delay is calculated based on an upper bound of the expected distance."
|
||||
a42 = "- A42. Average delay per hop (static): " + str(average_delay_per_hop) + "s."
|
||||
|
||||
|
||||
# Cases Load Per Node
|
||||
#-----------------------------------------------------------
|
||||
|
||||
# Case 1 :: singe shard, unique messages, store
|
||||
def load_case1(n_users):
|
||||
return message_size * messages_sent_per_hour * n_users
|
||||
|
||||
def print_load_case1():
|
||||
print("")
|
||||
print_header("Load case 1 (store load; corresponds to received load per naive light node)")
|
||||
print_assumptions([a1, a2, a3, a4, a7, a21])
|
||||
print_usage(load_case1)
|
||||
print("")
|
||||
print("------------------------------------------------------------")
|
||||
|
||||
# Case 2 :: single shard, (n*d)/2 messages
|
||||
def load_case2(n_users):
|
||||
return message_size * messages_sent_per_hour * num_edges_dregular(n_users, average_node_degree)
|
||||
|
||||
def print_load_case2():
|
||||
print("")
|
||||
print_header("Load case 2 (received load per node)")
|
||||
print_assumptions([a1, a2, a3, a4, a5, a7, a31])
|
||||
print_usage(load_case2)
|
||||
print("")
|
||||
print("------------------------------------------------------------")
|
||||
|
||||
# Case 3 :: single shard n*(d-1) messages
|
||||
def load_case3(n_users):
|
||||
return message_size * messages_sent_per_hour * n_users * (average_node_degree-1)
|
||||
|
||||
def print_load_case3():
|
||||
print("")
|
||||
print_header("Load case 3 (received load per node)")
|
||||
print_assumptions([a1, a2, a3, a4, a6, a7, a31])
|
||||
print_usage(load_case3)
|
||||
print("")
|
||||
print("------------------------------------------------------------")
|
||||
|
||||
|
||||
# Case 4:single shard n*(d-1) messages, gossip
|
||||
def load_case4(n_users):
|
||||
messages_received_per_hour = messages_sent_per_hour * n_users * (average_node_degree-1) # see case 3
|
||||
messages_load = message_size * messages_received_per_hour
|
||||
num_ihave = messages_received_per_hour * d_lazy * mcache_gossip
|
||||
ihave_load = num_ihave * gossip_message_size
|
||||
gossip_response_load = (num_ihave * (gossip_message_size + message_size)) * avg_ratio_gossip_replys # reply load contains both an IWANT (from requester to sender), and the actual wanted message (from sender to requester)
|
||||
gossip_total = ihave_load + gossip_response_load
|
||||
|
||||
return messages_load + gossip_total
|
||||
|
||||
def print_load_case4():
|
||||
print("")
|
||||
print_header("Load case 4 (received load per node incl. gossip)")
|
||||
print_assumptions([a1, a2, a3, a4, a6, a7, a32, a33])
|
||||
print_usage(load_case4)
|
||||
print("")
|
||||
print("------------------------------------------------------------")
|
||||
|
||||
# sharding case 1: multi shard, n*(d-1) messages, gossip
|
||||
def load_sharding_case1(n_users):
|
||||
load_per_node_per_shard = load_case4(np.minimum(n_users/3, avg_nodes_per_shard))
|
||||
return avg_shards_per_node * load_per_node_per_shard
|
||||
|
||||
def print_load_sharding_case1():
|
||||
print("")
|
||||
print_header("load sharding case 1 (received load per node incl. gossip)")
|
||||
print_assumptions([a1, a2, a3, a4, a6, a8, a9, a10, a11, a32, a33])
|
||||
print_usage(load_sharding_case1)
|
||||
print("")
|
||||
print("------------------------------------------------------------")
|
||||
|
||||
# sharding case 2: multi shard, n*(d-1) messages, gossip, 1:1 chat
|
||||
def load_sharding_case2(n_users):
|
||||
load_per_node_per_shard = load_case4(np.minimum(n_users/3, avg_nodes_per_shard))
|
||||
load_per_node_1to1_shard = load_case4(np.minimum(n_users, avg_nodes_per_shard))
|
||||
return (avg_shards_per_node * load_per_node_per_shard) + load_per_node_1to1_shard
|
||||
|
||||
def print_load_sharding_case2():
|
||||
print("")
|
||||
print_header("load sharding case 2 (received load per node incl. gossip and 1:1 chat)")
|
||||
print_assumptions([a1, a2, a3, a4, a6, a8, a9, a10, a11, a12, a13, a14, a32, a33])
|
||||
print_usage(load_sharding_case2)
|
||||
print("")
|
||||
print("------------------------------------------------------------")
|
||||
|
||||
# sharding case 3: multi shard, naive light node
|
||||
def load_sharding_case3(n_users):
|
||||
load_per_node_per_shard = load_case1(np.minimum(n_users/3, avg_nodes_per_shard))
|
||||
return avg_shards_per_node * load_per_node_per_shard
|
||||
|
||||
def print_load_sharding_case3():
|
||||
print("")
|
||||
print_header("load sharding case 3 (received load naive light node.)")
|
||||
print_assumptions([a1, a2, a3, a4, a6, a8, a9, a10, a15, a32, a33])
|
||||
print_usage(load_sharding_case3)
|
||||
print("")
|
||||
print("------------------------------------------------------------")
|
||||
|
||||
|
||||
|
||||
|
||||
# Cases average latency
|
||||
#-----------------------------------------------------------
|
||||
|
||||
def latency_case1(n_users, degree):
|
||||
return avg_node_distance_upper_bound(n_users, degree) * average_delay_per_hop
|
||||
|
||||
def print_latency_case1():
|
||||
print("")
|
||||
print_header("Latency case 1 :: Topology: 6-regular graph. No gossip (note: gossip would help here)")
|
||||
print_assumptions([a3, a41, a42])
|
||||
print_latency(latency_case1)
|
||||
print("")
|
||||
print("------------------------------------------------------------")
|
||||
|
||||
from cases import (
|
||||
Case,
|
||||
Case1,
|
||||
Case2,
|
||||
Case3,
|
||||
Case4,
|
||||
LatencyCase1,
|
||||
ShardingCase1,
|
||||
ShardingCase2,
|
||||
ShardingCase3,
|
||||
)
|
||||
from utils import bcolors
|
||||
|
||||
# Run cases
|
||||
#-----------------------------------------------------------
|
||||
# -----------------------------------------------------------
|
||||
|
||||
# Print goals
|
||||
print("")
|
||||
print(bcolors.HEADER + "Waku relay theoretical model results (single shard and multi shard scenarios)." + bcolors.ENDC)
|
||||
print(
|
||||
bcolors.HEADER
|
||||
+ "Waku relay theoretical model results (single shard and multi shard scenarios)."
|
||||
+ bcolors.ENDC
|
||||
)
|
||||
|
||||
print_load_case1()
|
||||
print_load_case2()
|
||||
print_load_case3()
|
||||
print_load_case4()
|
||||
cases: List[Case] = [
|
||||
Case1(),
|
||||
Case2(),
|
||||
Case3(),
|
||||
Case4(),
|
||||
ShardingCase1(),
|
||||
ShardingCase2(),
|
||||
ShardingCase3(),
|
||||
LatencyCase1(),
|
||||
]
|
||||
|
||||
print_load_sharding_case1()
|
||||
print_load_sharding_case2()
|
||||
print_load_sharding_case3()
|
||||
|
||||
print_latency_case1()
|
||||
for case in cases:
|
||||
print(case.description)
|
||||
|
||||
# Plot
|
||||
#-----------------------------------------------------------
|
||||
|
||||
def plot_load():
    """Plot the single-shard load cases 1-4 against user count and save as a PNG."""
    plt.clf() # clear current plot

    # x samples: 5 log-spaced user counts from 10^2 to 10^6.
    n_users = np.logspace(2, 6, num=5)
    print(n_users)

    # NOTE(review): xlim tops out at 10^4 although n_users reaches 10^6 — confirm intended.
    plt.xlim(100, 10**4)
    plt.ylim(1, 10**4)

    plt.plot(n_users, load_case1(n_users), label='case 1', linewidth=4, linestyle='dashed')
    plt.plot(n_users, load_case2(n_users), label='case 2', linewidth=4, linestyle='dashed')
    plt.plot(n_users, load_case3(n_users), label='case 3', linewidth=4, linestyle='dashed')
    plt.plot(n_users, load_case4(n_users), label='case 4', linewidth=4, linestyle='dashed')

    # Legend strings mirror the four load cases above.
    case1 = "Case 1. top: 6-regular; store load (also: naive light node)"
    case2 = "Case 2. top: 6-regular; receive load per node, send delay to reduce duplicates"
    case3 = "Case 3. top: 6-regular; receive load per node, current operation"
    case4 = "Case 4. top: 6-regular; receive load per node, current operation, incl. gossip"

    plt.xlabel('number of users (log)')
    plt.ylabel('mb/hour (log)')
    plt.legend([case1, case2, case3, case4], loc='upper left')
    plt.xscale('log')
    plt.yscale('log')

    # Background bands classify load levels (blue=good .. red=too high).
    plt.axhspan(0, 10, facecolor='0.2', alpha=0.2, color='blue')
    plt.axhspan(10, 100, facecolor='0.2', alpha=0.2, color='green')
    plt.axhspan(100, 3000, facecolor='0.2', alpha=0.2, color='orange') # desktop nodes can handle this; load comparable to streaming (but both upload and download, and with spikes)
    plt.axhspan(3000, 10**6, facecolor='0.2', alpha=0.2, color='red')

    caption = "Plot 1: single shard."
    plt.figtext(0.5, 0.01, caption, wrap=True, horizontalalignment='center', fontsize=12)

    # plt.show()

    figure = plt.gcf() # get current figure
    figure.set_size_inches(16, 9)
    # plt.savefig("waku_scaling_plot.svg")
    plt.savefig("waku_scaling_single_shard_plot.png", dpi=300, orientation="landscape")
|
||||
|
||||
def plot_load_sharding():
    """Plot the estimated per-node load (MB/hour) for the multi-shard cases
    (plus the all-shards store baseline) over a log-spaced range of user
    counts, and save the figure as waku_scaling_multi_shard_plot.png."""
    plt.clf()  # start from a clean figure

    node_counts = np.logspace(2, 6, num=5)
    print(node_counts)

    plt.xlim(100, 10**6)
    plt.ylim(1, 10**5)

    # (load function, short line label, descriptive legend entry) per case.
    # The store baseline is the non-sharded case 1: a store node still has to
    # keep *all* messages regardless of sharding.
    case_specs = [
        (load_case1, 'sharding store', "Sharding store load; participate in all shards; top: 6-regular"),
        (load_sharding_case1, 'case 1', "Sharding case 1. sharding: top: 6-regular; receive load per node, incl gossip"),
        (load_sharding_case2, 'case 2', "Sharding case 2. sharding: top: 6-regular; receive load per node, incl gossip and 1:1 chat"),
        (load_sharding_case3, 'case 3', "Sharding case 3. sharding: top: 6-regular; regular load for naive light node"),
    ]
    for load_fn, short_label, _legend in case_specs:
        plt.plot(node_counts, load_fn(node_counts), label=short_label, linewidth=4, linestyle='dashed')

    plt.xlabel('number of users (log)')
    plt.ylabel('mb/hour (log)')
    plt.legend([legend for _fn, _lbl, legend in case_specs], loc='upper left')
    plt.xscale('log')
    plt.yscale('log')

    # Qualitative load bands: blue = negligible ... red = prohibitive.
    plt.axhspan(0, 10, facecolor='0.2', alpha=0.2, color='blue')
    plt.axhspan(10, 100, facecolor='0.2', alpha=0.2, color='green')
    plt.axhspan(100, 3000, facecolor='0.2', alpha=0.2, color='orange')  # desktop nodes can handle this; load comparable to streaming (but both upload and download, and with spikes)
    plt.axhspan(3000, 10**6, facecolor='0.2', alpha=0.2, color='red')

    plt.figtext(0.5, 0.01, "Plot 2: multi shard.", wrap=True, horizontalalignment='center', fontsize=12)

    # plt.show()

    figure = plt.gcf()  # get current figure
    figure.set_size_inches(16, 9)
    # plt.savefig("waku_scaling_plot.svg")
    plt.savefig("waku_scaling_multi_shard_plot.png", dpi=300, orientation="landscape")
|
||||
# -----------------------------------------------------------
|
||||
|
||||
|
||||
def plot_load(
    caption: str,
    cases: List[Case],
    file_path: str,
    xlim: tuple = (100, 10**4),
    ylim: tuple = (1, 10**4),
):
    """Plot the estimated per-node load (MB/hour) of the given cases over a
    log-spaced range of user counts and save the figure to *file_path*.

    Args:
        caption: Figure caption rendered below the plot.
        cases: Case objects; each must provide ``load(n_users)`` plus
            ``label`` and ``legend`` attributes (see cases.py — e.g.
            ``Case1(label=..., legend=...)``).
        file_path: Destination path for the saved PNG.
        xlim, ylim: Axis limits as (low, high). Defaults match the
            single-shard plot; the multi-shard plot previously used
            ``(100, 10**6)`` / ``(1, 10**5)``.
    """
    # NOTE(review): the previous body started with stray recursive-looking
    # calls to plot_load() / plot_load_sharding() — removed, as they would
    # raise (missing arguments) or recurse before plotting anything.
    plt.clf()  # clear current plot

    n_users = np.logspace(2, 6, num=5)
    print(n_users)

    plt.xlim(*xlim)
    plt.ylim(*ylim)

    for case in cases:
        plt.plot(n_users, case.load(n_users), label=case.label, linewidth=4, linestyle="dashed")

    plt.xlabel("number of users (log)")
    plt.ylabel("mb/hour (log)")
    # Pass the cases' descriptive legend strings, not the Case objects
    # themselves (matplotlib would otherwise str() each instance).
    # Assumes every case exposes a `legend` attribute, as Case1(legend=...)
    # suggests — TODO confirm against cases.py.
    plt.legend([case.legend for case in cases], loc="upper left")
    plt.xscale("log")
    plt.yscale("log")

    # Qualitative load bands: blue = negligible ... red = prohibitive.
    plt.axhspan(0, 10, facecolor="0.2", alpha=0.2, color="blue")
    plt.axhspan(10, 100, facecolor="0.2", alpha=0.2, color="green")
    plt.axhspan(
        100, 3000, facecolor="0.2", alpha=0.2, color="orange"
    )  # desktop nodes can handle this; load comparable to streaming (but both upload and download, and with spikes)
    plt.axhspan(3000, 10**6, facecolor="0.2", alpha=0.2, color="red")

    plt.figtext(0.5, 0.01, caption, wrap=True, horizontalalignment="center", fontsize=12)

    # plt.show()

    figure = plt.gcf()  # get current figure
    figure.set_size_inches(16, 9)
    # plt.savefig("waku_scaling_plot.svg")
    plt.savefig(file_path, dpi=300, orientation="landscape")
|
||||
|
||||
|
||||
# Render both figures: single-shard (cases 1-4) and multi-shard
# (store baseline + sharding cases 1-3).
plot_load(
    caption="Plot 1: single shard.",
    cases=[Case1(), Case2(), Case3(), Case4()],
    file_path="waku_scaling_single_shard_plot.png",
)

plot_load(
    caption="Plot 2: multi shard.",
    cases=[
        # Store load is the non-sharded Case1: a store node keeps *all*
        # messages regardless of sharding; only its labels differ here.
        Case1(
            label="sharding store",
            legend="Sharding store load; participate in all shards; top: 6-regular",
        ),
        ShardingCase1(),
        ShardingCase2(),
        ShardingCase3(),
    ],
    # Fix: was "" — plt.savefig would fail (or write nowhere useful),
    # silently dropping the multi-shard figure that the pre-refactor code
    # saved under this name.
    file_path="waku_scaling_multi_shard_plot.png",
)
|
||||
|
||||
Reference in New Issue
Block a user