refactor of the analyzer

GioeleB00 · GioeleB00 · commit 4a6c82f1f1b3 · 2025-08-01T15:33:16.000+02:00
diff --git a/src/app/config/constants.py b/src/app/config/constants.py
@@ -216,9 +216,9 @@ class SamplePeriods(float, Enum):
   we have to extract a time series
   """
 
-  STANDARD_TIME = 0.005 # 5 MILLISECONDS
+  STANDARD_TIME = 0.01 # 10 MILLISECONDS
   MINIMUM_TIME = 0.001 # 1 MILLISECOND
-  MAXIMUM_TIME = 0.1    # 10 MILLISECONDS
+  MAXIMUM_TIME = 0.1   # 100 MILLISECONDS
 
 # ======================================================================
 # CONSTANTS FOR EVENT METRICS
@@ -244,15 +244,31 @@ class AggregatedMetricName(StrEnum):
   """aggregated metrics to calculate at the end of simulation"""
 
   LATENCY_STATS = "latency_stats"
-  THROUGHPUT_RPS = "throughput_rps"
+  THROUGHPUT = "throughput_rps"
   LLM_STATS = "llm_stats"
 
 # ======================================================================
 # CONSTANTS FOR SERVER RUNTIME
 # ======================================================================
 
 class ServerResourceName(StrEnum):
-    """Keys for each server resource type, used when building the container map."""
+  """Keys for each server resource type, used when building the container map."""
 
-    CPU = "CPU"
-    RAM = "RAM"
+  CPU = "CPU"
+  RAM = "RAM"
+
+# ======================================================================
+# CONSTANTS FOR LATENCY STATS
+# ======================================================================
+
+class LatencyKey(StrEnum):
+  """Keys of the latency statistics dict built by the results analyzer."""
+
+  TOTAL_REQUESTS = "total_requests"  # number of latency samples
+  MEAN           = "mean"            # arithmetic mean of the latencies
+  MEDIAN         = "median"          # median latency
+  STD_DEV        = "std_dev"         # standard deviation of the latencies
+  P95            = "p95"             # 95th percentile
+  P99            = "p99"             # 99th percentile
+  MIN            = "min"             # smallest observed latency
+  MAX            = "max"             # largest observed latency
diff --git a/src/app/config/plot_constants.py b/src/app/config/plot_constants.py
@@ -0,0 +1,47 @@
+"""Dataclass to define a central structure to plot the metrics"""
+from dataclasses import dataclass
+
+
+@dataclass(frozen=True)
+class PlotCfg:
+    """Immutable bundle of the text strings used to draw one metric plot."""
+
+    no_data: str  # placeholder text drawn when there is nothing to plot
+    title:   str  # axes title
+    x_label: str  # x-axis label
+    y_label: str  # y-axis label
+    ready_label: str | None = None  # legend suffix for ready-queue series
+    io_label: str | None = None  # legend suffix for I/O-queue series
+    legend_label: str | None = None  # generic legend suffix for each series
+
+LATENCY_PLOT = PlotCfg(  # labels for the request-latency histogram
+    no_data="No latency data",
+    title="Request Latency Distribution",
+    x_label="Latency (s)",
+    y_label="Frequency",
+)
+
+THROUGHPUT_PLOT = PlotCfg(  # labels for the throughput-over-time plot
+    no_data="No throughput data",
+    title="Throughput (RPS)",
+    x_label="Time (s)",
+    y_label="Requests/s",
+)
+
+
+SERVER_QUEUES_PLOT = PlotCfg(  # labels for the server queue-length plot
+    no_data="No queue data",
+    title="Server Queues",
+    x_label="Time (s)",
+    y_label="Queue length",
+    ready_label="Ready queue",
+    io_label="I/O queue",
+)
+
+RAM_PLOT = PlotCfg(  # labels for the RAM-usage-over-time plot
+    no_data="No RAM data",
+    title="RAM Usage",
+    x_label="Time (s)",
+    y_label="RAM (MB)",
+    legend_label="RAM",
+)
diff --git a/src/app/metrics/analyzer.py b/src/app/metrics/analyzer.py
@@ -7,6 +7,14 @@
 
 import numpy as np
 
+from app.config.constants import LatencyKey, SampledMetricName
+from app.config.plot_constants import (
+    LATENCY_PLOT,
+    RAM_PLOT,
+    SERVER_QUEUES_PLOT,
+    THROUGHPUT_PLOT,
+)
+
 if TYPE_CHECKING:
 
     from matplotlib.axes import Axes
@@ -26,6 +34,9 @@ class ResultsAnalyzer:
       - sampled metrics from servers and edges
     """
 
+    # Length, in seconds, of each window over which throughput (RPS) is computed
+    _WINDOW_SIZE_S: float = 1
+
     def __init__(
         self,
         *,
@@ -49,7 +60,7 @@ def __init__(
 
         # Lazily computed caches
         self.latencies: list[float] | None = None
-        self.latency_stats: dict[str, float] | None = None
+        self.latency_stats: dict[LatencyKey, float] | None = None
         self.throughput_series: tuple[list[float], list[float]] | None = None
         self.sampled_metrics: dict[str, dict[str, list[float]]] | None = None
 
@@ -72,36 +83,35 @@ def _process_event_metrics(self) -> None:
         if self.latencies:
             arr = np.array(self.latencies)
             self.latency_stats = {
-                "total_requests": float(arr.size),
-                "mean": float(np.mean(arr)),
-                "median": float(np.median(arr)),
-                "std_dev": float(np.std(arr)),
-                "p95": float(np.percentile(arr, 95)),
-                "p99": float(np.percentile(arr, 99)),
-                "min": float(np.min(arr)),
-                "max": float(np.max(arr)),
+                LatencyKey.TOTAL_REQUESTS: float(arr.size),
+                LatencyKey.MEAN: float(np.mean(arr)),
+                LatencyKey.MEDIAN: float(np.median(arr)),
+                LatencyKey.STD_DEV: float(np.std(arr)),
+                LatencyKey.P95: float(np.percentile(arr, 95)),
+                LatencyKey.P99: float(np.percentile(arr, 99)),
+                LatencyKey.MIN: float(np.min(arr)),
+                LatencyKey.MAX: float(np.max(arr)),
             }
         else:
             self.latency_stats = {}
 
         # 3) Throughput per 1s window
         completion_times = sorted(clock.finish for clock in self._client.rqs_clock)
-        window_size = 1.0
         end_time = self._settings.total_simulation_time
 
         timestamps: list[float] = []
         rps_values: list[float] = []
         count = 0
         idx = 0
-        current_end = window_size
+        current_end = ResultsAnalyzer._WINDOW_SIZE_S
 
         while current_end <= end_time:
             while idx < len(completion_times) and completion_times[idx] <= current_end:
                 count += 1
                 idx += 1
             timestamps.append(current_end)
-            rps_values.append(count / window_size)
-            current_end += window_size
+            rps_values.append(count / ResultsAnalyzer._WINDOW_SIZE_S)
+            current_end += ResultsAnalyzer._WINDOW_SIZE_S
             count = 0
 
         self.throughput_series = (timestamps, rps_values)
@@ -122,7 +132,7 @@ def _extract_sampled_metrics(self) -> None:
 
         self.sampled_metrics = metrics
 
-    def get_latency_stats(self) -> dict[str, float]:
+    def get_latency_stats(self) -> dict[LatencyKey, float]:
         """Return latency statistics, computing them if necessary."""
         self.process_all_metrics()
         return self.latency_stats or {}
@@ -139,73 +149,77 @@ def get_sampled_metrics(self) -> dict[str, dict[str, list[float]]]:
         assert self.sampled_metrics is not None
         return self.sampled_metrics
 
-    # TODO(Gioele Botta): create a class of constants to remove all magic words
     def plot_latency_distribution(self, ax: Axes) -> None:
         """Draw a histogram of request latencies onto the given Axes."""
         if not self.latencies:
-            ax.text(0.5, 0.5, "No latency data", ha="center", va="center")
+            ax.text(0.5, 0.5, LATENCY_PLOT.no_data, ha="center", va="center")
             return
 
         ax.hist(self.latencies, bins=50)
-        ax.set_title("Request Latency Distribution")
-        ax.set_xlabel("Latency (s)")
-        ax.set_ylabel("Frequency")
+        ax.set_title(LATENCY_PLOT.title)
+        ax.set_xlabel(LATENCY_PLOT.x_label)
+        ax.set_ylabel(LATENCY_PLOT.y_label)
         ax.grid(visible=True)
 
     def plot_throughput(self, ax: Axes) -> None:
         """Draw throughput (RPS) over time onto the given Axes."""
         timestamps, values = self.get_throughput_series()
         if not timestamps:
-            ax.text(0.5, 0.5, "No throughput data", ha="center", va="center")
+            ax.text(0.5, 0.5, THROUGHPUT_PLOT.no_data, ha="center", va="center")
             return
 
         ax.plot(timestamps, values, marker="o", linestyle="-")
-        ax.set_title("Throughput (RPS)")
-        ax.set_xlabel("Time (s)")
-        ax.set_ylabel("Requests/s")
+        ax.set_title(THROUGHPUT_PLOT.title)
+        ax.set_xlabel(THROUGHPUT_PLOT.x_label)
+        ax.set_ylabel(THROUGHPUT_PLOT.y_label)
         ax.grid(visible=True)
 
     def plot_server_queues(self, ax: Axes) -> None:
         """Draw server queue lengths over time onto the given Axes."""
         metrics = self.get_sampled_metrics()
-        ready = metrics.get("ready_queue_len", {})
-        io_q = metrics.get("event_loop_io_sleep", {})
+        ready = metrics.get(SampledMetricName.READY_QUEUE_LEN, {})
+        io_q = metrics.get(SampledMetricName.EVENT_LOOP_IO_SLEEP, {})
 
         if not (ready or io_q):
-            ax.text(0.5, 0.5, "No queue data", ha="center", va="center")
+            ax.text(0.5, 0.5, SERVER_QUEUES_PLOT.no_data, ha="center", va="center")
             return
 
         samples = len(next(iter(ready.values()), []))
         times = np.arange(samples) * self._settings.sample_period_s
 
         for sid, vals in ready.items():
-            ax.plot(times, vals, label=f"{sid} (ready)")
+            ax.plot(times, vals, label=f"{sid} {SERVER_QUEUES_PLOT.ready_label}")
         for sid, vals in io_q.items():
-            ax.plot(times, vals, label=f"{sid} (I/O)", linestyle="--")
-
-        ax.set_title("Server Queues")
-        ax.set_xlabel("Time (s)")
-        ax.set_ylabel("Queue Length")
+            ax.plot(
+                times,
+                vals,
+                label=f"{sid} {SERVER_QUEUES_PLOT.io_label}",
+                linestyle="--",
+            )
+
+        ax.set_title(SERVER_QUEUES_PLOT.title)
+        ax.set_xlabel(SERVER_QUEUES_PLOT.x_label)
+        ax.set_ylabel(SERVER_QUEUES_PLOT.y_label)
         ax.legend()
         ax.grid(visible=True)
 
     def plot_ram_usage(self, ax: Axes) -> None:
         """Draw RAM usage over time onto the given Axes."""
         metrics = self.get_sampled_metrics()
-        ram = metrics.get("ram_in_use", {})
+        ram = metrics.get(SampledMetricName.RAM_IN_USE, {})
 
         if not ram:
-            ax.text(0.5, 0.5, "No RAM data", ha="center", va="center")
+            ax.text(0.5, 0.5, RAM_PLOT.no_data, ha="center", va="center")
             return
 
         samples = len(next(iter(ram.values())))
         times = np.arange(samples) * self._settings.sample_period_s
 
         for sid, vals in ram.items():
-            ax.plot(times, vals, label=f"{sid} RAM")
+            ax.plot(times, vals, label=f"{sid} {RAM_PLOT.legend_label}")
 
-        ax.set_title("RAM Usage")
-        ax.set_xlabel("Time (s)")
-        ax.set_ylabel("RAM (MB)")
+        ax.set_title(RAM_PLOT.title)
+        ax.set_xlabel(RAM_PLOT.x_label)
+        ax.set_ylabel(RAM_PLOT.y_label)
         ax.legend()
         ax.grid(visible=True)
diff --git a/tests/unit/metrics/test_analyzer.py b/tests/unit/metrics/test_analyzer.py