AsyncFlow-Sim
diff --git a/‎src/asyncflow/schemas/payload.py‎
Lines changed: 52 additions & 0 deletions b/‎src/asyncflow/schemas/payload.py‎
Lines changed: 52 additions & 0 deletions
diff --git a/‎tests/integration/event_injection/lb_two_servers.py‎
Lines changed: 113 additions & 0 deletions b/‎tests/integration/event_injection/lb_two_servers.py‎
Lines changed: 113 additions & 0 deletions
diff --git a/‎tests/integration/event_injection/single_server.py‎
Lines changed: 108 additions & 0 deletions b/‎tests/integration/event_injection/single_server.py‎
Lines changed: 108 additions & 0 deletions
@@ -200,3 +200,55 @@ def ensure_not_all_servers_are_down_simultaneously(
         return model
 
 
+    @model_validator(mode="after")  # type: ignore[arg-type]
+    def forbid_overlapping_server_outages(
+        cls,  # noqa: N805
+        model: "SimulationPayload",
+    ) -> "SimulationPayload":
+        """
+        Forbid overlapping SERVER_DOWN intervals targeting the same server.
+
+        Rationale: keeps runtime simple (no reference counting). Back-to-back
+        windows (END at t and START at t) are allowed because END marks sort
+        before START marks at the same timestamp. Returns ``model`` unchanged;
+        raises ValueError at the first START found while an outage is active.
+        """
+        events = model.events
+        if not events:  # no events: nothing to validate
+            return model
+        # Only events whose target_id is a server node are inspected below.
+        servers_ids = {s.id for s in model.topology_graph.nodes.servers}
+
+        # Build per-server timelines with (time, kind) marks only for server outages
+        per_server: dict[str, list[tuple[float, str]]] = {}
+        for ev in events:
+            if (
+                ev.target_id in servers_ids
+                and ev.start.kind == EventDescription.SERVER_DOWN
+            ):
+                per_server.setdefault(
+                    ev.target_id, []).append((ev.start.t_start, "start"),
+                )
+                per_server[ev.target_id].append((ev.end.t_end, "end"))
+        # NOTE(review): the sweep assumes t_start < t_end per event -- confirm.
+        # Sweep-line per server: sort by (time, END first), ensure active<=1
+        for srv_id, timeline in per_server.items():
+            if not timeline:  # defensive: lists built above are never empty
+                continue
+            # END before START at same t (False sorts before True)
+            timeline.sort(key=lambda x: (x[0], x[1] == "start"))
+            active = 0  # number of outage windows currently open
+            for t, mark in timeline:
+                if mark == "end":
+                    if active > 0:  # never let the counter go negative
+                        active -= 1
+                else:  # START
+                    if active >= 1:  # a window is still open: overlap
+                        msg = (f"Overlapping events for server '{srv_id}' at t={t:.6f};"
+                              " server outage windows must not overlap.")
+                        raise ValueError(msg)
+                    active += 1
+
+        return model
+
+
@@ -0,0 +1,113 @@
+"""Integration test: LB with two servers and concurrent event injections.
+
+Topology:
+
+  rqs-1 → client-1 → lb-1 → {srv-1, srv-2}
+                     srv-* → client-1
+
+Events:
+- NETWORK_SPIKE on 'client-to-lb' in [0.20, 0.35].
+- SERVER_DOWN/UP on 'srv-1' in [0.40, 0.55].
+
+Assertions:
+- Simulation completes.
+- Latency stats and throughput exist.
+"""
+
+from __future__ import annotations
+
+from typing import TYPE_CHECKING
+
+import simpy
+
+from asyncflow.config.constants import Distribution, EventDescription, LatencyKey
+from asyncflow.runtime.simulation_runner import SimulationRunner
+from asyncflow.schemas.common.random_variables import RVConfig
+from asyncflow.schemas.events.injection import EventInjection
+from asyncflow.schemas.payload import SimulationPayload
+from asyncflow.schemas.settings.simulation import SimulationSettings
+from asyncflow.schemas.topology.edges import Edge
+from asyncflow.schemas.topology.graph import TopologyGraph
+from asyncflow.schemas.topology.nodes import (
+    Client,
+    LoadBalancer,
+    Server,
+    ServerResources,
+    TopologyNodes,
+)
+from asyncflow.schemas.workload.rqs_generator import RqsGenerator
+
+if TYPE_CHECKING:
+    from asyncflow.metrics.analyzer import ResultsAnalyzer
+
+
+def _server(sid: str) -> Server:  # server with default resources, no endpoints
+    return Server(id=sid, server_resources=ServerResources(), endpoints=[])
+
+
+def _edge(eid: str, src: str, tgt: str, mean: float = 0.002) -> Edge:
+    return Edge(  # edge from src to tgt with Poisson-distributed latency
+        id=eid,
+        source=src,
+        target=tgt,
+        latency=RVConfig(mean=mean, distribution=Distribution.POISSON),
+    )
+
+
+def test_lb_two_servers_with_events_end_to_end() -> None:
+    """Run an LB with two servers and two injected events; check KPIs exist."""
+    env = simpy.Environment()
+    rqs = RqsGenerator(
+        id="rqs-1",
+        avg_active_users=RVConfig(mean=1.0),
+        avg_request_per_minute_per_user=RVConfig(mean=2.0),
+        user_sampling_window=10.0,
+    )
+    sim = SimulationSettings(total_simulation_time=0.8)  # past both event windows
+
+    client = Client(id="client-1")
+    lb = LoadBalancer(id="lb-1")  # default settings (presumably round-robin)
+    srv1 = _server("srv-1")
+    srv2 = _server("srv-2")
+
+    edges = [  # rqs-1 -> client-1 -> lb-1 -> {srv-1, srv-2} -> client-1
+        _edge("gen-to-client", "rqs-1", "client-1"),
+        _edge("client-to-lb", "client-1", "lb-1"),
+        _edge("lb-to-srv1", "lb-1", "srv-1"),
+        _edge("lb-to-srv2", "lb-1", "srv-2"),
+        _edge("srv1-to-client", "srv-1", "client-1"),
+        _edge("srv2-to-client", "srv-2", "client-1"),
+    ]
+    nodes = TopologyNodes(servers=[srv1, srv2], client=client, load_balancer=lb)
+    topo = TopologyGraph(nodes=nodes, edges=edges)
+
+    events = [  # spike in [0.20, 0.35], then srv-1 outage in [0.40, 0.55]
+        EventInjection(
+            event_id="spike",
+            target_id="client-to-lb",
+            start={
+                "kind": EventDescription.NETWORK_SPIKE_START,
+                "t_start": 0.20,
+                "spike_s": 0.02,
+            },
+            end={"kind": EventDescription.NETWORK_SPIKE_END, "t_end": 0.35},
+        ),
+        EventInjection(
+            event_id="outage-srv1",
+            target_id="srv-1",
+            start={"kind": EventDescription.SERVER_DOWN, "t_start": 0.40},
+            end={"kind": EventDescription.SERVER_UP, "t_end": 0.55},
+        ),
+    ]
+
+    payload = SimulationPayload(rqs_input=rqs, topology_graph=topo, sim_settings=sim)
+    payload.events = events  # NOTE(review): set post-init; validators may not run
+
+    runner = SimulationRunner(env=env, simulation_input=payload)
+    results: ResultsAnalyzer = runner.run()
+
+    stats = results.get_latency_stats()
+    assert stats
+    assert stats[LatencyKey.TOTAL_REQUESTS] > 0
+    ts, rps = results.get_throughput_series()
+    assert len(ts) == len(rps) > 0  # equal lengths and non-empty
@@ -0,0 +1,108 @@
+"""Integration test: single server with edge spike and server outage.
+
+Topology:
+
+  rqs-1 → client-1 → lb-1 → srv-1
+                      srv-1 → client-1
+
+Events:
+- NETWORK_SPIKE on 'client-to-lb' during a small window.
+- SERVER_DOWN/UP on 'srv-1' during a small window.
+
+Assertions focus on end-to-end KPIs; the fine-grained event sequencing is
+covered by unit tests in the event injection suite.
+"""
+
+from __future__ import annotations
+
+from typing import TYPE_CHECKING
+
+import simpy
+
+from asyncflow.config.constants import Distribution, EventDescription, LatencyKey
+from asyncflow.runtime.simulation_runner import SimulationRunner
+from asyncflow.schemas.common.random_variables import RVConfig
+from asyncflow.schemas.events.injection import EventInjection
+from asyncflow.schemas.payload import SimulationPayload
+from asyncflow.schemas.settings.simulation import SimulationSettings
+from asyncflow.schemas.topology.edges import Edge
+from asyncflow.schemas.topology.graph import TopologyGraph
+from asyncflow.schemas.topology.nodes import (
+    Client,
+    LoadBalancer,
+    Server,
+    ServerResources,
+    TopologyNodes,
+)
+from asyncflow.schemas.workload.rqs_generator import RqsGenerator
+
+if TYPE_CHECKING:
+    from asyncflow.metrics.analyzer import ResultsAnalyzer
+
+
+def _server(sid: str) -> Server:  # server with default resources, no endpoints
+    return Server(id=sid, server_resources=ServerResources(), endpoints=[])
+
+
+def _edge(eid: str, src: str, tgt: str, mean: float = 0.002) -> Edge:
+    return Edge(  # edge from src to tgt with Poisson-distributed latency
+        id=eid,
+        source=src,
+        target=tgt,
+        latency=RVConfig(mean=mean, distribution=Distribution.POISSON),
+    )
+
+
+def test_single_server_with_spike_and_outage_end_to_end() -> None:
+    """Run one server with an edge spike and a server outage; check KPIs exist."""
+    env = simpy.Environment()
+    rqs = RqsGenerator(
+        id="rqs-1",
+        avg_active_users=RVConfig(mean=1.0),
+        avg_request_per_minute_per_user=RVConfig(mean=2.0),
+        user_sampling_window=10.0,
+    )
+    sim = SimulationSettings(total_simulation_time=1.0)  # past both event windows
+
+    client = Client(id="client-1")
+    lb = LoadBalancer(id="lb-1")  # single downstream server: srv-1
+    srv = _server("srv-1")
+
+    edges = [  # rqs-1 -> client-1 -> lb-1 -> srv-1 -> client-1
+        _edge("gen-to-client", "rqs-1", "client-1"),
+        _edge("client-to-lb", "client-1", "lb-1"),
+        _edge("lb-to-srv1", "lb-1", "srv-1"),
+        _edge("srv1-to-client", "srv-1", "client-1"),
+    ]
+    nodes = TopologyNodes(servers=[srv], client=client, load_balancer=lb)
+    topo = TopologyGraph(nodes=nodes, edges=edges)
+
+    # Events in a short (but disjoint) schedule to avoid cross-process ties
+    events = [
+        EventInjection(
+            event_id="spike",
+            target_id="client-to-lb",
+            start={
+                "kind": EventDescription.NETWORK_SPIKE_START,
+                "t_start": 0.2,
+                "spike_s": 0.01,
+            },
+            end={"kind": EventDescription.NETWORK_SPIKE_END, "t_end": 0.4},
+        ),
+        EventInjection(
+            event_id="outage",  # takes down the only server in this topology
+            target_id="srv-1",
+            start={"kind": EventDescription.SERVER_DOWN, "t_start": 0.5},
+            end={"kind": EventDescription.SERVER_UP, "t_end": 0.7},
+        ),
+    ]
+
+    payload = SimulationPayload(rqs_input=rqs, topology_graph=topo, sim_settings=sim)
+    payload.events = events  # NOTE(review): set post-init; validators may not run
+
+    runner = SimulationRunner(env=env, simulation_input=payload)
+    results: ResultsAnalyzer = runner.run()
+
+    stats = results.get_latency_stats()
+    assert stats  # latency stats must be non-empty
+    assert stats[LatencyKey.TOTAL_REQUESTS] > 0