AsyncFlow/src/app/runtime/actors/server.py at 1e86d96c5806c125b483c8d04823ffa40f298bcb · AsyncFlow-Sim/AsyncFlow · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
"""
Definition of the runtime class that manages a server
during the simulation.
"""

from collections.abc import Generator
from typing import cast

import numpy as np
import simpy

from app.config.constants import (
    EndpointStepCPU,
    EndpointStepIO,
    EndpointStepRAM,
    SampledMetricName,
    ServerResourceName,
    StepOperation,
    SystemNodes,
)
from app.metrics.server import build_server_metrics
from app.resources.server_containers import ServerContainers
from app.runtime.actors.edge import EdgeRuntime
from app.runtime.rqs_state import RequestState
from app.schemas.simulation_settings_input import SimulationSettings
from app.schemas.system_topology.full_system_topology import Server


class ServerRuntime:
    """
    Runtime representation of a server during the simulation.

    A dispatcher process pulls request states from ``server_box`` and spawns
    one ``_handle_request`` process per request. Each handler reserves the
    RAM needed by a randomly selected endpoint, executes its CPU and I/O
    steps, releases the resources and forwards the state through ``out_edge``.
    """

    def __init__( # noqa: PLR0913
        self,
        *,
        env: simpy.Environment,
        server_resources: ServerContainers,
        server_config: Server,
        out_edge: EdgeRuntime | None,
        server_box: simpy.Store,
        settings: SimulationSettings,
        rng: np.random.Generator | None = None,
        ) -> None:
        """
        Definition of the instance attributes.

        Args:
            env (simpy.Environment): simpy environment.
            server_resources (ServerContainers): resources defined in the
                input for each server (indexed by ``ServerResourceName``).
            server_config (Server): parameters defining the server, taken
                from the input.
            out_edge (EdgeRuntime | None): edge connecting the server to the
                next node. It must not be ``None`` by the time a request
                finishes its processing.
            server_box (simpy.Store): box with the states that the server
                should elaborate.
            settings (SimulationSettings): general input settings for the
                simulation.
            rng (np.random.Generator | None, optional): random number
                generator; a fresh ``np.random.default_rng()`` is created
                when omitted.

        """
        self.env = env
        self.server_resources = server_resources
        self.server_config = server_config
        self.out_edge = out_edge
        self.server_box = server_box
        # Explicit None check: never rely on the truthiness of a generator
        self.rng = rng if rng is not None else np.random.default_rng()
        # length of the active (ready) queue of the event loop
        self._el_ready_queue_len: int = 0
        # total ram used in the server
        self._ram_in_use: int | float = 0
        # length of the queue of the I/O tasks of the event loop
        self._el_io_queue_len: int = 0

        # Right now this is not strictly necessary, but once non-mandatory
        # metrics are introduced this structure will be needed to check
        # whether a given metric has to be measured. At the moment we are
        # dealing only with mandatory metrics.
        self._server_enabled_metrics = build_server_metrics(
            settings.enabled_sample_metrics,
        )

    # right now we disable the warnings but a refactor will be done soon
    def _handle_request( # noqa: PLR0915, PLR0912, C901
        self,
        state: RequestState,
        ) -> Generator[simpy.Event, None, None]:
        """
        Define all the steps each request has to go through once it
        reaches the server.

        The handler records the hop in the request history, picks one
        endpoint uniformly at random, reserves the RAM required by the
        endpoint, executes its CPU and I/O steps while keeping the ready /
        I/O queue counters up to date, releases the resources and finally
        hands the state over to ``out_edge``.

        Args:
            state (RequestState): state of the request to elaborate.

        Yields:
            simpy.Event: resource get/put events and timeouts.

        Raises:
            AssertionError: if ``out_edge`` is ``None`` when the request
                has to be forwarded.

        """
        # register the history for the state
        state.record_hop(
            SystemNodes.SERVER,
            self.server_config.id,
            self.env.now,
        )

        # Select the endpoint the request is directed to. At the moment we
        # use a uniform distribution; in the future the user will be allowed
        # to define a custom distribution.
        endpoints_list = self.server_config.endpoints
        selected_endpoint_idx = self.rng.integers(low=0, high=len(endpoints_list))
        selected_endpoint = endpoints_list[selected_endpoint_idx]

        # Extract the total ram needed to execute the endpoint
        total_ram = sum(
            step.step_operation[StepOperation.NECESSARY_RAM]
            for step in selected_endpoint.steps
            if isinstance(step.kind, EndpointStepRAM)
        )

        cpu_container = self.server_resources[ServerResourceName.CPU.value]
        ram_container = self.server_resources[ServerResourceName.RAM.value]

        # ------------------------------------------------------------------
        # CPU & RAM SCHEDULING
        #
        #  RAM FIRST, CPU LATER
        #   - The request reserves its full working set (total_ram) before
        #     acquiring any CPU core. If memory isn't available, it stays
        #     queued and leaves cores free for other requests.
        #
        #  LAZY-CPU LOCK
        #   - A core token is acquired only at the FIRST CPU step
        #     (`if not core_locked`) and held for all consecutive CPU steps.
        #   - As soon as an I/O step is encountered, the core is released
        #     (`put(1)` on the CPU resource) and remains free until the next
        #     CPU step, which will re-acquire it.
        #
        #  WHY THIS IS REALISTIC
        #    Prevents "core-hogging" during long I/O awaits.
        #    Avoids redundant get/put calls for consecutive CPU steps
        #      (one token for the entire sequence).
        #    Mirrors a real Python async server: the GIL/worker thread is
        #      held only during CPU-bound code and released on each await.
        #
        #  END OF HANDLER
        #   - If we still hold the core at the end (`core_locked == True`),
        #     we put it back, then release the reserved RAM.
        # ------------------------------------------------------------------

        # Ask the server for the necessary ram
        if total_ram:
            yield ram_container.get(total_ram)
            self._ram_in_use += total_ram

        # Initial conditions: a priori a request is not in any queue and it
        # does not occupy a core until it starts to be elaborated
        core_locked = False
        is_in_io_queue = False
        is_in_ready_queue = False

        # --- Step Execution: Process CPU and IO operations ---
        #  EDGE CASES
        #  First-step I/O
        #     A request could (in theory) start with an I/O step. In that case
        #     it doesn't hold any core; we enter the
        #     `not core_locked and not is_in_io_queue` branch and add +1
        #     to the I/O queue without touching the ready queue.
        #
        #  Consecutive I/O steps
        #     The second I/O sees `is_in_io_queue == True`, so it does NOT
        #     increment again: no double counting.
        #
        #  Transition CPU -> I/O -> CPU
        #     - CPU step: `core_locked` becomes True, +1 ready queue
        #     - I/O step: core is put back, -1 ready queue, +1 I/O queue
        #     - Next CPU step: core is acquired, -1 I/O queue, +1 ready queue
        #
        #  Endpoint completion
        #     If `core_locked == True` we were in the ready queue (-1).
        #     Else if `is_in_io_queue == True` we were in the I/O queue (-1).
        #     Otherwise the request never entered a queue (no CPU / I/O
        #     steps) and the counters must stay untouched.
        # ------------------------------------------------------------------

        for step in selected_endpoint.steps:

            if isinstance(step.kind, EndpointStepCPU):
                # With the boolean we avoid asking for the core multiple
                # times: with two consecutive cpu bound steps the core is
                # requested only on the first one.
                if not core_locked:
                    core_locked = True

                    if is_in_io_queue:
                        is_in_io_queue = False
                        self._el_io_queue_len -= 1

                    if not is_in_ready_queue:
                        is_in_ready_queue = True
                        self._el_ready_queue_len += 1

                    # The counters are updated BEFORE waiting for the core,
                    # so the ready queue also counts requests still waiting
                    # for a core token.
                    yield cpu_container.get(1)

                cpu_time = step.step_operation[StepOperation.CPU_TIME]
                # Execute the step giving back the control to the simpy env
                yield self.env.timeout(cpu_time)

            elif isinstance(step.kind, EndpointStepIO):
                io_time = step.step_operation[StepOperation.IO_WAITING_TIME]
                # Same idea with the booleans: with multiple I/O steps the
                # core is released only the first time, and only if the
                # previous step was a cpu bound step.

                if not core_locked and not is_in_io_queue:
                    is_in_io_queue = True
                    self._el_io_queue_len += 1

                if core_locked:
                    # A locked core means the previous step was cpu bound,
                    # so the request is in the ready queue and has to be
                    # moved to the I/O queue.
                    if is_in_ready_queue:
                        is_in_ready_queue = False
                        self._el_ready_queue_len -= 1

                    if not is_in_io_queue:
                        is_in_io_queue = True
                        self._el_io_queue_len += 1

                    yield cpu_container.put(1)
                    core_locked = False

                yield self.env.timeout(io_time)  # Wait without holding a CPU core

        if core_locked:
            # The last step was cpu bound: leave the ready queue and give
            # the core back.
            self._el_ready_queue_len -= 1
            yield cpu_container.put(1)
        elif is_in_io_queue:
            # The last step was I/O bound: leave the I/O queue. The guard
            # prevents a negative counter for endpoints without any CPU or
            # I/O step, where the request never entered the I/O queue.
            self._el_io_queue_len -= 1

        if total_ram:
            self._ram_in_use -= total_ram
            yield ram_container.put(total_ram)

        assert self.out_edge is not None
        self.out_edge.transport(state)

    # The accessors below are needed because the sampled metric collector
    # has to read these private attributes.
    @property
    def ready_queue_len(self) -> int:
        """Current length of the event-loop ready queue for this server."""
        return self._el_ready_queue_len

    @property
    def io_queue_len(self) -> int:
        """Current length of the event-loop I/O queue for this server."""
        return self._el_io_queue_len

    @property
    def ram_in_use(self) -> int | float:
        """Total RAM (MB) currently reserved by active requests."""
        return self._ram_in_use

    @property
    def enabled_metrics(self) -> dict[SampledMetricName, list[float | int]]:
        """Metric store built at construction time from the enabled metrics."""
        return self._server_enabled_metrics

    def _dispatcher(self) -> Generator[simpy.Event, None, None]:
        """
        The main dispatcher loop. It pulls requests from the inbox and
        spawns a new '_handle_request' process for each one, so requests
        are handled concurrently and the loop never waits for a handler
        to finish.
        """
        while True:
            # Wait for a request to arrive in the server's inbox
            raw_state = yield self.server_box.get()
            request_state = cast("RequestState", raw_state)
            # Spawn a new, independent process to handle this request
            self.env.process(self._handle_request(request_state))

    def start(self) -> simpy.Process:
        """Generate the process to simulate the server inside simpy env"""
        return self.env.process(self._dispatcher())