Add/update workflows

Dieg0Code · Dieg0Code · commit c910095ab0ae · 2026-03-01T21:23:40.000-03:00
diff --git a/.github/workflows/build-app-image.yml b/.github/workflows/build-app-image.yml
@@ -75,6 +75,7 @@ jobs:
         with:
           context: .
           file: Dockerfile
+          target: runtime
           push: ${{ github.event_name != 'pull_request' }}
           tags: ${{ steps.meta.outputs.tags }}
           labels: ${{ steps.meta.outputs.labels }}
diff --git a/.github/workflows/ci-api.yml b/.github/workflows/ci-api.yml
@@ -56,7 +56,7 @@ jobs:
       - name: Setup Python
         uses: actions/setup-python@v5
         with:
-          python-version: "3.10"
+          python-version: "3.11"
 
       - name: Setup uv
         uses: astral-sh/setup-uv@v4
diff --git a/.github/workflows/ci-train.yml b/.github/workflows/ci-train.yml
@@ -54,7 +54,7 @@ jobs:
       - name: Setup Python
         uses: actions/setup-python@v5
         with:
-          python-version: "3.10"
+          python-version: "3.11"
 
       - name: Setup uv
         uses: astral-sh/setup-uv@v4
@@ -70,7 +70,20 @@ jobs:
           ln -sf ../bin/python .venv/Scripts/python.exe
 
       - name: Python file length policy
-        run: uv run python scripts/check_python_max_lines.py --max-lines 500 --path train.py --path src --path tests --path scripts
+        run: |
+          uv run python scripts/check_python_max_lines.py \
+            --max-lines 500 \
+            --path train.py \
+            --path src/training \
+            --path src/engine \
+            --path src/model \
+            --path src/game \
+            --path src/data \
+            --path tests/test_mcts_numerics.py \
+            --path tests/test_training_step_numerics.py \
+            --path tests/test_training_*.py \
+            --path scripts/export_model_onnx.py \
+            --path scripts/check_onnx_parity.py
 
       - name: Ruff (train scope)
         run: uv run ruff check train.py src/engine src/model src/game src/data tests scripts
diff --git a/Dockerfile.train b/Dockerfile.train
@@ -16,9 +16,9 @@ RUN apt-get update && \
 RUN pip install --no-cache-dir uv
 
 COPY pyproject.toml uv.lock README.md ./
+COPY src ./src
 RUN uv sync --frozen --no-dev --group train --group export
 
-COPY src ./src
 COPY train.py ./train.py
 COPY train_improved.py ./train_improved.py
 
diff --git a/src/training/eval_runtime.py b/src/training/eval_runtime.py
@@ -0,0 +1,98 @@
+from __future__ import annotations
+
+from typing import TYPE_CHECKING
+
+import numpy as np
+
+from game.actions import ACTION_SPACE
+from training.config_runtime import cfg_bool, cfg_int
+from training.selfplay_runtime import compute_action_probs, heuristic_move
+
+if TYPE_CHECKING:
+    from engine.mcts import MCTS
+    from model.system import AtaxxZero
+
+
+def _play_eval_episode(
+    mcts: MCTS,
+    rng: np.random.Generator,
+    heuristic_level: str,
+) -> int:
+    from game.board import AtaxxBoard
+
+    board = AtaxxBoard()
+    root = None
+    model_player = 1 if float(rng.random()) >= 0.5 else -1
+    while not board.is_game_over():
+        if board.current_player == model_player:
+            probs, root = compute_action_probs(
+                board=board,
+                mcts=mcts,
+                root=root,
+                add_noise=False,
+                temperature=0.0,
+            )
+            action_idx = int(np.argmax(probs))
+            board.step(ACTION_SPACE.decode(action_idx))
+            root = mcts.advance_root(root, action_idx)
+            continue
+        move = heuristic_move(board, rng, heuristic_level)
+        board.step(move)
+        root = mcts.advance_root(root, ACTION_SPACE.encode(move))
+    winner = board.get_result()
+    if winner == model_player:
+        return 1
+    if winner == 0:
+        return 0
+    return -1
+
+
+def evaluate_model(
+    system: AtaxxZero,
+    device: str,
+    games: int,
+    sims: int,
+    c_puct: float,
+    heuristic_level: str,
+    seed: int,
+) -> dict[str, float | int | str]:
+    from engine.mcts import MCTS
+
+    system.eval()
+    system.to(device)
+    mcts = MCTS(
+        model=system.model,
+        c_puct=c_puct,
+        n_simulations=sims,
+        device=device,
+        use_amp=cfg_bool("mcts_use_amp"),
+        cache_size=max(0, cfg_int("mcts_cache_size")),
+        leaf_batch_size=max(1, cfg_int("mcts_leaf_batch_size")),
+    )
+    rng = np.random.default_rng(seed=seed)
+    wins = 0
+    losses = 0
+    draws = 0
+    for _ in range(games):
+        outcome = _play_eval_episode(mcts, rng, heuristic_level)
+        if outcome > 0:
+            wins += 1
+        elif outcome < 0:
+            losses += 1
+        else:
+            draws += 1
+    score = (wins + 0.5 * draws) / max(1, games)
+    return {
+        "games": games,
+        "wins": wins,
+        "losses": losses,
+        "draws": draws,
+        "score": score,
+        "heuristic_level": heuristic_level,
+        "sims": sims,
+    }
+
+
+__all__ = [
+    "evaluate_model",
+]
diff --git a/src/training/selfplay_runtime.py b/src/training/selfplay_runtime.py
@@ -247,86 +247,6 @@ def history_to_examples(
     return examples
 
 
-def _play_eval_episode(
-    mcts: MCTS,
-    rng: np.random.Generator,
-    heuristic_level: str,
-) -> int:
-    from game.board import AtaxxBoard
-
-    board = AtaxxBoard()
-    root = None
-    model_player = 1 if float(rng.random()) >= 0.5 else -1
-    while not board.is_game_over():
-        if board.current_player == model_player:
-            probs, root = compute_action_probs(
-                board=board,
-                mcts=mcts,
-                root=root,
-                add_noise=False,
-                temperature=0.0,
-            )
-            action_idx = int(np.argmax(probs))
-            board.step(ACTION_SPACE.decode(action_idx))
-            root = mcts.advance_root(root, action_idx)
-            continue
-        move = heuristic_move(board, rng, heuristic_level)
-        board.step(move)
-        root = mcts.advance_root(root, ACTION_SPACE.encode(move))
-    winner = board.get_result()
-    if winner == model_player:
-        return 1
-    if winner == 0:
-        return 0
-    return -1
-
-
-def evaluate_model(
-    system: AtaxxZero,
-    device: str,
-    games: int,
-    sims: int,
-    c_puct: float,
-    heuristic_level: str,
-    seed: int,
-) -> dict[str, float | int | str]:
-    from engine.mcts import MCTS
-
-    system.eval()
-    system.to(device)
-    mcts = MCTS(
-        model=system.model,
-        c_puct=c_puct,
-        n_simulations=sims,
-        device=device,
-        use_amp=cfg_bool("mcts_use_amp"),
-        cache_size=max(0, cfg_int("mcts_cache_size")),
-        leaf_batch_size=max(1, cfg_int("mcts_leaf_batch_size")),
-    )
-    rng = np.random.default_rng(seed=seed)
-    wins = 0
-    losses = 0
-    draws = 0
-    for _ in range(games):
-        outcome = _play_eval_episode(mcts, rng, heuristic_level)
-        if outcome > 0:
-            wins += 1
-        elif outcome < 0:
-            losses += 1
-        else:
-            draws += 1
-    score = (wins + 0.5 * draws) / max(1, games)
-    return {
-        "games": games,
-        "wins": wins,
-        "losses": losses,
-        "draws": draws,
-        "score": score,
-        "heuristic_level": heuristic_level,
-        "sims": sims,
-    }
-
-
 def execute_self_play(
     system: AtaxxZero,
     buffer: ReplayBuffer,
@@ -501,6 +421,5 @@ def execute_self_play(
 
 
 __all__ = [
-    "evaluate_model",
     "execute_self_play",
 ]
diff --git a/train.py b/train.py
@@ -42,9 +42,10 @@
     parse_args,
     validate_config,
 )
+from training.eval_runtime import evaluate_model  # noqa: E402
 from training.monitor import TrainingMonitor  # noqa: E402
 from training.progress_callbacks import EpochPulseCallback  # noqa: E402
-from training.selfplay_runtime import evaluate_model, execute_self_play  # noqa: E402
+from training.selfplay_runtime import execute_self_play  # noqa: E402
 from training.trainer_runtime import (  # noqa: E402
     build_trainer,
     export_onnx,
diff --git a/web/src/pages/match/MatchPage.test.tsx b/web/src/pages/match/MatchPage.test.tsx
@@ -1,6 +1,7 @@
 import { fireEvent, render, screen, waitFor } from "@testing-library/react";
 import type { ReactNode } from "react";
 import { beforeEach, describe, expect, it, vi } from "vitest";
+import type { PersistedGameWsEvent } from "@/features/match/persistence";
 import type { BoardState } from "@/features/match/types";
 import { MatchPage } from "@/pages/match/MatchPage";
 
@@ -465,26 +466,26 @@ describe("MatchPage queued human vs human", () => {
       }),
     );
 
-    let wsEventHandler: ((event: import("@/features/match/persistence").PersistedGameWsEvent) => void) | null = null;
-    openPersistedGameSocketMock.mockImplementation(
-      (_token: string, _gameId: string, onEvent: (event: import("@/features/match/persistence").PersistedGameWsEvent) => void) => {
-        wsEventHandler = onEvent;
-        return {
-          close: vi.fn(),
-          onclose: null,
-          onmessage: null,
-        };
-      },
-    );
+    let wsEventHandler: ((event: PersistedGameWsEvent) => void) | null = null;
+    openPersistedGameSocketMock.mockImplementation((...args: unknown[]) => {
+      // Vitest mocks default to unknown/any signatures; cast the event callback explicitly.
+      wsEventHandler = args[2] as (event: PersistedGameWsEvent) => void;
+      return {
+        close: vi.fn(),
+        onclose: null,
+        onmessage: null,
+      };
+    });
 
     render(<MatchPage />);
 
     await waitFor(() => {
       expect(screen.getByText(/humano vs humano/i)).toBeInTheDocument();
     });
-    expect(wsEventHandler).not.toBeNull();
-
-    wsEventHandler?.({
+    if (wsEventHandler === null) {
+      throw new Error("Expected websocket handler to be initialized.");
+    }
+    (wsEventHandler as (event: PersistedGameWsEvent) => void)({
       type: "game.closed",
       game_id: "game-h2h",
       reason: "deleted_by_participant",
diff --git a/web/src/pages/match/MatchPage.tsx b/web/src/pages/match/MatchPage.tsx
@@ -1,6 +1,6 @@
 import { useCallback, useEffect, useMemo, useRef, useState, type MouseEvent } from "react";
 import { Link, useLocation, useNavigate } from "react-router-dom";
-import { AnimatePresence, motion } from "framer-motion";
+import { AnimatePresence, motion, type Variants } from "framer-motion";
 import {
   Activity,
   ArrowRight,
@@ -83,12 +83,12 @@ const SFX = {
   queueDeploy: "/sfx/queue_accept.ogg",
 } as const;
 
-const panelSectionVariants = {
+const panelSectionVariants: Variants = {
   hidden: { opacity: 0, y: 8 },
   show: (delay = 0) => ({
     opacity: 1,
     y: 0,
-    transition: { duration: 0.32, ease: "easeOut", delay },
+    transition: { duration: 0.32, ease: "easeOut" as const, delay },
   }),
 };
 
diff --git a/web/src/test/render.tsx b/web/src/test/render.tsx
@@ -1,11 +1,13 @@
 import { QueryClient, QueryClientProvider } from "@tanstack/react-query";
 import { render, type RenderOptions } from "@testing-library/react";
-import type { ReactElement } from "react";
-import { MemoryRouter, type InitialEntry } from "react-router-dom";
+import type { ComponentProps, ReactElement } from "react";
+import { MemoryRouter } from "react-router-dom";
+
+type MemoryRouterEntry = NonNullable<ComponentProps<typeof MemoryRouter>["initialEntries"]>[number];
 
 export function renderWithProviders(
   ui: ReactElement,
-  { route = "/", ...options }: { route?: InitialEntry } & Omit<RenderOptions, "wrapper"> = {},
+  { route = "/", ...options }: { route?: MemoryRouterEntry } & Omit<RenderOptions, "wrapper"> = {},
 ) {
   const queryClient = new QueryClient({
     defaultOptions: {
diff --git a/web/src/vite-env.d.ts b/web/src/vite-env.d.ts
@@ -0,0 +1 @@
+/// <reference types="vite/client" />
diff --git a/web/src/widgets/layout/AppShell.test.tsx b/web/src/widgets/layout/AppShell.test.tsx
@@ -7,7 +7,7 @@ const logoutMock = vi.fn();
 const openInvitationsSocketMock = vi.fn();
 const acceptInvitationMock = vi.fn();
 const rejectInvitationMock = vi.fn();
-let authState = {
+let authState: { isAuthenticated: boolean; user: { username: string } | null } = {
   isAuthenticated: true,
   user: { username: "test" },
 };