From d2a26ec7f901ea26066c04b01e069569accbfe9e Mon Sep 17 00:00:00 2001
From: yungYEEZY <259074499+yungYEEZY@users.noreply.github.com>
Date: Sun, 5 Apr 2026 11:25:22 +0200
Subject: [PATCH] Allow loading without GPU backend.

---
 src/optimization/memory_manager.py | 13 +++++++------
 1 file changed, 7 insertions(+), 6 deletions(-)

diff --git a/src/optimization/memory_manager.py b/src/optimization/memory_manager.py
index 780c6909..e80bba35 100644
--- a/src/optimization/memory_manager.py
+++ b/src/optimization/memory_manager.py
@@ -81,17 +81,18 @@ def get_device_list(include_none: bool = False, include_cpu: bool = False) -> Li
     if include_none:
         result.append("none")
 
-    # Only include "cpu" option if:
-    # 1. It was requested (include_cpu=True), AND
-    # 2. Either CUDA is available OR MPS is not the only option
+    # Add CPU to the list if:
+    # 1. It was explicitly requested (include_cpu=True), OR
+    # 2. No GPU backend is available (CUDA/MPS both unavailable)
     # Rationale: On MPS-only systems with unified memory architecture,
-    # CPU offloading is semantically meaningless as CPU and GPU share the same memory pool
-    if include_cpu and (has_cuda or not has_mps):
+    # CPU offloading is semantically meaningless as CPU and GPU share the same memory pool,
+    # but we still need CPU as an inference device when no GPU is available
+    if include_cpu or (not has_cuda and not has_mps):
         result.append("cpu")
 
     result.extend(devs)
 
-    return result if result else []
+    return result
 
 
 def get_basic_vram_info(device: Optional[torch.device] = None) -> Dict[str, Any]:
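
A minimal standalone sketch of the patched selection logic, for illustration only. The boolean
flags, device names, and helper name below are hypothetical stand-ins for whatever backend
probes and device enumeration the real memory_manager.py performs; only the CPU condition
mirrors the patch.

    from typing import List

    def device_list_sketch(
        has_cuda: bool,
        has_mps: bool,
        include_none: bool = False,
        include_cpu: bool = False,
    ) -> List[str]:
        # Hypothetical stand-ins for the enumerated GPU devices.
        devs = []
        if has_cuda:
            devs.append("cuda")
        if has_mps:
            devs.append("mps")

        result: List[str] = []
        if include_none:
            result.append("none")

        # Patched condition: CPU is listed when explicitly requested, or as a
        # fallback inference device when neither CUDA nor MPS is available.
        if include_cpu or (not has_cuda and not has_mps):
            result.append("cpu")

        result.extend(devs)
        return result

    # Behavior under the patched condition:
    assert device_list_sketch(has_cuda=False, has_mps=False) == ["cpu"]   # CPU-only fallback now possible
    assert device_list_sketch(has_cuda=True, has_mps=False) == ["cuda"]   # unchanged when a GPU backend exists
    assert device_list_sketch(has_cuda=False, has_mps=True, include_cpu=True) == ["cpu", "mps"]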