Skip to content

Commit 305a362

Browse files
[Feature]: Allow listing available key resources such as gpu, region, and backends #2142
Merged `dstack gpu` into `dstack offer`
1 parent fdf6da6 commit 305a362

4 files changed

Lines changed: 314 additions & 63 deletions

File tree

Lines changed: 68 additions & 60 deletions
Original file line numberDiff line numberDiff line change
@@ -1,29 +1,20 @@
11
import argparse
2-
import contextlib
3-
import json
42
from pathlib import Path
3+
from typing import List
54

65
from dstack._internal.cli.commands import APIBaseCommand
7-
from dstack._internal.cli.services.configurators.run import (
8-
BaseRunConfigurator,
9-
)
6+
from dstack._internal.cli.services.configurators.run import BaseRunConfigurator
107
from dstack._internal.cli.utils.common import console
11-
from dstack._internal.cli.utils.run import print_run_plan
12-
from dstack._internal.core.models.configurations import (
13-
ApplyConfigurationType,
14-
TaskConfiguration,
15-
)
8+
from dstack._internal.cli.utils.gpu import print_gpu_json, print_gpu_table
9+
from dstack._internal.cli.utils.run import print_offers_json, print_run_plan
10+
from dstack._internal.core.errors import CLIError
11+
from dstack._internal.core.models.configurations import ApplyConfigurationType, TaskConfiguration
1612
from dstack._internal.core.models.runs import RunSpec
13+
from dstack._internal.server.schemas.gpus import GpuGroup
1714
from dstack.api.utils import load_profile
1815

1916

2017
class OfferConfigurator(BaseRunConfigurator):
21-
# TODO: The command currently uses `BaseRunConfigurator` to register arguments.
22-
# This includes --env, --retry-policy, and other arguments that are unnecessary for this command.
23-
# Eventually, we should introduce a base `OfferConfigurator` that doesn't include those arguments—
24-
# `BaseRunConfigurator` will inherit from `OfferConfigurator`.
25-
#
26-
# Additionally, it should have its own type: `ApplyConfigurationType.OFFER`.
2718
TYPE = ApplyConfigurationType.TASK
2819

2920
@classmethod
@@ -32,10 +23,18 @@ def register_args(
3223
parser: argparse.ArgumentParser,
3324
):
3425
super().register_args(parser, default_max_offers=50)
26+
parser.add_argument(
27+
"--group-by",
28+
action="append",
29+
help=(
30+
"Group results by fields ([code]gpu[/code], [code]backend[/code], [code]region[/code], [code]count[/code]). "
31+
"Optional, but if used, must include [code]gpu[/code]. "
32+
"The use of [code]region[/code] also requires [code]backend[/code]. "
33+
"Can be repeated or comma-separated (e.g. [code]--group-by gpu,backend[/code])."
34+
),
35+
)
3536

3637

37-
# TODO: Support aggregated offers
38-
# TODO: Add tests
3938
class OfferCommand(APIBaseCommand):
4039
NAME = "offer"
4140
DESCRIPTION = "List offers"
@@ -70,49 +69,58 @@ def _command(self, args: argparse.Namespace):
7069
ssh_key_pub="(dummy)",
7170
profile=profile,
7271
)
72+
73+
if args.group_by:
74+
args.group_by = self._process_group_by_args(args.group_by)
75+
76+
if args.group_by and "gpu" not in args.group_by:
77+
group_values = ", ".join(args.group_by)
78+
raise CLIError(f"Cannot group by '{group_values}' without also grouping by 'gpu'")
79+
7380
if args.format == "plain":
74-
status = console.status("Getting offers...")
81+
with console.status("Getting offers..."):
82+
if args.group_by:
83+
gpus = self._list_gpus(args, run_spec)
84+
print_gpu_table(gpus, run_spec, args.group_by, self.api.project)
85+
else:
86+
run_plan = self.api.client.runs.get_plan(
87+
self.api.project,
88+
run_spec,
89+
max_offers=args.max_offers,
90+
)
91+
print_run_plan(run_plan, include_run_properties=False)
7592
else:
76-
status = contextlib.nullcontext()
77-
with status:
78-
run_plan = self.api.client.runs.get_plan(
79-
self.api.project,
80-
run_spec,
81-
max_offers=args.max_offers,
82-
)
83-
84-
job_plan = run_plan.job_plans[0]
85-
86-
if args.format == "json":
87-
# FIXME: Should use effective_run_spec from run_plan,
88-
# since the spec can be changed by the server and plugins
89-
output = {
90-
"project": run_plan.project_name,
91-
"user": run_plan.user,
92-
"resources": job_plan.job_spec.requirements.resources.dict(),
93-
"max_price": (job_plan.job_spec.requirements.max_price),
94-
"spot": run_spec.configuration.spot_policy,
95-
"reservation": run_plan.run_spec.configuration.reservation,
96-
"offers": [],
97-
"total_offers": job_plan.total_offers,
98-
}
99-
100-
for offer in job_plan.offers:
101-
output["offers"].append(
102-
{
103-
"backend": (
104-
"ssh" if offer.backend.value == "remote" else offer.backend.value
105-
),
106-
"region": offer.region,
107-
"instance_type": offer.instance.name,
108-
"resources": offer.instance.resources.dict(),
109-
"spot": offer.instance.resources.spot,
110-
"price": float(offer.price),
111-
"availability": offer.availability.value,
112-
}
93+
if args.group_by:
94+
gpus = self._list_gpus(args, run_spec)
95+
print_gpu_json(gpus, run_spec, args.group_by, self.api.project)
96+
else:
97+
run_plan = self.api.client.runs.get_plan(
98+
self.api.project,
99+
run_spec,
100+
max_offers=args.max_offers,
113101
)
102+
print_offers_json(run_plan, run_spec)
114103

115-
print(json.dumps(output, indent=2))
116-
return
117-
else:
118-
print_run_plan(run_plan, include_run_properties=False)
104+
def _process_group_by_args(self, group_by_args: List[str]) -> List[str]:
105+
valid_choices = {"gpu", "backend", "region", "count"}
106+
processed = []
107+
108+
for arg in group_by_args:
109+
values = [v.strip() for v in arg.split(",") if v.strip()]
110+
for value in values:
111+
if value in valid_choices:
112+
processed.append(value)
113+
else:
114+
raise CLIError(
115+
f"Invalid group-by value: '{value}'. Valid choices are: {', '.join(sorted(valid_choices))}"
116+
)
117+
118+
return processed
119+
120+
def _list_gpus(self, args: List[str], run_spec: RunSpec) -> List[GpuGroup]:
121+
group_by = [g for g in args.group_by if g != "gpu"] or None
122+
return self.api.client.gpus.list_gpus(
123+
self.api.project,
124+
run_spec,
125+
group_by=group_by,
126+
)
Lines changed: 210 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,210 @@
1+
import shutil
2+
from typing import List
3+
4+
from rich.table import Table
5+
6+
from dstack._internal.cli.utils.common import console
7+
from dstack._internal.core.models.profiles import SpotPolicy
8+
from dstack._internal.core.models.runs import Requirements, RunSpec, get_policy_map
9+
from dstack._internal.server.schemas.gpus import GpuGroup
10+
11+
12+
def print_gpu_json(gpu_response, run_spec, group_by_cli, api_project):
13+
"""Print GPU information in JSON format."""
14+
req = Requirements(
15+
resources=run_spec.configuration.resources,
16+
max_price=run_spec.merged_profile.max_price,
17+
spot=get_policy_map(run_spec.merged_profile.spot_policy, default=SpotPolicy.AUTO),
18+
reservation=run_spec.configuration.reservation,
19+
)
20+
21+
if req.spot is None:
22+
spot_policy = "auto"
23+
elif req.spot:
24+
spot_policy = "spot"
25+
else:
26+
spot_policy = "on-demand"
27+
28+
output = {
29+
"project": api_project,
30+
"user": "admin", # TODO: Get actual user name
31+
"resources": req.resources.dict(),
32+
"spot_policy": spot_policy,
33+
"max_price": req.max_price,
34+
"reservation": run_spec.configuration.reservation,
35+
"group_by": group_by_cli,
36+
"gpus": [],
37+
}
38+
39+
for gpu_group in gpu_response.gpus:
40+
gpu_data = {
41+
"name": gpu_group.name,
42+
"memory_mib": gpu_group.memory_mib,
43+
"vendor": gpu_group.vendor.value,
44+
"availability": [av.value for av in gpu_group.availability],
45+
"spot": gpu_group.spot,
46+
"count": {"min": gpu_group.count.min, "max": gpu_group.count.max},
47+
"price": {"min": gpu_group.price.min, "max": gpu_group.price.max},
48+
}
49+
50+
if gpu_group.backend:
51+
gpu_data["backend"] = gpu_group.backend.value
52+
if gpu_group.backends:
53+
gpu_data["backends"] = [b.value for b in gpu_group.backends]
54+
if gpu_group.region:
55+
gpu_data["region"] = gpu_group.region
56+
if gpu_group.regions:
57+
gpu_data["regions"] = gpu_group.regions
58+
59+
output["gpus"].append(gpu_data)
60+
61+
import json
62+
63+
print(json.dumps(output, indent=2))
64+
65+
66+
def print_gpu_table(gpus: List[GpuGroup], run_spec: RunSpec, group_by: List[str], project: str):
67+
"""Print GPU information in a formatted table."""
68+
print_filter_info(run_spec, group_by, project)
69+
70+
has_single_backend = any(gpu_group.backend for gpu_group in gpus)
71+
has_single_region = any(gpu_group.region for gpu_group in gpus)
72+
has_multiple_regions = any(gpu_group.regions for gpu_group in gpus)
73+
74+
if has_single_backend and has_single_region:
75+
backend_column = "BACKEND"
76+
region_column = "REGION"
77+
elif has_single_backend and has_multiple_regions:
78+
backend_column = "BACKEND"
79+
region_column = "REGIONS"
80+
else:
81+
backend_column = "BACKENDS"
82+
region_column = None
83+
84+
table = Table(box=None, expand=shutil.get_terminal_size(fallback=(120, 40)).columns <= 110)
85+
table.add_column("#")
86+
table.add_column("GPU", no_wrap=True, ratio=2)
87+
table.add_column("SPOT", style="grey58", ratio=1)
88+
table.add_column("$/GPU", style="grey58", ratio=1)
89+
table.add_column(backend_column, style="grey58", ratio=2)
90+
if region_column:
91+
table.add_column(region_column, style="grey58", ratio=2)
92+
table.add_column()
93+
94+
for i, gpu_group in enumerate(gpus, start=1):
95+
backend_text = ""
96+
if gpu_group.backend:
97+
backend_text = gpu_group.backend.value
98+
elif gpu_group.backends:
99+
backend_text = ", ".join(b.value for b in gpu_group.backends)
100+
101+
region_text = ""
102+
if gpu_group.region:
103+
region_text = gpu_group.region
104+
elif gpu_group.regions:
105+
if len(gpu_group.regions) <= 3:
106+
region_text = ", ".join(gpu_group.regions)
107+
else:
108+
region_text = f"{len(gpu_group.regions)} regions"
109+
110+
if not region_column:
111+
if gpu_group.regions and len(gpu_group.regions) > 3:
112+
shortened_region_text = f"{len(gpu_group.regions)} regions"
113+
backends_display = (
114+
f"{backend_text} ({shortened_region_text})"
115+
if shortened_region_text
116+
else backend_text
117+
)
118+
else:
119+
backends_display = (
120+
f"{backend_text} ({region_text})" if region_text else backend_text
121+
)
122+
else:
123+
backends_display = backend_text
124+
125+
memory_gb = f"{gpu_group.memory_mib // 1024}GB"
126+
if gpu_group.count.min == gpu_group.count.max:
127+
count_range = str(gpu_group.count.min)
128+
else:
129+
count_range = f"{gpu_group.count.min}..{gpu_group.count.max}"
130+
131+
gpu_spec = f"{gpu_group.name}:{memory_gb}:{count_range}"
132+
133+
spot_types = []
134+
if "spot" in gpu_group.spot:
135+
spot_types.append("spot")
136+
if "on-demand" in gpu_group.spot:
137+
spot_types.append("on-demand")
138+
spot_display = ", ".join(spot_types)
139+
140+
if gpu_group.price.min == gpu_group.price.max:
141+
price_display = f"{gpu_group.price.min:.4f}".rstrip("0").rstrip(".")
142+
else:
143+
min_formatted = f"{gpu_group.price.min:.4f}".rstrip("0").rstrip(".")
144+
max_formatted = f"{gpu_group.price.max:.4f}".rstrip("0").rstrip(".")
145+
price_display = f"{min_formatted}..{max_formatted}"
146+
147+
availability = ""
148+
has_available = any(av.is_available() for av in gpu_group.availability)
149+
has_unavailable = any(not av.is_available() for av in gpu_group.availability)
150+
151+
if has_unavailable and not has_available:
152+
for av in gpu_group.availability:
153+
if av.value in {"not_available", "no_quota", "idle", "busy"}:
154+
availability = av.value.replace("_", " ").lower()
155+
break
156+
157+
secondary_style = "grey58"
158+
row_data = [
159+
f"[{secondary_style}]{i}[/]",
160+
gpu_spec,
161+
f"[{secondary_style}]{spot_display}[/]",
162+
f"[{secondary_style}]{price_display}[/]",
163+
f"[{secondary_style}]{backends_display}[/]",
164+
]
165+
if region_column:
166+
row_data.append(f"[{secondary_style}]{region_text}[/]")
167+
row_data.append(f"[{secondary_style}]{availability}[/]")
168+
169+
table.add_row(*row_data)
170+
171+
console.print(table)
172+
173+
174+
def print_filter_info(run_spec: RunSpec, group_by: List[str], project: str):
175+
"""Print filter information for GPU display."""
176+
props = Table(box=None, show_header=False)
177+
props.add_column(no_wrap=True)
178+
props.add_column()
179+
180+
req = Requirements(
181+
resources=run_spec.configuration.resources,
182+
max_price=run_spec.merged_profile.max_price,
183+
spot=get_policy_map(run_spec.merged_profile.spot_policy, default=SpotPolicy.AUTO),
184+
reservation=run_spec.merged_profile.reservation,
185+
)
186+
187+
pretty_req = req.pretty_format(resources_only=True)
188+
max_price = f"${req.max_price:.3f}".rstrip("0").rstrip(".") if req.max_price else "-"
189+
190+
if req.spot is None:
191+
spot_policy = "auto"
192+
elif req.spot:
193+
spot_policy = "spot"
194+
else:
195+
spot_policy = "on-demand"
196+
197+
def th(s: str) -> str:
198+
return f"[bold]{s}[/bold]"
199+
200+
props.add_row(th("Project"), project)
201+
props.add_row(th("User"), "admin") # TODO: Get actual user name
202+
props.add_row(th("Resources"), pretty_req)
203+
props.add_row(th("Spot policy"), spot_policy)
204+
props.add_row(th("Max price"), max_price)
205+
props.add_row(th("Reservation"), run_spec.configuration.reservation or "-")
206+
if group_by:
207+
props.add_row(th("Group by"), ", ".join(group_by))
208+
209+
console.print(props)
210+
console.print()

0 commit comments

Comments
 (0)