FasterAI-Labs
diff --git a/README.md b/README.md
Lines changed: 93 additions & 46 deletions
diff --git a/fasterbench/__init__.py b/fasterbench/__init__.py
Lines changed: 42 additions & 0 deletions
diff --git a/fasterbench/_modidx.py b/fasterbench/_modidx.py
Lines changed: 52 additions & 2 deletions
@@ -39,104 +39,151 @@ from fasterbench import benchmark
 
 # Load your model
 model = resnet18()
-
-# Create sample input
 dummy_input = torch.randn(1, 3, 224, 224)
 
 # Run comprehensive benchmarks
-results = benchmark(model, dummy_input)
+result = benchmark(model, dummy_input, metrics=["size", "speed", "compute"])
+
+# Typed access (IDE autocomplete!)
+print(f"Size: {result.size.size_mib:.2f} MiB")
+print(f"Params: {result.size.num_params:,}")
+print(f"CPU Latency: {result.speed['cpu'].mean_ms:.2f} ms")
+print(f"MACs: {result.compute.macs_m}M")
 
-# Print results
-for metric, value in results.items():
-    print(f"{metric}: {value}")
+# Backward-compatible dict access still works
+print(result["size_disk_bytes"])
 ```
 
 ## Features
 
-### All-in-one Benchmarking
+### BenchmarkResult: Typed Access + Backward Compatibility
 
-Get comprehensive metrics with a single function call:
+The
+[`benchmark()`](https://FasterAI-Labs.github.io/fasterbench/benchmark.html#benchmark)
+function returns a
+[`BenchmarkResult`](https://FasterAI-Labs.github.io/fasterbench/benchmark.html#benchmarkresult)
+object with both typed attribute access and dict-like access:
 
 ``` python
-# Measure all metrics
-results = benchmark(model, dummy_input)
+result = benchmark(model, dummy_input, metrics=["size", "speed", "compute"])
+
+# Typed access - IDE autocomplete and type checking
+result.size.size_mib          # 44.59
+result.size.num_params        # 11689512
+result.speed["cpu"].mean_ms   # 45.23
+result.speed["cpu"].throughput_s  # 22.1
+result.compute.macs_m         # 1819.066
+result.compute.macs_available # True (False if MACs couldn't be computed)
+
+# Dict access - backward compatible with existing code
+result["size_size_mib"]       # 44.59
+result["speed_cpu_mean_ms"]   # 45.23
+for key, value in result.items():
+    print(f"{key}: {value}")
+```
+
+### Human-Readable Summary
 
-# Or select specific metrics
-results = benchmark(model, dummy_input, metrics=["size", "speed"])
+Get a quick overview with formatted output:
+
+``` python
+result.summary()  # prints directly
 ```
 
-### Size Metrics
+    ═══ Size ════════════════════════════════════
+      Disk:   44.59 MiB
+      Params: 11.69M
+    ═══ Speed ═══════════════════════════════════
+      cpu: 45.23 ms  │  22.1 inf/s  │  p99: 48.12 ms
+    ═══ Compute ═════════════════════════════════
+      MACs:   1819.1 M
+      Params: 11.69 M
 
-Evaluate model size characteristics:
+### Export to DataFrame or JSON
 
 ``` python
-from fasterbench import compute_size
+# Convert to pandas DataFrame for analysis
+df = result.to_dataframe()
+df.to_csv("benchmark_results.csv")
 
-size_metrics = compute_size(model)
-print(f"Disk Size: {size_metrics.size_mib:.2f} MiB")
-print(f"Parameters: {size_metrics.num_params:,}")
+# Serialize to JSON
+json_str = result.to_json()
+
+# Get formatted string (for logging, etc.)
+summary_str = str(result)
 ```
 
-### Speed Metrics
+### Selective Metrics
 
-Measure inference performance across devices:
+Only compute what you need:
 
 ``` python
-from fasterbench import compute_speed_multi
+# Fast: just size and compute (no inference runs)
+result = benchmark(model, dummy_input, metrics=["size", "compute"])
 
-speed_metrics = compute_speed_multi(model, dummy_input)
-for device, metrics in speed_metrics.items():
-    print(f"{device} latency (P50): {metrics.p50_ms:.2f} ms")
-    print(f"{device} throughput: {metrics.throughput_s:.2f} inferences/sec")
+# Full benchmark on specific devices
+result = benchmark(model, dummy_input, 
+                   speed_devices=["cpu", "cuda"],
+                   memory_devices=["cuda"])
 ```
 
-### Compute Metrics
+### Individual Metric Functions
 
-Quantify computational complexity:
+For fine-grained control, use the individual compute functions:
 
 ``` python
-from fasterbench import compute_compute
-
-compute_metrics = compute_compute(model, dummy_input)
-print(f"MACs: {compute_metrics.macs_m} million")
+from fasterbench import compute_size, compute_speed_multi, compute_compute
+
+# Size metrics
+size = compute_size(model)
+print(f"Disk Size: {size.size_mib:.2f} MiB")
+print(f"Parameters: {size.num_params:,}")
+
+# Speed metrics across devices
+speed = compute_speed_multi(model, dummy_input)
+for device, metrics in speed.items():
+    print(f"{device}: {metrics.mean_ms:.2f}ms, {metrics.throughput_s:.1f} inf/s")
+
+# Compute metrics (MACs)
+compute = compute_compute(model, dummy_input)
+if compute.macs_available:
+    print(f"MACs: {compute.macs_m}M")
 ```
 
 ### Memory Metrics
 
-Profile memory usage:
+Profile memory usage on CPU and GPU:
 
 ``` python
 from fasterbench import compute_memory_multi
 
-memory_metrics = compute_memory_multi(model, dummy_input)
-for device, metrics in memory_metrics.items():
-    print(f"{device} peak memory: {metrics.peak_mib:.2f} MiB")
+memory = compute_memory_multi(model, dummy_input)
+for device, metrics in memory.items():
+    print(f"{device} peak: {metrics.peak_mib:.2f} MiB")
 ```
 
 ### Energy Metrics
 
-Measure environmental impact:
+Measure power consumption and carbon footprint (requires `codecarbon`):
 
 ``` python
 from fasterbench import compute_energy_multi
 
-# Requires codecarbon package
-energy_metrics = compute_energy_multi(model, dummy_input)
-for device, metrics in energy_metrics.items():
-    print(f"{device} power usage: {metrics.mean_watts:.2f} W")
-    print(f"{device} CO2: {metrics.co2_eq_g:.6f} g CO₂-eq per inference")
+energy = compute_energy_multi(model, dummy_input)
+for device, metrics in energy.items():
+    print(f"{device}: {metrics.mean_watts:.1f}W, {metrics.co2_eq_g:.4f}g CO₂/inf")
 ```
 
-### Thread Count Optimization
+### Thread Sweep for CPU Optimization
 
-Find the optimal number of CPU threads:
+Find the optimal thread count for CPU inference:
 
 ``` python
 from fasterbench import sweep_threads
 
-thread_results = sweep_threads(model, dummy_input, thread_counts=[1, 2, 4, 8, 16])
-for result in thread_results:
-    print(f"Threads: {result['threads']}, Latency: {result['mean_ms']:.2f} ms")
+results = sweep_threads(model, dummy_input, thread_counts=[1, 2, 4, 8])
+for r in results:
+    print(f"{r['threads']} threads: {r['mean_ms']:.2f}ms")
 ```
 
 ### Visualize Results
 
@@ -1 +1,43 @@
 __version__ = "0.0.6"
+"""Comprehensive benchmarking toolkit for deep learning models"""
+# NOTE(review): the string above follows `__version__`, so Python does not treat it as the module docstring — confirm whether it should come first.
+# AUTOGENERATED! DO NOT EDIT! File to edit: ../nbs/index.ipynb.
+
+# %% auto #0
+__all__ = []
+
+# %% ../nbs/index.ipynb #8b6f8c52
+from .benchmark import benchmark, BenchmarkResult
+from .size import SizeMetrics, compute_size, get_model_size, get_num_parameters
+from .speed import (
+    SpeedMetrics, compute_speed, compute_speed_multi,
+    sweep_threads, sweep_latency, sweep_batch_sizes,
+)
+from .profiling import profile_layers, LayerProfiler
+from .compute import ComputeMetrics, compute_compute
+from .memory import MemoryMetrics, compute_memory, compute_memory_multi
+from .energy import EnergyMetrics, compute_energy, compute_energy_multi
+from .plot import create_radar_plot, SPECS
+from .utils import parse_metric_value
+
+__all__ = [
+    # Main entry point
+    'benchmark', 'BenchmarkResult',
+    # Size
+    'SizeMetrics', 'compute_size', 'get_model_size', 'get_num_parameters',
+    # Speed
+    'SpeedMetrics', 'compute_speed', 'compute_speed_multi',
+    'sweep_threads', 'sweep_latency', 'sweep_batch_sizes',
+    # Profiling
+    'profile_layers', 'LayerProfiler',
+    # Compute
+    'ComputeMetrics', 'compute_compute',
+    # Memory
+    'MemoryMetrics', 'compute_memory', 'compute_memory_multi',
+    # Energy
+    'EnergyMetrics', 'compute_energy', 'compute_energy_multi',
+    # Plot
+    'create_radar_plot', 'SPECS',
+    # Utils
+    'parse_metric_value',
+]
@@ -5,14 +5,42 @@
                 'doc_host': 'https://FasterAI-Labs.github.io',
                 'git_url': 'https://github.com/FasterAI-Labs/fasterbench',
                 'lib_path': 'fasterbench'},
-  'syms': { 'fasterbench.benchmark': {'fasterbench.benchmark.benchmark': ('benchmark.html#benchmark', 'fasterbench/benchmark.py')},
+  'syms': { 'fasterbench.benchmark': { 'fasterbench.benchmark.BenchmarkResult': ( 'benchmark.html#benchmarkresult',
+                                                                                  'fasterbench/benchmark.py'),
+                                       'fasterbench.benchmark.BenchmarkResult.__getitem__': ( 'benchmark.html#benchmarkresult.__getitem__',
+                                                                                              'fasterbench/benchmark.py'),
+                                       'fasterbench.benchmark.BenchmarkResult.__iter__': ( 'benchmark.html#benchmarkresult.__iter__',
+                                                                                           'fasterbench/benchmark.py'),
+                                       'fasterbench.benchmark.BenchmarkResult.__len__': ( 'benchmark.html#benchmarkresult.__len__',
+                                                                                          'fasterbench/benchmark.py'),
+                                       'fasterbench.benchmark.BenchmarkResult.__repr__': ( 'benchmark.html#benchmarkresult.__repr__',
+                                                                                           'fasterbench/benchmark.py'),
+                                       'fasterbench.benchmark.BenchmarkResult.__str__': ( 'benchmark.html#benchmarkresult.__str__',
+                                                                                          'fasterbench/benchmark.py'),
+                                       'fasterbench.benchmark.BenchmarkResult._format_summary': ( 'benchmark.html#benchmarkresult._format_summary',
+                                                                                                  'fasterbench/benchmark.py'),
+                                       'fasterbench.benchmark.BenchmarkResult.as_dict': ( 'benchmark.html#benchmarkresult.as_dict',
+                                                                                          'fasterbench/benchmark.py'),
+                                       'fasterbench.benchmark.BenchmarkResult.summary': ( 'benchmark.html#benchmarkresult.summary',
+                                                                                          'fasterbench/benchmark.py'),
+                                       'fasterbench.benchmark.BenchmarkResult.to_dataframe': ( 'benchmark.html#benchmarkresult.to_dataframe',
+                                                                                               'fasterbench/benchmark.py'),
+                                       'fasterbench.benchmark.BenchmarkResult.to_json': ( 'benchmark.html#benchmarkresult.to_json',
+                                                                                          'fasterbench/benchmark.py'),
+                                       'fasterbench.benchmark._fmt_params': ('benchmark.html#_fmt_params', 'fasterbench/benchmark.py'),
+                                       'fasterbench.benchmark._section': ('benchmark.html#_section', 'fasterbench/benchmark.py'),
+                                       'fasterbench.benchmark.benchmark': ('benchmark.html#benchmark', 'fasterbench/benchmark.py')},
             'fasterbench.compute': { 'fasterbench.compute.ComputeMetrics': ('compute.html#computemetrics', 'fasterbench/compute.py'),
                                      'fasterbench.compute.ComputeMetrics.as_dict': ( 'compute.html#computemetrics.as_dict',
                                                                                      'fasterbench/compute.py'),
+                                     'fasterbench.compute.ComputeMetrics.macs_available': ( 'compute.html#computemetrics.macs_available',
+                                                                                            'fasterbench/compute.py'),
                                      'fasterbench.compute.compute_compute': ('compute.html#compute_compute', 'fasterbench/compute.py')},
             'fasterbench.core': { 'fasterbench.core._bytes_to_mib': ('core.html#_bytes_to_mib', 'fasterbench/core.py'),
                                   'fasterbench.core._device_ctx': ('core.html#_device_ctx', 'fasterbench/core.py'),
-                                  'fasterbench.core._sync': ('core.html#_sync', 'fasterbench/core.py')},
+                                  'fasterbench.core._sync': ('core.html#_sync', 'fasterbench/core.py'),
+                                  'fasterbench.core._validate_benchmark_params': ( 'core.html#_validate_benchmark_params',
+                                                                                   'fasterbench/core.py')},
             'fasterbench.energy': { 'fasterbench.energy.EnergyMetrics': ('energy.html#energymetrics', 'fasterbench/energy.py'),
                                     'fasterbench.energy.EnergyMetrics.as_dict': ( 'energy.html#energymetrics.as_dict',
                                                                                   'fasterbench/energy.py'),
@@ -29,6 +57,27 @@
                                                                                  'fasterbench/memory.py')},
             'fasterbench.plot': { 'fasterbench.plot._parse': ('plot.html#_parse', 'fasterbench/plot.py'),
                                   'fasterbench.plot.create_radar_plot': ('plot.html#create_radar_plot', 'fasterbench/plot.py')},
+            'fasterbench.profiling': { 'fasterbench.profiling.LayerProfiler': ('profiling.html#layerprofiler', 'fasterbench/profiling.py'),
+                                       'fasterbench.profiling.LayerProfiler.__init__': ( 'profiling.html#layerprofiler.__init__',
+                                                                                         'fasterbench/profiling.py'),
+                                       'fasterbench.profiling.LayerProfiler._profile_compute': ( 'profiling.html#layerprofiler._profile_compute',
+                                                                                                 'fasterbench/profiling.py'),
+                                       'fasterbench.profiling.LayerProfiler._profile_memory': ( 'profiling.html#layerprofiler._profile_memory',
+                                                                                                'fasterbench/profiling.py'),
+                                       'fasterbench.profiling.LayerProfiler._profile_size': ( 'profiling.html#layerprofiler._profile_size',
+                                                                                              'fasterbench/profiling.py'),
+                                       'fasterbench.profiling.LayerProfiler._profile_speed': ( 'profiling.html#layerprofiler._profile_speed',
+                                                                                               'fasterbench/profiling.py'),
+                                       'fasterbench.profiling.LayerProfiler.profile': ( 'profiling.html#layerprofiler.profile',
+                                                                                        'fasterbench/profiling.py'),
+                                       'fasterbench.profiling.LayerProfiler.summary': ( 'profiling.html#layerprofiler.summary',
+                                                                                        'fasterbench/profiling.py'),
+                                       'fasterbench.profiling.LayerProfiler.top': ( 'profiling.html#layerprofiler.top',
+                                                                                    'fasterbench/profiling.py'),
+                                       'fasterbench.profiling._output_bytes': ('profiling.html#_output_bytes', 'fasterbench/profiling.py'),
+                                       'fasterbench.profiling._tensor_bytes': ('profiling.html#_tensor_bytes', 'fasterbench/profiling.py'),
+                                       'fasterbench.profiling.profile_layers': ( 'profiling.html#profile_layers',
+                                                                                 'fasterbench/profiling.py')},
             'fasterbench.size': { 'fasterbench.size.SizeMetrics': ('size.html#sizemetrics', 'fasterbench/size.py'),
                                   'fasterbench.size.SizeMetrics.as_dict': ('size.html#sizemetrics.as_dict', 'fasterbench/size.py'),
                                   'fasterbench.size.compute_size': ('size.html#compute_size', 'fasterbench/size.py'),
@@ -40,6 +89,7 @@
                                    'fasterbench.speed._stats': ('speed.html#_stats', 'fasterbench/speed.py'),
                                    'fasterbench.speed.compute_speed': ('speed.html#compute_speed', 'fasterbench/speed.py'),
                                    'fasterbench.speed.compute_speed_multi': ('speed.html#compute_speed_multi', 'fasterbench/speed.py'),
+                                   'fasterbench.speed.sweep_batch_sizes': ('speed.html#sweep_batch_sizes', 'fasterbench/speed.py'),
                                    'fasterbench.speed.sweep_latency': ('speed.html#sweep_latency', 'fasterbench/speed.py'),
                                    'fasterbench.speed.sweep_threads': ('speed.html#sweep_threads', 'fasterbench/speed.py')},
             'fasterbench.utils': {'fasterbench.utils.parse_metric_value': ('utils.html#parse_metric_value', 'fasterbench/utils.py')}}}