nomadkaraoke
diff --git a/‎README.md‎
Lines changed: 176 additions & 3 deletions b/‎README.md‎
Lines changed: 176 additions & 3 deletions
diff --git a/‎audio_separator/remote/__init__.py‎
Lines changed: 3 additions & 0 deletions b/‎audio_separator/remote/__init__.py‎
Lines changed: 3 additions & 0 deletions
diff --git a/‎audio_separator/remote/api_client.py‎
Lines changed: 187 additions & 0 deletions b/‎audio_separator/remote/api_client.py‎
Lines changed: 187 additions & 0 deletions
@@ -159,7 +159,7 @@ python -m pip install ort-nightly-gpu --index-url=https://aiinfra.pkgs.visualstu
 You can use Audio Separator via the command line, for example:
 
 ```sh
-audio-separator /path/to/your/input/audio.wav --model_filename UVR-MDX-NET-Inst_HQ_3.onnx
+audio-separator /path/to/your/input/audio.wav --model_filename model_bs_roformer_ep_317_sdr_12.9755.ckpt
 ```
 
 This command will download the specified model file, process the `audio.wav` input audio and generate two new files in the current directory, one containing vocals and one containing instrumental.
@@ -342,7 +342,7 @@ from audio_separator.separator import Separator
 separator = Separator()
 
 # Load a model
-separator.load_model(model_filename='UVR-MDX-NET-Inst_HQ_3.onnx')
+separator.load_model(model_filename='model_bs_roformer_ep_317_sdr_12.9755.ckpt')
 
 # Separate multiple audio files without reloading the model
 output_files = separator.separate(['audio1.wav', 'audio2.wav', 'audio3.wav'])
@@ -362,7 +362,7 @@ from audio_separator.separator import Separator
 separator = Separator()
 
 # Load a model
-separator.load_model(model_filename='UVR-MDX-NET-Inst_HQ_3.onnx')
+separator.load_model(model_filename='model_bs_roformer_ep_317_sdr_12.9755.ckpt')
 
 # Separate all audio files located in a folder
 output_files = separator.separate('path/to/audio_directory')
@@ -439,6 +439,179 @@ You can also rename specific stems:
 - **`demucs_params`:** (Optional) Demucs Architecture Specific Attributes & Defaults. `Default: {"segment_size": "Default", "shifts": 2, "overlap": 0.25, "segments_enabled": True}`
 - **`mdxc_params`:** (Optional) MDXC Architecture Specific Attributes & Defaults. `Default: {"segment_size": 256, "override_model_segment_size": False, "batch_size": 1, "overlap": 8, "pitch_shift": 0}`
 
+
+## Remote API Usage 🌐
+
+Audio Separator includes a remote API client that allows you to connect to a deployed Audio Separator API service, enabling you to perform audio separation without running the models locally. The API uses asynchronous processing with job polling for efficient handling of separation tasks.
+
+### Deploying the API Server
+
+To use the remote API functionality, you'll need to deploy the Audio Separator API server. The easiest way is using Modal.com:
+
+1. **Sign up for Modal.com** at [modal.com](https://modal.com)
+2. **Install the Modal CLI** and authenticate:
+   ```bash
+   pip install modal
+   modal setup
+   ```
+3. **Deploy the Audio Separator API**:
+   ```bash
+   modal deploy audio_separator/remote/deploy_modal.py
+   ```
+4. **Get your API URL** from the deployment output. It will look like:
+   ```
+   https://USERNAME--audio-separator-api.modal.run
+   ```
+
+Set this API URL as an environment variable:
+```bash
+export AUDIO_SEPARATOR_API_URL="https://USERNAME--audio-separator-api.modal.run"
+```
+
+Alternatively, pass the URL directly to the `audio-separator-remote` CLI with the `--api_url` option.
+
+### Remote API Client (Python)
+
+You can use the `AudioSeparatorAPIClient` class to interact with a remote Audio Separator API:
+
+```python
+import logging
+from audio_separator.remote import AudioSeparatorAPIClient
+
+# Set up logging
+logger = logging.getLogger(__name__)
+
+# Initialize the API client
+api_client = AudioSeparatorAPIClient("https://USERNAME--audio-separator-api.modal.run", logger)
+
+# Simple example: separate audio and get results
+result = api_client.separate_audio_and_wait("audio.mp3")
+if result["status"] == "completed":
+    print(f"✅ Separation completed! Downloaded files:")
+    for file_path in result["downloaded_files"]:
+        print(f"  - {file_path}")
+else:
+    print(f"❌ Separation failed: {result.get('error', 'Unknown error')}")
+
+# Complex example with custom options
+result = api_client.separate_audio_and_wait(
+    "path/to/audio.wav",
+    model="model_bs_roformer_ep_317_sdr_12.9755.ckpt",
+    timeout=300,           # Wait up to 5 minutes
+    poll_interval=10,      # Check status every 10 seconds
+    download=True,         # Automatically download files
+    output_dir="./output"  # Save files to specific directory
+)
+
+# Advanced approach: manual job management (for custom polling logic)
+result = api_client.separate_audio("path/to/audio.wav", model="model_bs_roformer_ep_317_sdr_12.9755.ckpt")
+task_id = result["task_id"]
+print(f"Job submitted! Task ID: {task_id}")
+
+# Custom polling logic
+import time
+while True:
+    status = api_client.get_job_status(task_id)
+    print(f"Job status: {status['status']}")
+    
+    if status["status"] == "completed":
+        # Download files manually
+        for filename in status["files"]:
+            output_path = api_client.download_file(task_id, filename)
+            print(f"Downloaded: {output_path}")
+        break
+    elif status["status"] == "error":
+        print(f"Job failed: {status.get('error', 'Unknown error')}")
+        break
+    else:
+        if "progress" in status:
+            print(f"Progress: {status['progress']}%")
+        time.sleep(10)  # Wait 10 seconds
+
+# List available models
+models = api_client.list_models()
+print(models["text"])
+
+# Get server version
+version = api_client.get_server_version()
+print(f"Server version: {version}")
+```
+
+### Remote API CLI
+
+Audio Separator also provides a command-line interface for interacting with remote APIs:
+
+#### Commands
+
+**Separate audio files:**
+```bash
+# Separate audio file (asynchronous processing)
+audio-separator-remote separate audio.wav --model model_bs_roformer_ep_317_sdr_12.9755.ckpt
+
+# Multiple files
+audio-separator-remote separate audio1.wav audio2.wav audio3.wav
+
+# Use default model (if not specified)
+audio-separator-remote separate audio.wav
+```
+
+**Check job status:**
+```bash
+audio-separator-remote status <task_id>
+```
+
+**List available models:**
+```bash
+# Pretty formatted list
+audio-separator-remote models
+
+# JSON output
+audio-separator-remote models --format json
+
+# Filter by stem type
+audio-separator-remote models --filter vocals
+```
+
+**Download specific files:**
+```bash
+audio-separator-remote download <task_id> filename1.wav filename2.wav
+```
+
+**Get version information:**
+```bash
+audio-separator-remote --version
+```
+
+#### CLI Options
+
+- `--api_url`: Override the API URL
+- `--timeout`: Set timeout for polling (default: 600 seconds)
+- `--poll_interval`: Set polling interval (default: 10 seconds)
+- `--debug`: Enable debug logging
+- `--log_level`: Set log level (info, debug, warning, etc.)
+
+#### Examples
+
+```bash
+# Separate with custom settings
+audio-separator-remote separate song.mp3 \
+  --model model_bs_roformer_ep_317_sdr_12.9755.ckpt \
+  --api_url https://my-api.com \
+  --timeout 300
+
+# Check status with debug logging
+audio-separator-remote status abc123 --debug
+
+# List vocal separation models in JSON format
+audio-separator-remote models --filter vocals --format json
+```
+
+The remote API client automatically handles:
+- File uploading and downloading
+- Job polling and status updates
+- Error handling, including retrying failed status polls
+- Progress reporting
+
 ## Requirements 📋
 
 Python >= 3.10
 
@@ -0,0 +1,3 @@
+from .api_client import AudioSeparatorAPIClient
+
+__all__ = ["AudioSeparatorAPIClient"]
@@ -0,0 +1,187 @@
+#!/usr/bin/env python
+import os
+import logging
+from typing import Optional
+
+import requests
+
+
+class AudioSeparatorAPIClient:
+    """Client for interacting with a remotely deployed Audio Separator API.
+
+    All HTTP requests are sent through one ``requests.Session``. Jobs are
+    asynchronous: ``separate_audio`` uploads a file and returns the server's
+    response (which carries a task ID), ``get_job_status`` polls that task and
+    ``download_file`` fetches one output file. ``separate_audio_and_wait``
+    chains the three steps together.
+    """
+
+    def __init__(self, api_url: str, logger: logging.Logger):
+        """Create a client.
+
+        Args:
+            api_url: Base URL of the deployed API.
+            logger: Logger that receives progress and error messages.
+        """
+        # Endpoints are appended as "/separate", "/status/...", etc.; dropping a
+        # trailing slash here keeps the joined URLs free of "//".
+        self.api_url = api_url.rstrip("/")
+        self.logger = logger
+        self.session = requests.Session()
+
+    def separate_audio(self, file_path: str, model: Optional[str] = None) -> dict:
+        """Submit audio separation job (asynchronous processing).
+
+        Args:
+            file_path: Path to the audio file to upload.
+            model: Model to request; left out of the request when not given.
+
+        Returns:
+            The server's JSON response. ``separate_audio_and_wait`` reads its
+            ``task_id`` key.
+
+        Raises:
+            FileNotFoundError: If ``file_path`` does not exist.
+            requests.RequestException: If the request fails or the server
+                answers with an HTTP error status (logged, then re-raised).
+        """
+        if not os.path.exists(file_path):
+            raise FileNotFoundError(f"Audio file not found: {file_path}")
+
+        data = {}
+        if model:
+            data["model"] = model
+
+        # The context manager closes the upload handle on every exit path.
+        with open(file_path, "rb") as audio_file:
+            files = {"file": (os.path.basename(file_path), audio_file)}
+            try:
+                # Increase timeout for large files (5 minutes)
+                response = self.session.post(f"{self.api_url}/separate", files=files, data=data, timeout=300)
+                response.raise_for_status()
+                return response.json()
+            except requests.RequestException as e:
+                self.logger.error(f"Separation request failed: {e}")
+                raise
+
+    def separate_audio_and_wait(self, file_path: str, model: Optional[str] = None, timeout: int = 600, poll_interval: int = 10, download: bool = True, output_dir: Optional[str] = None) -> dict:
+        """
+        Submit audio separation job and wait for completion (convenience method).
+
+        This method handles the full workflow: submit job, poll for completion,
+        and optionally download the result files.
+
+        Args:
+            file_path: Path to the audio file to separate
+            model: Model to use for separation (optional)
+            timeout: Maximum time to wait for completion in seconds (default: 600)
+            poll_interval: How often to check status in seconds (default: 10)
+            download: Whether to automatically download result files (default: True)
+            output_dir: Directory to save downloaded files (default: current directory).
+                It is created if it does not exist yet.
+
+        Returns:
+            dict with keys:
+                - task_id: The job task ID
+                - status: "completed", "error" or "timeout"
+                - files: List of output filenames (empty unless completed)
+                - downloaded_files: List of local file paths (only when the job
+                  completed and download=True); files whose download failed
+                  are logged and left out
+                - error: Error message (if status is "error" or "timeout")
+
+        Raises:
+            FileNotFoundError: If ``file_path`` does not exist.
+            requests.RequestException: If submitting the job fails. Errors
+                while polling are logged and the poll is retried instead.
+        """
+        import time
+
+        # Submit the separation job
+        self.logger.info(f"Submitting separation job for '{file_path}'...")
+        result = self.separate_audio(file_path, model)
+        task_id = result["task_id"]
+        self.logger.info(f"Job submitted! Task ID: {task_id}")
+
+        # Poll for completion
+        self.logger.info("Waiting for separation to complete...")
+        # A monotonic clock keeps the timeout correct even if the system clock
+        # is adjusted while waiting.
+        start_time = time.monotonic()
+        last_progress = -1
+
+        while time.monotonic() - start_time < timeout:
+            try:
+                status = self.get_job_status(task_id)
+                current_status = status.get("status", "unknown")
+
+                # Show progress if it changed
+                if "progress" in status and status["progress"] != last_progress:
+                    self.logger.info(f"Progress: {status['progress']}%")
+                    last_progress = status["progress"]
+
+                # Check if completed
+                if current_status == "completed":
+                    self.logger.info("✅ Separation completed!")
+
+                    filenames = status.get("files", [])
+                    result = {"task_id": task_id, "status": "completed", "files": filenames}
+
+                    # Download files if requested
+                    if download:
+                        self.logger.info(f"📥 Downloading {len(filenames)} output files...")
+                        downloaded_files = self._download_outputs(task_id, filenames, output_dir)
+                        result["downloaded_files"] = downloaded_files
+                        self.logger.info(f"🎉 Successfully downloaded {len(downloaded_files)} files!")
+
+                    return result
+
+                elif current_status == "error":
+                    error_msg = status.get("error", "Unknown error")
+                    self.logger.error(f"❌ Job failed: {error_msg}")
+                    return {"task_id": task_id, "status": "error", "error": error_msg, "files": []}
+
+                # Wait before next poll
+                time.sleep(poll_interval)
+
+            except Exception as e:
+                # Best effort: a failed poll is logged and retried until the timeout expires.
+                self.logger.warning(f"Error polling status: {e}")
+                time.sleep(poll_interval)
+
+        # Timeout reached
+        self.logger.error(f"❌ Job polling timed out after {timeout} seconds")
+        return {"task_id": task_id, "status": "timeout", "error": f"Job polling timed out after {timeout} seconds", "files": []}
+
+    def _download_outputs(self, task_id: str, filenames: list, output_dir: Optional[str]) -> list:
+        """Download every output file of a job, logging (not raising) per-file failures.
+
+        Returns the local paths of the files that were downloaded successfully.
+        """
+        if output_dir:
+            try:
+                # Create the target directory up front; without it every
+                # download into a not-yet-existing directory fails on open().
+                os.makedirs(output_dir, exist_ok=True)
+            except OSError as e:
+                self.logger.error(f"  ❌ Failed to create output directory {output_dir}: {e}")
+
+        downloaded_files = []
+        for filename in filenames:
+            try:
+                output_path = os.path.join(output_dir, filename) if output_dir else filename
+                downloaded_path = self.download_file(task_id, filename, output_path)
+                downloaded_files.append(downloaded_path)
+                self.logger.info(f"  ✅ Downloaded: {downloaded_path}")
+            except Exception as e:
+                self.logger.error(f"  ❌ Failed to download {filename}: {e}")
+
+        return downloaded_files
+
+    def get_job_status(self, task_id: str) -> dict:
+        """Get job status.
+
+        Args:
+            task_id: Task ID returned when the job was submitted.
+
+        Returns:
+            The server's JSON response. ``separate_audio_and_wait`` reads its
+            ``status``, ``progress``, ``files`` and ``error`` keys.
+
+        Raises:
+            requests.RequestException: If the request fails or the server
+                answers with an HTTP error status (logged, then re-raised).
+        """
+        try:
+            response = self.session.get(f"{self.api_url}/status/{task_id}", timeout=10)
+            response.raise_for_status()
+            return response.json()
+        except requests.RequestException as e:
+            self.logger.error(f"Status request failed: {e}")
+            raise
+
+    def download_file(self, task_id: str, filename: str, output_path: Optional[str] = None) -> str:
+        """Download a file from a completed job.
+
+        Args:
+            task_id: Task ID of the job that produced the file.
+            filename: Name of the output file on the server.
+            output_path: Local path to write to (default: ``filename`` in the
+                current directory).
+
+        Returns:
+            The local path the file was written to.
+
+        Raises:
+            requests.RequestException: If the request fails or the server
+                answers with an HTTP error status (logged, then re-raised).
+            OSError: If the local file cannot be opened or written.
+        """
+        from urllib.parse import quote
+
+        if output_path is None:
+            output_path = filename
+
+        # Percent-encode the filename so characters such as "#", "?" or spaces
+        # stay part of the URL path instead of being read as URL syntax.
+        url = f"{self.api_url}/download/{task_id}/{quote(filename)}"
+
+        try:
+            # Stream the body in chunks so a large audio file is written to disk
+            # without first being held in memory in full.
+            with self.session.get(url, timeout=60, stream=True) as response:
+                response.raise_for_status()
+
+                with open(output_path, "wb") as f:
+                    for chunk in response.iter_content(chunk_size=1024 * 1024):
+                        f.write(chunk)
+
+            return output_path
+        except requests.RequestException as e:
+            self.logger.error(f"Download failed: {e}")
+            raise
+
+    def list_models(self, format_type: str = "pretty", filter_by: Optional[str] = None) -> dict:
+        """List available models.
+
+        Args:
+            format_type: "json" requests the ``/models-json`` endpoint; any
+                other value requests the plain-text ``/models`` endpoint.
+            filter_by: Value sent as the ``filter_sort_by`` query parameter.
+                It is only sent with the plain-text request; the JSON request
+                is made without it.
+
+        Returns:
+            The parsed JSON response when ``format_type`` is "json", otherwise
+            ``{"text": <response body>}``.
+
+        Raises:
+            requests.RequestException: If the request fails or the server
+                answers with an HTTP error status (logged, then re-raised).
+        """
+        try:
+            if format_type == "json":
+                response = self.session.get(f"{self.api_url}/models-json", timeout=10)
+            else:
+                # Let requests build the query string so the filter value is URL-encoded.
+                params = {"filter_sort_by": filter_by} if filter_by else None
+                response = self.session.get(f"{self.api_url}/models", params=params, timeout=10)
+
+            response.raise_for_status()
+
+            if format_type == "json":
+                return response.json()
+            else:
+                return {"text": response.text}
+        except requests.RequestException as e:
+            self.logger.error(f"Models request failed: {e}")
+            raise
+
+    def get_server_version(self) -> str:
+        """Get the server version.
+
+        Returns:
+            The ``version`` field of the ``/health`` response, or "unknown"
+            when the response has no such field.
+
+        Raises:
+            requests.RequestException: If the request fails or the server
+                answers with an HTTP error status (logged, then re-raised).
+        """
+        try:
+            response = self.session.get(f"{self.api_url}/health", timeout=10)
+            response.raise_for_status()
+            health_data = response.json()
+            return health_data.get("version", "unknown")
+        except requests.RequestException as e:
+            self.logger.error(f"Health check request failed: {e}")
+            raise
Original file line number	Diff line number	Diff line change
`@@ -0,0 +1,3 @@`
	`1`	`+from .api_client import AudioSeparatorAPIClient`
	`2`	`+`
	`3`	`+__all__ = ["AudioSeparatorAPIClient"]`