Add NVIDIA provider

Patel230 · Patel230 · commit d8c3a0c65c60 · 2026-03-16T19:30:17.000+05:30
diff --git a/nvidia.go b/nvidia.go
@@ -0,0 +1,92 @@
+package iteragent
+
+import (
+	"bytes"
+	"context"
+	"encoding/json"
+	"fmt"
+	"io"
+	"net/http"
+	"strings"
+	"time"
+)
+
+// nvidiaDefaultBaseURL is the endpoint root used when the config leaves
+// BaseURL empty.
+const nvidiaDefaultBaseURL = "https://integrate.api.nvidia.com/v1"
+
+// nvidiaProvider is a Provider that sends chat-completion requests to an
+// NVIDIA endpoint using the openaiRequest/openaiResponse wire types.
+type nvidiaProvider struct {
+	cfg    OpenAICompatConfig
+	client *http.Client
+}
+
+// NewNvidia returns a Provider backed by the NVIDIA chat-completions API.
+// Every request made through it is bounded by a 120-second client timeout.
+func NewNvidia(cfg OpenAICompatConfig) Provider {
+	return &nvidiaProvider{
+		cfg:    cfg,
+		client: &http.Client{Timeout: 120 * time.Second},
+	}
+}
+
+// Name reports the provider label together with the configured model.
+func (p *nvidiaProvider) Name() string {
+	return fmt.Sprintf("nvidia(%s)", p.cfg.Model)
+}
+
+// Complete posts messages as a non-streaming chat completion and returns the
+// content of the first choice. It returns an error if the request cannot be
+// built or sent, the status is not 200 OK, the body cannot be decoded, or the
+// response contains no choices.
+func (p *nvidiaProvider) Complete(ctx context.Context, messages []Message) (string, error) {
+	// Trim trailing slashes so a BaseURL such as ".../v1/" does not produce a
+	// "//chat/completions" path.
+	base := strings.TrimRight(p.cfg.BaseURL, "/")
+	if base == "" {
+		base = nvidiaDefaultBaseURL
+	}
+	url := base + "/chat/completions"
+
+	body, err := json.Marshal(openaiRequest{
+		Model:    p.cfg.Model,
+		Messages: messages,
+		Stream:   false,
+	})
+	if err != nil {
+		return "", fmt.Errorf("marshal request: %w", err)
+	}
+
+	req, err := http.NewRequestWithContext(ctx, http.MethodPost, url, bytes.NewReader(body))
+	if err != nil {
+		return "", fmt.Errorf("create request: %w", err)
+	}
+	req.Header.Set("Content-Type", "application/json")
+	req.Header.Set("Authorization", "Bearer "+p.cfg.APIKey)
+
+	resp, err := p.client.Do(req)
+	if err != nil {
+		return "", fmt.Errorf("do request: %w", err)
+	}
+	defer resp.Body.Close()
+
+	// Read the body before checking the status so that error responses can
+	// include the server's message.
+	respBody, err := io.ReadAll(resp.Body)
+	if err != nil {
+		return "", fmt.Errorf("read response: %w", err)
+	}
+	if resp.StatusCode != http.StatusOK {
+		return "", fmt.Errorf("nvidia API error (%d): %s", resp.StatusCode, string(respBody))
+	}
+
+	var parsed openaiResponse
+	if err := json.Unmarshal(respBody, &parsed); err != nil {
+		return "", fmt.Errorf("unmarshal response: %w", err)
+	}
+	if len(parsed.Choices) == 0 {
+		return "", fmt.Errorf("no response from nvidia")
+	}
+	return parsed.Choices[0].Message.Content, nil
+}
diff --git a/provider.go b/provider.go
@@ -13,7 +13,7 @@ type Provider interface {
 }
 
 // NewProvider returns the provider selected by ITERATE_PROVIDER.
-// Supported values: ollama, openai, anthropic, groq, gemini (default: gemini)
+// Supported values: ollama, openai, anthropic, groq, gemini, nvidia (default: gemini)
 // If apiKey is provided, it takes priority over environment variables.
 func NewProvider(providerName string, apiKey ...string) (Provider, error) {
 	providedKey := ""
@@ -94,6 +94,20 @@ func NewProvider(providerName string, apiKey ...string) (Provider, error) {
 			APIKey: key,
 		}), nil
 
+	case "nvidia":
+		key := providedKey
+		if key == "" {
+			key = os.Getenv("NVIDIA_API_KEY")
+		}
+		if key == "" {
+			return nil, fmt.Errorf("NVIDIA_API_KEY is required for nvidia provider (or use --api-key)")
+		}
+		return NewNvidia(OpenAICompatConfig{
+			BaseURL: getEnvOr("NVIDIA_BASE_URL", "https://integrate.api.nvidia.com/v1"),
+			Model:   getEnvOr("ITERATE_MODEL", "nvidia/llama-3.3-nemotron-70b-instruct"),
+			APIKey:  key,
+		}), nil
+
 	default:
 		baseURL := os.Getenv("ITERATE_BASE_URL")
 		if baseURL == "" {