PrimeIntellect-ai
diff --git a/configs/endpoints.py b/configs/endpoints.py
Lines changed: 71 additions & 9 deletions
diff --git a/docs/development.md b/docs/development.md
Lines changed: 3 additions & 4 deletions
diff --git a/docs/evaluation.md b/docs/evaluation.md
Lines changed: 11 additions & 1 deletion
@@ -4,187 +4,249 @@
         "model": "allenai/olmo-3-32b-think",
         "url": "https://api.pinference.ai/api/v1",
         "key": "PRIME_API_KEY",
+        "type": "openai_chat_completions",
     },
     "olmo3-7b-i": {
         "model": "allenai/olmo-3-7b-instruct",
         "url": "https://api.pinference.ai/api/v1",
         "key": "PRIME_API_KEY",
+        "type": "openai_chat_completions",
     },
     "olmo3-7b-t": {
         "model": "allenai/olmo-3-7b-think",
         "url": "https://api.pinference.ai/api/v1",
         "key": "PRIME_API_KEY",
+        "type": "openai_chat_completions",
     },
     # arcee
     "trinity-mini": {
         "model": "arcee/trinity-mini",
         "url": "https://api.pinference.ai/api/v1",
         "key": "PRIME_API_KEY",
+        "type": "openai_chat_completions",
     },
     # anthropic
     "haiku": {
-        "model": "anthropic/claude-4.5-haiku",
-        "url": "https://api.pinference.ai/api/v1",
-        "key": "PRIME_API_KEY",
+        "model": "claude-haiku-4-5",
+        "url": "https://api.anthropic.com",
+        "key": "ANTHROPIC_API_KEY",
+        "type": "anthropic_messages",
     },
     "sonnet": {
-        "model": "anthropic/claude-4.5-sonnet",
-        "url": "https://api.pinference.ai/api/v1",
-        "key": "PRIME_API_KEY",
+        "model": "claude-sonnet-4-5",
+        "url": "https://api.anthropic.com",
+        "key": "ANTHROPIC_API_KEY",
+        "type": "anthropic_messages",
     },
     "opus": {
-        "model": "anthropic/claude-4.5-opus",
-        "url": "https://api.pinference.ai/api/v1",
-        "key": "PRIME_API_KEY",
+        "model": "claude-opus-4-5",
+        "url": "https://api.anthropic.com",
+        "key": "ANTHROPIC_API_KEY",
+        "type": "anthropic_messages",
+    },
+    # deepseek
+    "deepseek-chat": {
+        "model": "deepseek-chat",
+        "url": "https://api.deepseek.com/v1",
+        "key": "DEEPSEEK_API_KEY",
+        "type": "openai_chat_completions",
+    },
+    "deepseek-reasoner": {
+        "model": "deepseek-reasoner",
+        "url": "https://api.deepseek.com/v1",
+        "key": "DEEPSEEK_API_KEY",
+        "type": "openai_chat_completions",
+    },
+    # deepseek (Anthropic-compatible)
+    "deepseek-chat-anth": {
+        "model": "deepseek-chat",
+        "url": "https://api.deepseek.com/anthropic",
+        "key": "DEEPSEEK_API_KEY",
+        "type": "anthropic_messages",
+    },
+    "deepseek-reasoner-anth": {
+        "model": "deepseek-reasoner",
+        "url": "https://api.deepseek.com/anthropic",
+        "key": "DEEPSEEK_API_KEY",
+        "type": "anthropic_messages",
     },
     # google
     "gemini-2.5-flash": {
         "model": "google/gemini-2.5-flash",
         "url": "https://api.pinference.ai/api/v1",
         "key": "PRIME_API_KEY",
+        "type": "openai_chat_completions",
     },
     "gemini-2.5-pro": {
         "model": "google/gemini-2.5-pro",
         "url": "https://api.pinference.ai/api/v1",
         "key": "PRIME_API_KEY",
+        "type": "openai_chat_completions",
     },
     "gemini-3-flash": {
         "model": "google/gemini-3-flash",
         "url": "https://api.pinference.ai/api/v1",
         "key": "PRIME_API_KEY",
+        "type": "openai_chat_completions",
     },
     "gemini-3-pro": {
         "model": "google/gemini-3-pro-preview",
         "url": "https://api.pinference.ai/api/v1",
         "key": "PRIME_API_KEY",
+        "type": "openai_chat_completions",
     },
     "gemini-3-pro-exp": {
         "model": "google/gemini-3-pro-preview",
         "url": "https://api.pinference.ai/api/v1",
         "key": "PRIME_API_KEY",
+        "type": "openai_chat_completions",
     },
     # qwen
     "qwen3-30b-i": {
         "model": "qwen/qwen3-30b-a3b-instruct-2507",
         "url": "https://api.pinference.ai/api/v1",
         "key": "PRIME_API_KEY",
+        "type": "openai_chat_completions",
     },
     "qwen3-30b-t": {
         "model": "qwen/qwen3-30b-a3b-thinking-2507",
         "url": "https://api.pinference.ai/api/v1",
         "key": "PRIME_API_KEY",
+        "type": "openai_chat_completions",
     },
     "qwen3-235b-i": {
         "model": "qwen/qwen3-235b-a22b-instruct-2507",
         "url": "https://api.pinference.ai/api/v1",
         "key": "PRIME_API_KEY",
+        "type": "openai_chat_completions",
     },
     "qwen3-235b-t": {
         "model": "qwen/qwen3-235b-a22b-thinking-2507",
         "url": "https://api.pinference.ai/api/v1",
         "key": "PRIME_API_KEY",
+        "type": "openai_chat_completions",
     },
     "qwen3-vl-30b-i": {
         "model": "qwen/qwen3-vl-30b-a3b-instruct",
         "url": "https://api.pinference.ai/api/v1",
         "key": "PRIME_API_KEY",
+        "type": "openai_chat_completions",
     },
     "qwen3-vl-30b-t": {
         "model": "qwen/qwen3-vl-30b-a3b-thinking",
         "url": "https://api.pinference.ai/api/v1",
         "key": "PRIME_API_KEY",
+        "type": "openai_chat_completions",
     },
     "qwen3-vl-235b-i": {
         "model": "qwen/qwen3-vl-235b-a22b-instruct",
         "url": "https://api.pinference.ai/api/v1",
         "key": "PRIME_API_KEY",
+        "type": "openai_chat_completions",
     },
     "qwen3-vl-235b-t": {
         "model": "qwen/qwen3-vl-235b-a22b-thinking",
         "url": "https://api.pinference.ai/api/v1",
         "key": "PRIME_API_KEY",
+        "type": "openai_chat_completions",
     },
     # moonshot
     "kimi-k2": {
         "model": "moonshotai/kimi-k2-0905",
         "url": "https://api.pinference.ai/api/v1",
         "key": "PRIME_API_KEY",
+        "type": "openai_chat_completions",
     },
     "kimi-k2-t": {
         "model": "moonshotai/kimi-k2-thinking",
         "url": "https://api.pinference.ai/api/v1",
         "key": "PRIME_API_KEY",
+        "type": "openai_chat_completions",
     },
     # openai
     "gpt-oss-120b": {
         "model": "openai/gpt-oss-120b",
         "url": "https://api.pinference.ai/api/v1",
         "key": "PRIME_API_KEY",
+        "type": "openai_chat_completions",
     },
     "gpt-oss-20b": {
         "model": "openai/gpt-oss-20b",
         "url": "https://api.pinference.ai/api/v1",
         "key": "PRIME_API_KEY",
+        "type": "openai_chat_completions",
     },
     "gpt-4.1-nano": {
         "model": "gpt-4.1-nano",
         "url": "https://api.openai.com/v1",
         "key": "OPENAI_API_KEY",
+        "type": "openai_chat_completions",
     },
     "gpt-4.1-mini": {
         "model": "gpt-4.1-mini",
         "url": "https://api.openai.com/v1",
         "key": "OPENAI_API_KEY",
+        "type": "openai_chat_completions",
     },
     "gpt-4.1": {
         "model": "gpt-4.1",
         "url": "https://api.openai.com/v1",
         "key": "OPENAI_API_KEY",
+        "type": "openai_chat_completions",
     },
     "gpt-5-nano": {
         "model": "gpt-5-nano",
         "url": "https://api.openai.com/v1",
         "key": "OPENAI_API_KEY",
+        "type": "openai_chat_completions",
     },
     "gpt-5-mini": {
         "model": "gpt-5-mini",
         "url": "https://api.openai.com/v1",
         "key": "OPENAI_API_KEY",
+        "type": "openai_chat_completions",
     },
     "gpt-5": {
         "model": "gpt-5",
         "url": "https://api.openai.com/v1",
         "key": "OPENAI_API_KEY",
+        "type": "openai_chat_completions",
     },
     "gpt-5.1": {
         "model": "gpt-5.1",
         "url": "https://api.openai.com/v1",
         "key": "OPENAI_API_KEY",
+        "type": "openai_chat_completions",
     },
     "gpt-5.2": {
         "model": "gpt-5.2",
         "url": "https://api.openai.com/v1",
         "key": "OPENAI_API_KEY",
+        "type": "openai_chat_completions",
     },
     # z-ai
     "glm-4.5": {
         "model": "z-ai/glm-4.5",
         "url": "https://api.pinference.ai/api/v1",
         "key": "PRIME_API_KEY",
+        "type": "openai_chat_completions",
     },
     "glm-4.5-air": {
         "model": "z-ai/glm-4.5-air",
         "url": "https://api.pinference.ai/api/v1",
         "key": "PRIME_API_KEY",
+        "type": "openai_chat_completions",
     },
     "glm-4.6": {
         "model": "z-ai/glm-4.6",
         "url": "https://api.pinference.ai/api/v1",
         "key": "PRIME_API_KEY",
+        "type": "openai_chat_completions",
     },
     "glm-4.7": {
         "model": "z-ai/glm-4.7",
         "url": "https://api.pinference.ai/api/v1",
         "key": "PRIME_API_KEY",
+        "type": "openai_chat_completions",
     },
 }
@@ -146,13 +146,12 @@ class TestFeature:
 
 ### Using Mocks
 
-The test suite provides mock OpenAI clients:
+The test suite provides a `MockClient` in `conftest.py` that implements the `Client` interface:
 
 ```python
-from tests.mock_openai_client import MockOpenAIClient
-
 def test_with_mock(mock_client):
-    env = vf.SingleTurnEnv(client=mock_client)
+    mock_client.set_default_responses(chat_response="test answer")
+    env = vf.SingleTurnEnv(client=mock_client, model="test")  # plus any other environment arguments you need
     # Test without real API calls
 ```
 
 
@@ -17,7 +17,7 @@ This section explains how to run evaluations with Verifiers environments. See [E
   - [TOML Configuration](#toml-configuration)
   - [Configuration Precedence](#configuration-precedence)
 
-Use `prime eval` to execute rollouts against any OpenAI-compatible model and report aggregate metrics.
+Use `prime eval` to execute rollouts against any supported model provider and report aggregate metrics. Supported providers include OpenAI-compatible APIs (the default) and the Anthropic Messages API (via `--api-client-type anthropic_messages`).
 
 ## Basic Usage
 
@@ -66,6 +66,7 @@ prime eval run my-env -x '{"max_turns": 20}'
 | `--model` | `-m` | `openai/gpt-4.1-mini` | Model name or endpoint alias |
 | `--api-base-url` | `-b` | `https://api.pinference.ai/api/v1` | API base URL |
 | `--api-key-var` | `-k` | `PRIME_API_KEY` | Environment variable containing API key |
+| `--api-client-type` | — | `openai_chat_completions` | Client type: `openai_chat_completions`, `openai_completions`, `openai_chat_completions_token`, or `anthropic_messages` |
 | `--endpoints-path` | `-e` | `./configs/endpoints.toml` | Path to TOML endpoints registry |
 | `--header` | — | — | Extra HTTP header (`Name: Value`), repeatable |
 
@@ -83,8 +84,17 @@ endpoint_id = "qwen3-235b-i"
 model = "qwen/qwen3-235b-a22b-instruct-2507"
 url = "https://api.pinference.ai/api/v1"
 key = "PRIME_API_KEY"
+
+[[endpoint]]
+endpoint_id = "claude-sonnet"
+model = "claude-sonnet-4-5-20250929"
+url = "https://api.anthropic.com"
+key = "ANTHROPIC_API_KEY"
+api_client_type = "anthropic_messages"
 ```
 
+Each endpoint entry supports an optional `api_client_type` field to select the client implementation (defaults to `"openai_chat_completions"`). Use `"anthropic_messages"` for Anthropic models when calling the Anthropic API directly.
+
 To define equivalent replicas, add multiple `[[endpoint]]` entries with the same `endpoint_id`.
 
 Then use the alias directly: