Skip to content

Commit cfaf123

Browse files
fix: rm callisto refs
1 parent 38ef6c1 commit cfaf123

File tree

4 files changed

+25
-28
lines changed

4 files changed

+25
-28
lines changed

.gitignore

Lines changed: 0 additions & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -172,15 +172,6 @@ runs/*.jsonl
172172
# Datasets
173173

174174
datasets/
175-
176-
# Callisto
177-
178-
callisto/challenges/public*
179-
180-
# JSON we want
181-
182-
!callisto/analysis/openai_challenges.json
183-
184175
*.parquet
185176
*.json
186177
*.csv

.pre-commit-config.yaml

Lines changed: 0 additions & 12 deletions
Original file line numberDiff line numberDiff line change
@@ -74,7 +74,6 @@ repos:
7474
- "types-PyYAML"
7575
- "types-requests"
7676
- "types-setuptools"
77-
exclude: (callisto/scripts/|scripts/challenge_manager\.py)
7877

7978
- repo: local
8079
hooks:
@@ -90,14 +89,3 @@ repos:
9089
entry: .hooks/prettier.sh
9190
language: script
9291
types: [json, yaml]
93-
94-
- id: check-challenges
95-
name: Check challenge updates
96-
entry: python scripts/challenge_manager.py --check
97-
language: python
98-
pass_filenames: false
99-
always_run: true
100-
files: ^callisto/challenges/
101-
additional_dependencies:
102-
- pyyaml
103-
- jinja2

.vscode/settings.json

Lines changed: 18 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,18 @@
1+
{
2+
"[python]": {
3+
"editor.formatOnSave": true,
4+
"editor.codeActionsOnSave": {
5+
"source.fixAll": "explicit",
6+
"source.organizeImports": "explicit"
7+
},
8+
"editor.defaultFormatter": "charliermarsh.ruff"
9+
},
10+
"python.testing.pytestArgs": [
11+
"tests"
12+
],
13+
"python.testing.unittestEnabled": false,
14+
"python.testing.pytestEnabled": true,
15+
"mypy.runUsingActiveInterpreter": true,
16+
"debugpy.debugJustMyCode": false,
17+
"jupyter.debugJustMyCode": false
18+
}

airtbench/main.py

Lines changed: 7 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -41,7 +41,7 @@
4141

4242
@cyclopts.Parameter(name="*", group="args")
4343
@dataclass
44-
class CallistoArgs:
44+
class AIRTBenchArgs:
4545
model: str
4646
"""Model to use for inference"""
4747
platform_api_key: str
@@ -81,7 +81,7 @@ class DreadnodeArgs:
8181
"""Dreadnode API token"""
8282
local_dir: str | None = None
8383
"""Local directory to store data in"""
84-
project: str = "callisto"
84+
project: str = "airtbench"
8585
"""Project name"""
8686

8787

@@ -138,7 +138,7 @@ async def validate_api_key(api_key: str) -> bool:
138138
try:
139139
# Use a bogus flag to test the API key with a standard challenge
140140
test_challenge_id = "pieceofcake"
141-
test_flag = "gAAAAAbogus_callisto_test_flag_for_validation"
141+
test_flag = "gAAAAAbogus_airtbench_test_flag_for_validation"
142142

143143
async with aiohttp.ClientSession() as session:
144144
url = f"{os.environ.get('CRUCIBLE_URL', 'https://platform.dreadnode.io')}/api/challenges/{test_challenge_id}/submit-flag"
@@ -198,7 +198,7 @@ async def check_challenge_availability(challenge_id: str, api_key: str) -> bool:
198198

199199
@dn.task(name="Step")
200200
async def run_step(
201-
args: CallistoArgs,
201+
args: AIRTBenchArgs,
202202
challenge: Challenge,
203203
pipeline: rg.ChatPipeline,
204204
kernel: PythonKernel,
@@ -489,7 +489,7 @@ async def check_for_flags(content: str) -> bool:
489489

490490
@dn.task(name="Attempt challenge")
491491
async def attempt_challenge(
492-
args: CallistoArgs,
492+
args: AIRTBenchArgs,
493493
challenge: Challenge,
494494
docker_image: str,
495495
) -> None:
@@ -651,7 +651,7 @@ def on_backoff(details: backoff.types.Details) -> None:
651651
@app.default
652652
async def main(
653653
*,
654-
args: CallistoArgs,
654+
args: AIRTBenchArgs,
655655
dn_args: DreadnodeArgs
656656
| None = None, # Has to be None even though no interior fields are required
657657
) -> None:
@@ -674,7 +674,7 @@ async def main(
674674

675675
# Build the container
676676
image = build_container(
677-
"callisto",
677+
"airtbench",
678678
g_container_dir / "Dockerfile",
679679
g_container_dir,
680680
memory_limit=args.memory_limit,

0 commit comments

Comments
 (0)