Skip to content

Commit 9cf161a

Browse files
abrichr and claude authored
fix: add DEBIAN_FRONTEND=noninteractive and 128GB OS disk (#38)
* fix: add DEBIAN_FRONTEND=noninteractive and 128GB disk for CLI path

  Docker install failed with a debconf Dialog frontend error on non-interactive SSH sessions. Also add --os-disk-size-gb 128 to the az CLI create path (SDK path already had it).

  Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>

* chore: sync beads state

---------

Co-authored-by: Claude Opus 4.6 <noreply@anthropic.com>
1 parent 406d982 commit 9cf161a

6 files changed

Lines changed: 15 additions & 10 deletions

File tree

.beads/beads.db-shm

0 Bytes
Binary file not shown.

.beads/beads.db-wal

177 KB
Binary file not shown.

.beads/issues.jsonl

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -13,5 +13,5 @@
1313
{"id":"openadapt-evals-hvm","title":"VL model fix PR #18 ready to merge","notes":"2026-02-08: openadapt-ml PR #18 was already merged on 2026-01-29. VL model fix is done.","status":"closed","priority":0,"issue_type":"task","owner":"richard.abrich@gmail.com","created_at":"2026-01-29T16:17:03.491938-05:00","created_by":"Richard Abrich","updated_at":"2026-02-08T12:55:19.233249-05:00","closed_at":"2026-02-08T12:55:19.233249-05:00","close_reason":"PR #18 already merged 2026-01-29"}
1414
{"id":"openadapt-evals-mx8","title":"Analyze evaluation results and publish findings","description":"After demo-conditioned evaluation completes, analyze results: success rates, failure modes, demo impact. Create data-driven roadmap for improvements.","status":"open","priority":1,"issue_type":"task","owner":"richard.abrich@gmail.com","created_at":"2026-02-14T12:23:06.328838-05:00","created_by":"Richard Abrich","updated_at":"2026-02-14T12:23:06.328838-05:00"}
1515
{"id":"openadapt-evals-sz4","title":"RCA: Windows product key prompt recurring issue","status":"closed","priority":0,"issue_type":"task","owner":"richard.abrich@gmail.com","created_at":"2026-01-20T18:59:36.266286-05:00","created_by":"Richard Abrich","updated_at":"2026-01-20T20:32:06.493102-05:00","closed_at":"2026-01-20T20:32:06.493102-05:00","close_reason":"RCA complete - root cause is VERSION mismatch (CLI=11, Dockerfile=11e). Fix documented in RECURRING_ISSUES.md and WINDOWS_PRODUCT_KEY_RCA.md"}
16-
{"id":"openadapt-evals-vcb","title":"Run demo-conditioned WAA evaluation","description":"Once demos are recorded, run WAA evaluation with demo-conditioned agents (RetrievalAugmentedAgent with real demos). Target: measure improvement over zero-shot baseline. Requires real demos from recording task.","notes":"PR #35 merged (v0.4.0): full pipeline implemented — record-waa (interactive WAA API recording via VNC), annotate (VLM annotation of screenshots), eval (delegates to eval-suite). 12 harder tasks defined (0/12 zero-shot). CI workflow added. PR #36 merged (v0.4.1): fixed PyPI README images. Next: spin up Azure VM, record demos for 12 harder tasks, annotate, run DC eval.","status":"open","priority":0,"issue_type":"task","owner":"richard.abrich@gmail.com","created_at":"2026-02-14T12:23:04.624305-05:00","created_by":"Richard Abrich","updated_at":"2026-02-24T02:00:07.491221-05:00"}
16+
{"id":"openadapt-evals-vcb","title":"Run demo-conditioned WAA evaluation","description":"Once demos are recorded, run WAA evaluation with demo-conditioned agents (RetrievalAugmentedAgent with real demos). Target: measure improvement over zero-shot baseline. Requires real demos from recording task.","notes":"PR #35 merged (v0.4.0): full pipeline implemented — record-waa (interactive WAA API recording via VNC), annotate (VLM annotation of screenshots), eval (delegates to eval-suite). 12 harder tasks defined (0/12 zero-shot). CI workflow added. PR #36 merged (v0.4.1): fixed PyPI README images. Next: spin up Azure VM, record demos for 12 harder tasks, annotate, run DC eval.","status":"open","priority":0,"issue_type":"task","owner":"richard.abrich@gmail.com","created_at":"2026-02-14T12:23:04.624305-05:00","created_by":"Richard Abrich","updated_at":"2026-02-24T10:42:20.670713-05:00"}
1717
{"id":"openadapt-evals-wis","title":"Add pre-flight check to detect Windows install issues","status":"closed","priority":1,"issue_type":"task","owner":"richard.abrich@gmail.com","created_at":"2026-01-20T18:59:36.865052-05:00","created_by":"Richard Abrich","updated_at":"2026-01-20T20:32:06.757261-05:00","closed_at":"2026-01-20T20:32:06.757261-05:00","close_reason":"Duplicate of openadapt-evals-0dt"}

openadapt_evals/benchmarks/vm_cli.py

Lines changed: 5 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -339,12 +339,13 @@ def cmd_create(args):
339339
return 1
340340
log("CREATE", "SSH ready")
341341

342-
# Install Docker with /mnt storage
343-
log("CREATE", "Installing Docker with /mnt storage...")
342+
# Install Docker with persistent storage
343+
log("CREATE", "Installing Docker with persistent storage...")
344344
docker_setup = """
345345
set -e
346-
sudo apt-get update -qq
347-
sudo apt-get install -y -qq docker.io
346+
export DEBIAN_FRONTEND=noninteractive
347+
sudo DEBIAN_FRONTEND=noninteractive apt-get update -qq
348+
sudo DEBIAN_FRONTEND=noninteractive apt-get install -y -qq docker.io
348349
sudo systemctl start docker
349350
sudo systemctl enable docker
350351
sudo usermod -aG docker $USER

openadapt_evals/infrastructure/azure_vm.py

Lines changed: 2 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -836,6 +836,8 @@ def _cli_create_vm(
836836
"--generate-ssh-keys",
837837
"--public-ip-sku",
838838
"Standard",
839+
"--os-disk-size-gb",
840+
"128",
839841
]
840842
)
841843

openadapt_evals/infrastructure/pool.py

Lines changed: 7 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -63,6 +63,7 @@ class PoolRunResult:
6363
# Docker setup script for WAA workers
6464
DOCKER_SETUP_SCRIPT = """
6565
set -e
66+
export DEBIAN_FRONTEND=noninteractive
6667
6768
# Wait for apt lock (unattended upgrades on fresh VMs)
6869
echo "Waiting for apt lock..."
@@ -71,8 +72,8 @@ class PoolRunResult:
7172
done
7273
echo "Apt lock released"
7374
74-
sudo apt-get update -qq
75-
sudo apt-get install -y -qq docker.io
75+
sudo DEBIAN_FRONTEND=noninteractive apt-get update -qq
76+
sudo DEBIAN_FRONTEND=noninteractive apt-get install -y -qq docker.io
7677
sudo systemctl start docker
7778
sudo systemctl enable docker
7879
sudo usermod -aG docker $USER
@@ -97,6 +98,7 @@ class PoolRunResult:
9798
# Docker setup script that pulls pre-built image from ACR instead of building
9899
DOCKER_SETUP_SCRIPT_WITH_ACR = """
99100
set -e
101+
export DEBIAN_FRONTEND=noninteractive
100102
101103
# Wait for apt lock (unattended upgrades on fresh VMs)
102104
echo "Waiting for apt lock..."
@@ -105,8 +107,8 @@ class PoolRunResult:
105107
done
106108
echo "Apt lock released"
107109
108-
sudo apt-get update -qq
109-
sudo apt-get install -y -qq docker.io
110+
sudo DEBIAN_FRONTEND=noninteractive apt-get update -qq
111+
sudo DEBIAN_FRONTEND=noninteractive apt-get install -y -qq docker.io
110112
sudo systemctl start docker
111113
sudo systemctl enable docker
112114
sudo usermod -aG docker $USER
@@ -160,7 +162,7 @@ class PoolRunResult:
160162
161163
# Set up socat proxy for evaluate server (Docker port forwarding doesn't work
162164
# due to QEMU's custom bridge networking with --cap-add NET_ADMIN)
163-
which socat >/dev/null 2>&1 || sudo apt-get install -y -qq socat
165+
which socat >/dev/null 2>&1 || sudo DEBIAN_FRONTEND=noninteractive apt-get install -y -qq socat
164166
killall socat 2>/dev/null || true
165167
sleep 2
166168
nohup socat TCP-LISTEN:5051,fork,reuseaddr EXEC:"docker exec -i winarena socat - TCP\\:127.0.0.1\\:5050" > /dev/null 2>&1 &

0 commit comments

Comments
 (0)