From b445df436ec899abc04bbdda479782b90d8c11a1 Mon Sep 17 00:00:00 2001
From: Richard Abrich
Date: Fri, 6 Mar 2026 16:07:10 -0500
Subject: [PATCH] fix: default strict_setup_readiness to False to avoid false infra failures
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

The post-setup focus check (PR #107) defaults to strict mode, which marks
tasks as infrastructure failures when the a11y window enumeration can't
find the expected app title. In practice, LibreOffice windows take longer
to render titles than the check allows, causing ALL LibreOffice tasks to
fail as infra — even though the app IS open.

Changing default to False: focus check still runs and logs warnings, but
doesn't abort the task. The agent can recover from focus issues on its own
(it did in all prior trials without this check).

Use --strict-setup-readiness to opt into the fatal behavior when the a11y
detection is more reliable.

Co-Authored-By: Claude Opus 4.6
---
 openadapt_evals/adapters/waa/live.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/openadapt_evals/adapters/waa/live.py b/openadapt_evals/adapters/waa/live.py
index cdd0b3e..a20e499 100644
--- a/openadapt_evals/adapters/waa/live.py
+++ b/openadapt_evals/adapters/waa/live.py
@@ -382,7 +382,7 @@ class WAALiveConfig:
     force_tray_icons: bool = False
     reapply_clean_desktop_each_reset: bool = False
     waa_image_version: str | None = None
-    strict_setup_readiness: bool = True
+    strict_setup_readiness: bool = False
     setup_readiness_retries: int = 3