From bceaa2dba3d541a9ccea3efb6eeeeb27e2829f80 Mon Sep 17 00:00:00 2001 From: Bai Li Date: Thu, 30 Apr 2026 15:02:44 -0700 Subject: [PATCH 01/12] delete self-authoring --- .../e2e_employee_directory.yaml | 42 ------------ .../e2e_product_catalogue.yaml | 37 ---------- .../integration_csv_import.yaml | 33 --------- .../integration_entity_scope.yaml | 30 -------- .../integration_error_paths.yaml | 47 ------------- .../uipath-data-fabric/integration_files.yaml | 33 --------- .../integration_full_lifecycle.yaml | 52 -------------- .../integration_large_pagination.yaml | 37 ---------- .../integration_preseeded_entity.yaml | 68 ------------------- .../integration_query_filters.yaml | 58 ---------------- .../uipath-data-fabric/smoke_entities.yaml | 42 ------------ .../tasks/uipath-data-fabric/smoke_files.yaml | 27 -------- .../uipath-data-fabric/smoke_records.yaml | 49 ------------- .../e2e_02_ai_escalation_brownfield.yaml | 17 ----- .../e2e_04_multi_hitl_brownfield.yaml | 22 ------ .../e2e_05_expense_approval_brownfield.yaml | 22 ------ ...06_invoice_approval_greenfield_simple.yaml | 34 ---------- .../e2e_07_apptask_brownfield.yaml | 20 ------ .../quality_04_all_handles.yaml | 30 +------- .../quality_05_priority_and_timeout.yaml | 23 ------- .../quality_07_runtime_vars.yaml | 35 ---------- .../uipath-maestro-case/init_validate.yaml | 22 ------ .../hitl/quality_01_schema_design.yaml | 40 ----------- .../hitl/quality_02_result_downstream.yaml | 28 -------- .../hitl/quality_03_boolean_decision.yaml | 32 --------- .../hitl/quality_04_brownfield_insert.yaml | 23 ------- .../hitl/smoke_01_hitl_node_placed.yaml | 22 ------ .../hitl/smoke_02_completed_port_wired.yaml | 17 ----- .../hitl/smoke_03_multi_outcome_routing.yaml | 26 ------- .../smoke/init_validate.yaml | 23 ------- .../review_multi_project_solution.yaml | 31 --------- .../uipath-review/review_rpa_project.yaml | 23 ------- tests/tasks/uipath-rpa/coded_test_case.yaml | 35 ---------- .../uipath-solution-design/gap_detection.yaml | 29 -------- .../uipath-solution-design/pdd_to_sdd.yaml | 27 -------- .../product_selection.yaml | 21 ------ tests/tasks/uipath-tasks/e2e_fetch_tasks.yaml | 51 +------------- .../tasks/uipath-tasks/smoke_assignment.yaml | 31 --------- .../tasks/uipath-tasks/smoke_completion.yaml | 48 ------------- tests/tasks/uipath-tasks/smoke_discovery.yaml | 29 -------- 40 files changed, 2 insertions(+), 1314 deletions(-) diff --git a/tests/tasks/uipath-data-fabric/e2e_employee_directory.yaml b/tests/tasks/uipath-data-fabric/e2e_employee_directory.yaml index 4bfa2b0e9..aa08ccf4f 100644 --- a/tests/tasks/uipath-data-fabric/e2e_employee_directory.yaml +++ b/tests/tasks/uipath-data-fabric/e2e_employee_directory.yaml @@ -41,23 +41,6 @@ initial_prompt: | 2. How many employees are in each department? Use one filterGroup query per department to get the count. - Save a summary to report.json: - { - "entity_id": "", - "total_employees": 20, - "schema_evolved": true, - "performance_scores_set": 6, - "top_performers": [ - {"name": "", "score": , "department": ""} - ], - "department_counts": { - "Engineering": , - "Sales": , - "Finance": , - "HR": - } - } - Do NOT delete the entity. success_criteria: @@ -139,31 +122,6 @@ success_criteria: weight: 1.0 pass_threshold: 1.0 - - type: file_exists - description: "report.json was created" - path: "report.json" - weight: 1.0 - pass_threshold: 1.0 - - - type: json_check - description: "20 employees imported, schema evolved, 6 scores set, all 4 depts counted" - path: "report.json" - assertions: - - expression: "total_employees" - operator: equals - expected: 20 - - expression: "schema_evolved" - operator: equals - expected: true - - expression: "performance_scores_set" - operator: equals - expected: 6 - - expression: "length(top_performers)" - operator: gte - expected: 1 - weight: 5.0 - pass_threshold: 0.75 - post_run: - command: "python3 $SKILLS_REPO_PATH/tests/tasks/uipath-data-fabric/_shared/cleanup_entities.py" timeout: 60 diff --git a/tests/tasks/uipath-data-fabric/e2e_product_catalogue.yaml b/tests/tasks/uipath-data-fabric/e2e_product_catalogue.yaml index 4e283715d..d088f5c5a 100644 --- a/tests/tasks/uipath-data-fabric/e2e_product_catalogue.yaml +++ b/tests/tasks/uipath-data-fabric/e2e_product_catalogue.yaml @@ -37,18 +37,6 @@ initial_prompt: | - Confirm the final state: total products, how many are in stock, how many are Electronics. - Save a summary to report.json: - { - "entity_id": "", - "total_products": , - "electronics_count": , - "price_updated_count": 2, - "out_of_stock_count": 3, - "in_stock_count": , - "image_uploaded_to_sku": "", - "most_expensive_product_name": "" - } - Do NOT delete the entity. success_criteria: @@ -116,31 +104,6 @@ success_criteria: weight: 2.5 pass_threshold: 1.0 - - type: file_exists - description: "report.json was created" - path: "report.json" - weight: 1.0 - pass_threshold: 1.0 - - - type: json_check - description: "15 products, 5 Electronics, 2 price updates, 3 out of stock" - path: "report.json" - assertions: - - expression: "total_products" - operator: equals - expected: 15 - - expression: "electronics_count" - operator: equals - expected: 5 - - expression: "price_updated_count" - operator: equals - expected: 2 - - expression: "out_of_stock_count" - operator: equals - expected: 3 - weight: 5.0 - pass_threshold: 0.75 - post_run: - command: "python3 $SKILLS_REPO_PATH/tests/tasks/uipath-data-fabric/_shared/cleanup_entities.py" timeout: 60 diff --git a/tests/tasks/uipath-data-fabric/integration_csv_import.yaml b/tests/tasks/uipath-data-fabric/integration_csv_import.yaml index cf1853aa5..4ae0d31a0 100644 --- a/tests/tasks/uipath-data-fabric/integration_csv_import.yaml +++ b/tests/tasks/uipath-data-fabric/integration_csv_import.yaml @@ -42,17 +42,6 @@ initial_prompt: | 6. Verify the import: list records and check that rows were added. Note InsertedRecords and TotalRecords from the import response. - Save a summary to report.json: - { - "entity_id": "", - "entity_existed_already": , - "csv_headers": [""], - "csv_row_count": , - "csv_includes_system_fields": false, - "import_inserted_records": , - "import_total_records": - } - Use --output json on every uip df command. CSV headers must match entity field names exactly — case-sensitive. @@ -107,28 +96,6 @@ success_criteria: weight: 2.5 pass_threshold: 1.0 - - type: file_exists - description: "report.json was created" - path: "report.json" - weight: 1.0 - pass_threshold: 1.0 - - - type: json_check - description: "CSV has 4 rows, no system fields, import counts recorded" - path: "report.json" - assertions: - - expression: "csv_row_count" - operator: gte - expected: 4 - - expression: "csv_includes_system_fields" - operator: equals - expected: false - - expression: "import_total_records" - operator: gte - expected: 4 - weight: 3.0 - pass_threshold: 0.75 - post_run: - command: "python3 $SKILLS_REPO_PATH/tests/tasks/uipath-data-fabric/_shared/cleanup_entities.py" timeout: 60 diff --git a/tests/tasks/uipath-data-fabric/integration_entity_scope.yaml b/tests/tasks/uipath-data-fabric/integration_entity_scope.yaml index fef291f49..fe91ff50f 100644 --- a/tests/tasks/uipath-data-fabric/integration_entity_scope.yaml +++ b/tests/tasks/uipath-data-fabric/integration_entity_scope.yaml @@ -49,17 +49,6 @@ initial_prompt: | uip df entities create ... --folder 00000000-0000-0000-0000-000000000000 Record the error response. - Save a summary to report.json: - { - "tenant_entity_id": "", - "folder_entity_id": "", - "tenant_entity_visible_at_tenant": , - "tenant_entity_visible_from_folder_a": , - "folder_entity_isolated_from_folder_b": , - "invalid_folder_returned_error": , - "notes": "" - } - Do NOT delete entities — the test harness handles cleanup. success_criteria: @@ -111,25 +100,6 @@ success_criteria: weight: 1.5 pass_threshold: 0.0 - - type: file_exists - description: "report.json was created" - path: "report.json" - weight: 1.0 - pass_threshold: 1.0 - - - type: json_check - description: "Tenant entity visible and invalid folder returns error" - path: "report.json" - assertions: - - expression: "tenant_entity_visible_at_tenant" - operator: equals - expected: true - - expression: "invalid_folder_returned_error" - operator: equals - expected: true - weight: 4.0 - pass_threshold: 0.75 - post_run: - command: "python3 $SKILLS_REPO_PATH/tests/tasks/uipath-data-fabric/_shared/cleanup_entities.py" timeout: 60 diff --git a/tests/tasks/uipath-data-fabric/integration_error_paths.yaml b/tests/tasks/uipath-data-fabric/integration_error_paths.yaml index 329dee77d..3450600e5 100644 --- a/tests/tasks/uipath-data-fabric/integration_error_paths.yaml +++ b/tests/tasks/uipath-data-fabric/integration_error_paths.yaml @@ -79,31 +79,6 @@ initial_prompt: | 17. File upload local file not found: uip df files upload Score --file ./no-such-file.bin - Save a summary to report.json: - { - "entity_id": "", - "seed_record_id": "", - "errors": { - "required_field_missing": "", - "unique_constraint_insert": "", - "type_mismatch_insert": "", - "update_missing_id": "", - "update_record_not_found": "", - "unique_constraint_update": "", - "type_mismatch_update": "", - "delete_record_not_found": "", - "csv_header_mismatch": "", - "csv_malformed": "", - "file_upload_non_file_field": "", - "file_upload_record_not_found": "", - "file_upload_local_not_found": "" - }, - "all_errors_non_empty": , - "record_errors_captured": , - "import_errors_captured": , - "file_errors_captured": - } - Do NOT delete the entity — the test harness handles cleanup. success_criteria: @@ -163,28 +138,6 @@ success_criteria: weight: 2.0 pass_threshold: 1.0 - - type: file_exists - description: "report.json was created" - path: "report.json" - weight: 1.0 - pass_threshold: 1.0 - - - type: json_check - description: "Error scenarios captured per group — allows 1-2 misses per category" - path: "report.json" - assertions: - - expression: "record_errors_captured" - operator: gte - expected: 6 - - expression: "import_errors_captured" - operator: gte - expected: 1 - - expression: "file_errors_captured" - operator: gte - expected: 2 - weight: 4.0 - pass_threshold: 0.67 - post_run: - command: "python3 $SKILLS_REPO_PATH/tests/tasks/uipath-data-fabric/_shared/cleanup_entities.py" timeout: 60 diff --git a/tests/tasks/uipath-data-fabric/integration_files.yaml b/tests/tasks/uipath-data-fabric/integration_files.yaml index 2e08120d5..697a246a2 100644 --- a/tests/tasks/uipath-data-fabric/integration_files.yaml +++ b/tests/tasks/uipath-data-fabric/integration_files.yaml @@ -57,17 +57,6 @@ initial_prompt: | 12. Attempt to download again. The download should fail since the file was deleted. Record the result (expected: error or empty response). - Save a summary to report.json: - { - "entity_id": "", - "record_id": "", - "v1_sha256": "", - "download_sha256_matches_v1": , - "v2_sha256": "", - "overwrite_download_matches_v2": , - "post_delete_download_failed": - } - Do NOT delete the entity — only delete the file attachment. success_criteria: @@ -123,28 +112,6 @@ success_criteria: weight: 1.5 pass_threshold: 1.0 - - type: file_exists - description: "report.json was created" - path: "report.json" - weight: 1.0 - pass_threshold: 1.0 - - - type: json_check - description: "Byte integrity confirmed for v1, overwrite confirmed for v2, post-delete download failed" - path: "report.json" - assertions: - - expression: "download_sha256_matches_v1" - operator: equals - expected: true - - expression: "overwrite_download_matches_v2" - operator: equals - expected: true - - expression: "post_delete_download_failed" - operator: equals - expected: true - weight: 4.0 - pass_threshold: 0.75 - post_run: - command: "python3 $SKILLS_REPO_PATH/tests/tasks/uipath-data-fabric/_shared/cleanup_entities.py" timeout: 60 diff --git a/tests/tasks/uipath-data-fabric/integration_full_lifecycle.yaml b/tests/tasks/uipath-data-fabric/integration_full_lifecycle.yaml index f3b909be8..eaed9f90d 100644 --- a/tests/tasks/uipath-data-fabric/integration_full_lifecycle.yaml +++ b/tests/tasks/uipath-data-fabric/integration_full_lifecycle.yaml @@ -54,21 +54,6 @@ initial_prompt: | 10. Delete only the two records inserted in step 6. Do NOT delete the entity. - Save a summary to report.json: - { - "entity_id": "", - "entity_existed_already": , - "schema_ops": { - "field_id_retrieved_from": "entities get", - "addFields": [""], - "updateFields": [""] - }, - "records_inserted": ["", ""], - "query_result_count": , - "score_after_update": , - "records_deleted": ["", ""] - } - Do NOT use removeFields. Do NOT delete the entity. success_criteria: @@ -184,43 +169,6 @@ success_criteria: weight: 2.0 pass_threshold: 1.0 - - type: file_exists - description: "report.json was created" - path: "report.json" - weight: 1.0 - pass_threshold: 1.0 - - - type: file_contains - description: "Report includes schema operations (addFields and updateFields)" - path: "report.json" - includes: - - "addFields" - - "updateFields" - weight: 2.0 - pass_threshold: 1.0 - - - type: json_check - description: "Full lifecycle complete: field IDs from entities get, records inserted/deleted, update verified" - path: "report.json" - assertions: - - expression: "schema_ops.field_id_retrieved_from" - operator: equals - expected: "entities get" - - expression: "length(records_inserted)" - operator: gte - expected: 2 - - expression: "score_after_update" - operator: equals - expected: 99 - - expression: "query_result_count" - operator: gte - expected: 1 - - expression: "length(records_deleted)" - operator: gte - expected: 2 - weight: 4.0 - pass_threshold: 0.75 - post_run: - command: "python3 $SKILLS_REPO_PATH/tests/tasks/uipath-data-fabric/_shared/cleanup_entities.py" timeout: 60 diff --git a/tests/tasks/uipath-data-fabric/integration_large_pagination.yaml b/tests/tasks/uipath-data-fabric/integration_large_pagination.yaml index c9c5f5d34..8fb4fbae2 100644 --- a/tests/tasks/uipath-data-fabric/integration_large_pagination.yaml +++ b/tests/tasks/uipath-data-fabric/integration_large_pagination.yaml @@ -65,18 +65,6 @@ initial_prompt: | - every collected record has Active=true - total count == 300 - Save a summary to report.json: - { - "entity_id": "", - "import_count": , - "pagination_pages_fetched": , - "pagination_total_unique_ids": , - "pagination_no_duplicates": , - "filtered_pages_fetched": , - "filtered_active_count": , - "filtered_all_active": - } - Do NOT delete the entity — the test harness handles cleanup. success_criteria: @@ -118,31 +106,6 @@ success_criteria: weight: 1.0 pass_threshold: 1.0 - - type: file_exists - description: "report.json was created" - path: "report.json" - weight: 1.0 - pass_threshold: 1.0 - - - type: json_check - description: "500 records paginated without duplicates; 300 Active=true records confirmed" - path: "report.json" - assertions: - - expression: "pagination_total_unique_ids" - operator: equals - expected: 500 - - expression: "pagination_no_duplicates" - operator: equals - expected: true - - expression: "filtered_active_count" - operator: equals - expected: 300 - - expression: "filtered_all_active" - operator: equals - expected: true - weight: 5.0 - pass_threshold: 0.75 - post_run: - command: "python3 $SKILLS_REPO_PATH/tests/tasks/uipath-data-fabric/_shared/cleanup_entities.py" timeout: 60 diff --git a/tests/tasks/uipath-data-fabric/integration_preseeded_entity.yaml b/tests/tasks/uipath-data-fabric/integration_preseeded_entity.yaml index 03a394a83..fa80d2ed7 100644 --- a/tests/tasks/uipath-data-fabric/integration_preseeded_entity.yaml +++ b/tests/tasks/uipath-data-fabric/integration_preseeded_entity.yaml @@ -103,25 +103,6 @@ initial_prompt: | Verify the restore (confirm Notes == null). Save the record ID you modified. - Save a summary to report.json: - { - "entity_found": true, - "entity_seeded_now": , - "entity_id": "", - "field_count": , - "query_active_true_count": , - "query_score_gt_7_count": , - "query_title_exact_count": , - "query_title_contains_count": , - "query_score_gte7_and_active_true_count": , - "sort_highest_score": , - "pagination_total_records": , - "pagination_no_duplicates": , - "update_record_id": "", - "update_verified": , - "restore_verified": - } - Do NOT delete any records. Do NOT delete the entity. success_criteria: @@ -205,53 +186,4 @@ success_criteria: weight: 2.0 pass_threshold: 1.0 - - type: file_exists - description: "report.json was created" - path: "report.json" - weight: 1.0 - pass_threshold: 1.0 - - - type: json_check - description: "Entity found, query counts match seed data, sort and pagination correct" - path: "report.json" - assertions: - - expression: "entity_found" - operator: equals - expected: true - - expression: "field_count" - operator: gte - expected: 7 - - expression: "query_active_true_count" - operator: equals - expected: 12 - - expression: "query_score_gt_7_count" - operator: equals - expected: 6 - - expression: "query_title_exact_count" - operator: equals - expected: 1 - - expression: "query_title_contains_count" - operator: equals - expected: 3 - - expression: "query_score_gte7_and_active_true_count" - operator: equals - expected: 7 - - expression: "sort_highest_score" - operator: gte - expected: 10 - - expression: "pagination_total_records" - operator: equals - expected: 20 - - expression: "pagination_no_duplicates" - operator: equals - expected: true - - expression: "update_verified" - operator: equals - expected: true - - expression: "restore_verified" - operator: equals - expected: true - weight: 6.0 - pass_threshold: 0.75 - # No post_run: CodeEvalTestEntity is a shared persistent fixture — never deleted between runs. diff --git a/tests/tasks/uipath-data-fabric/integration_query_filters.yaml b/tests/tasks/uipath-data-fabric/integration_query_filters.yaml index de25d6a37..e9a4ba00e 100644 --- a/tests/tasks/uipath-data-fabric/integration_query_filters.yaml +++ b/tests/tasks/uipath-data-fabric/integration_query_filters.yaml @@ -67,21 +67,6 @@ initial_prompt: | 10. Delete the 4 records you inserted in step 3. - Save a summary to report.json: - { - "entity_id": "", - "records_inserted": ["", "", "", ""], - "and_query_count": , - "or_query_count": , - "nested_query_count": , - "sort_first_value": , - "projection_value_absent": , - "projection_status_absent": , - "pagination_total_ids": , - "pagination_no_duplicates": , - "records_deleted": [""] - } - Use --output json on every uip df command. Pagination must use --limit and --cursor CLI flags — never body keys. @@ -158,49 +143,6 @@ success_criteria: weight: 2.0 pass_threshold: 1.0 - - type: file_exists - description: "report.json was created" - path: "report.json" - weight: 1.0 - pass_threshold: 1.0 - - - type: json_check - description: "AND→1, OR→2, nested→3, sort first=750, projection excludes Value/Status, pagination 4 unique IDs" - path: "report.json" - assertions: - - expression: "and_query_count" - operator: equals - expected: 1 - - expression: "or_query_count" - operator: equals - expected: 2 - - expression: "nested_query_count" - operator: equals - expected: 3 - - expression: "sort_first_value" - operator: equals - expected: 750.0 - - expression: "projection_value_absent" - operator: equals - expected: true - - expression: "projection_status_absent" - operator: equals - expected: true - - expression: "pagination_total_ids" - operator: equals - expected: 4 - - expression: "pagination_no_duplicates" - operator: equals - expected: true - - expression: "length(records_inserted)" - operator: gte - expected: 4 - - expression: "length(records_deleted)" - operator: gte - expected: 4 - weight: 5.0 - pass_threshold: 0.75 - post_run: - command: "python3 $SKILLS_REPO_PATH/tests/tasks/uipath-data-fabric/_shared/cleanup_entities.py" timeout: 60 diff --git a/tests/tasks/uipath-data-fabric/smoke_entities.yaml b/tests/tasks/uipath-data-fabric/smoke_entities.yaml index 3b35f1e15..45023f3d5 100644 --- a/tests/tasks/uipath-data-fabric/smoke_entities.yaml +++ b/tests/tasks/uipath-data-fabric/smoke_entities.yaml @@ -39,16 +39,6 @@ initial_prompt: | would come from Fields[].ID in the entities get response) in the updateFields body. - Save a summary to report.json with the bodies and commands you CONSTRUCTED - (fill these in regardless of whether the commands returned auth errors): - { - "commands_used": [""], - "create_body": { "fields": [ ... ] }, - "addFields_body": { "addFields": [ ... ] }, - "updateFields_body": { "updateFields": [ ... ] }, - "field_id_source": "entities get" - } - Additional constraints: - Use --output json on every uip df command. - Do NOT use removeFields. Do NOT delete any entity. @@ -102,35 +92,3 @@ success_criteria: weight: 1.0 pass_threshold: 1.0 - - type: file_exists - description: "report.json was created" - path: "report.json" - weight: 1.0 - pass_threshold: 1.0 - - - type: file_contains - description: "Entity create and addFields bodies use fieldName key (not name)" - path: "report.json" - includes: - - "fieldName" - weight: 2.0 - pass_threshold: 1.0 - - - type: file_contains - description: "Report includes both addFields and updateFields operations" - path: "report.json" - includes: - - "addFields" - - "updateFields" - weight: 2.0 - pass_threshold: 1.0 - - - type: json_check - description: "Field IDs sourced from entities get" - path: "report.json" - assertions: - - expression: "field_id_source" - operator: equals - expected: "entities get" - weight: 1.5 - pass_threshold: 1.0 diff --git a/tests/tasks/uipath-data-fabric/smoke_files.yaml b/tests/tasks/uipath-data-fabric/smoke_files.yaml index c274137e6..882083cc6 100644 --- a/tests/tasks/uipath-data-fabric/smoke_files.yaml +++ b/tests/tasks/uipath-data-fabric/smoke_files.yaml @@ -37,15 +37,6 @@ initial_prompt: | 4. Delete the file attachment from that field: uip df files delete doc-001-ent rec-001-id Attachment - Save a summary to report.json with the commands you ran and what you observed - (fill these in based on what you sent, not the error responses): - { - "commands_used": [""], - "upload_command_uses_positional_args": true, - "download_uses_destination_flag": true, - "delete_positional_args": ["", "", ""] - } - Additional constraints: - Use --output json on every uip df command. - The download flag is --destination (not --output). @@ -90,21 +81,3 @@ success_criteria: weight: 1.0 pass_threshold: 1.0 - - type: file_exists - description: "report.json was created" - path: "report.json" - weight: 1.0 - pass_threshold: 1.0 - - - type: json_check - description: "Upload uses positional args and download uses --destination flag" - path: "report.json" - assertions: - - expression: "upload_command_uses_positional_args" - operator: equals - expected: true - - expression: "download_uses_destination_flag" - operator: equals - expected: true - weight: 2.5 - pass_threshold: 1.0 diff --git a/tests/tasks/uipath-data-fabric/smoke_records.yaml b/tests/tasks/uipath-data-fabric/smoke_records.yaml index 5091ed641..b08e49844 100644 --- a/tests/tasks/uipath-data-fabric/smoke_records.yaml +++ b/tests/tasks/uipath-data-fabric/smoke_records.yaml @@ -45,20 +45,6 @@ initial_prompt: | 8. Delete the record from step 1 using records delete. Use placeholder record ID "id-single". - Save a summary to report.json with the bodies and commands you CONSTRUCTED - (fill these in based on what you sent, not the error responses): - { - "commands_used": [""], - "single_insert_uses_object": true, - "batch_insert_uses_array": true, - "get_used_record_id": true, - "query_filter": { ... the filterGroup JSON used ... }, - "pagination_method": "cursor", - "single_update_body_has_id": true, - "batch_update_all_have_id": true, - "delete_attempted": true - } - Additional constraint: - Use --output json on every uip df command. @@ -135,38 +121,3 @@ success_criteria: weight: 1.0 pass_threshold: 1.0 - - type: file_exists - description: "report.json was created" - path: "report.json" - weight: 1.0 - pass_threshold: 1.0 - - - type: file_contains - description: "Query body uses filterGroup key" - path: "report.json" - includes: - - "filterGroup" - weight: 2.0 - pass_threshold: 1.0 - - - type: json_check - description: "Array routing, cursor pagination, Id in update bodies, and delete confirmed" - path: "report.json" - assertions: - - expression: "batch_insert_uses_array" - operator: equals - expected: true - - expression: "pagination_method" - operator: equals - expected: "cursor" - - expression: "single_update_body_has_id" - operator: equals - expected: true - - expression: "batch_update_all_have_id" - operator: equals - expected: true - - expression: "delete_attempted" - operator: equals - expected: true - weight: 3.0 - pass_threshold: 0.75 diff --git a/tests/tasks/uipath-human-in-the-loop/e2e_02_ai_escalation_brownfield.yaml b/tests/tasks/uipath-human-in-the-loop/e2e_02_ai_escalation_brownfield.yaml index 40eaaacc0..3832fe4a8 100644 --- a/tests/tasks/uipath-human-in-the-loop/e2e_02_ai_escalation_brownfield.yaml +++ b/tests/tasks/uipath-human-in-the-loop/e2e_02_ai_escalation_brownfield.yaml @@ -42,14 +42,6 @@ initial_prompt: | make the final routing decision before the complaint is acted on. Insert a HITL node in the appropriate place, wire it, and validate. - Save results to report.json: - { - "hitl_node_id": "", - "inserted_position": "", - "handles_wired": [""], - "validation_passed": true - } - success_criteria: - type: file_contains description: "HITL node is present in the flow file" @@ -75,12 +67,3 @@ success_criteria: weight: 2.0 pass_threshold: 1.0 - - type: json_check - description: "report.json confirms validation passed" - path: "report.json" - assertions: - - expression: "validation_passed" - operator: equals - expected: true - weight: 2.5 - pass_threshold: 1.0 diff --git a/tests/tasks/uipath-human-in-the-loop/e2e_04_multi_hitl_brownfield.yaml b/tests/tasks/uipath-human-in-the-loop/e2e_04_multi_hitl_brownfield.yaml index a1f1d792f..26a1280c6 100644 --- a/tests/tasks/uipath-human-in-the-loop/e2e_04_multi_hitl_brownfield.yaml +++ b/tests/tasks/uipath-human-in-the-loop/e2e_04_multi_hitl_brownfield.yaml @@ -47,16 +47,6 @@ initial_prompt: | Wire the completed handles for both HITL nodes to their respective downstream steps. Validate the full flow after both nodes are added. - Save results to report.json: - { - "hitl_nodes": [ - {"id": "", "label": "