@@ -792,7 +792,7 @@ def test_full_pipeline_feature_to_verdict(self, db_session, sample_feature, tmp_
792792
793793 # The gate should evaluate (may pass or fail depending on validators)
794794 assert gate_result is not None
795- assert gate_result .verdict in ("passed" , "failed" , "partial " )
795+ assert gate_result .verdict in ("passed" , "failed" , "error " )
796796 assert gate_result .gate_mode == "all_pass"
797797 assert isinstance (gate_result .acceptance_results , list )
798798
@@ -1659,7 +1659,7 @@ def mock_turn_executor(run, spec):
16591659 assert isinstance (gate_result , GateResult ), (
16601660 f"Expected GateResult, got { type (gate_result )} "
16611661 )
1662- assert gate_result .verdict in ("passed" , "failed" , "partial " ), (
1662+ assert gate_result .verdict in ("passed" , "failed" , "error " ), (
16631663 f"Invalid verdict: '{ gate_result .verdict } '"
16641664 )
16651665 assert gate_result .gate_mode == "all_pass" , (
@@ -2032,8 +2032,8 @@ def never_completing_executor(run, spec):
20322032 assert run .final_verdict is not None , (
20332033 "final_verdict should be set after graceful termination"
20342034 )
2035- assert run .final_verdict in ("partial " , "passed" , "failed" ), (
2036- f"final_verdict should be partial /passed/failed, got '{ run .final_verdict } '"
2035+ assert run .final_verdict in ("error " , "passed" , "failed" ), (
2036+ f"final_verdict should be error /passed/failed, got '{ run .final_verdict } '"
20372037 )
20382038
20392039 def test_tokens_tracked_on_agent_run (self , db_session ):
@@ -2150,7 +2150,7 @@ class TestAcceptanceGateEvaluatesValidators:
21502150 3. ValidatorResult contains passed (bool), message (str), and score (float)
21512151 4. gate_mode='all_pass' requires ALL validators to pass for verdict='passed'
21522152 5. gate_mode='any_pass' requires at least ONE validator to pass for verdict='passed'
2153- 6. AgentRun.final_verdict is set to the gate's verdict (passed/failed/partial )
2153+ 6. AgentRun.final_verdict is set to the gate's verdict (passed/failed/error )
21542154 7. AgentRun.acceptance_results contains per-validator results as JSON array
21552155 8. An 'acceptance_check' event is recorded in agent_events with the gate results
21562156 """
@@ -2382,10 +2382,10 @@ def completing_executor(run, spec):
23822382 run_b = kernel_b .execute (spec_b , turn_executor = completing_executor )
23832383
23842384 assert run_b .final_verdict != "passed" , (
2385- f"all_pass with one failing: expected 'partial ' or 'failed', got '{ run_b .final_verdict } '"
2385+ f"all_pass with one failing: expected 'error ' or 'failed', got '{ run_b .final_verdict } '"
23862386 )
2387- assert run_b .final_verdict in ("partial " , "failed" ), (
2388- f"Expected 'partial ' or 'failed', got '{ run_b .final_verdict } '"
2387+ assert run_b .final_verdict in ("error " , "failed" ), (
2388+ f"Expected 'error ' or 'failed', got '{ run_b .final_verdict } '"
23892389 )
23902390
23912391 def test_step5_gate_mode_any_pass_requires_one_validator (
@@ -2427,7 +2427,7 @@ def test_step6_agent_run_final_verdict_set(
24272427 self , db_session , tmp_path
24282428 ):
24292429 """Step 6: Verify AgentRun.final_verdict is set to the gate's verdict
2430- (passed/failed/partial ).
2430+ (passed/failed/error ).
24312431 """
24322432 # Test passed verdict
24332433 spec , _ = self ._create_spec_with_file_validators (
@@ -2445,8 +2445,8 @@ def completing_executor(run, spec):
24452445 assert run .final_verdict is not None , (
24462446 "AgentRun.final_verdict must be set after acceptance gate evaluation"
24472447 )
2448- assert run .final_verdict in ("passed" , "failed" , "partial " ), (
2449- f"final_verdict must be one of passed/failed/partial , got '{ run .final_verdict } '"
2448+ assert run .final_verdict in ("passed" , "failed" , "error " ), (
2449+ f"final_verdict must be one of passed/failed/error , got '{ run .final_verdict } '"
24502450 )
24512451
24522452 # Verify it's persisted in the database
@@ -2708,8 +2708,8 @@ def completing_executor(run, spec):
27082708 assert run .final_verdict is not None , (
27092709 "AgentRun.final_verdict must be set after kernel execution"
27102710 )
2711- assert run .final_verdict in ("passed" , "failed" , "partial " ), (
2712- f"final_verdict must be passed/failed/partial , got '{ run .final_verdict } '"
2711+ assert run .final_verdict in ("passed" , "failed" , "error " ), (
2712+ f"final_verdict must be passed/failed/error , got '{ run .final_verdict } '"
27132713 )
27142714
27152715 # Now use sync_verdict to sync back to feature
@@ -3849,8 +3849,8 @@ def test_step6_acceptance_gate_produces_verdict(self, db_session):
38493849 assert run .final_verdict is not None , (
38503850 f"Run { run .id } : final_verdict must not be None"
38513851 )
3852- assert run .final_verdict in ("passed" , "failed" , "partial " ), (
3853- f"Run { run .id } : final_verdict must be passed/failed/partial , "
3852+ assert run .final_verdict in ("passed" , "failed" , "error " ), (
3853+ f"Run { run .id } : final_verdict must be passed/failed/error , "
38543854 f"got '{ run .final_verdict } '"
38553855 )
38563856
0 commit comments