feat(governance): 新增 release readiness readback
All checks were successful
Code Review / ai-code-review (push) Successful in 19s
CD Pipeline / tests (push) Successful in 1m28s
CD Pipeline / build-and-deploy (push) Successful in 4m46s
CD Pipeline / post-deploy-checks (push) Successful in 20s

This commit is contained in:
Your Name
2026-06-14 04:20:22 +08:00
parent f0f0adde1c
commit 755553e64f
13 changed files with 1663 additions and 8 deletions

View File

@@ -136,6 +136,9 @@ from src.services.ai_agent_result_capture_owner_acceptance_readback_preflight_ho
from src.services.ai_agent_result_capture_owner_approved_preflight_release_package import (
load_latest_ai_agent_result_capture_owner_approved_preflight_release_package,
)
from src.services.ai_agent_result_capture_owner_approved_release_readiness_readback import (
load_latest_ai_agent_result_capture_owner_approved_release_readiness_readback,
)
from src.services.ai_agent_result_capture_promotion_approval_gate import (
load_latest_ai_agent_result_capture_promotion_approval_gate,
)
@@ -1983,6 +1986,37 @@ async def get_agent_result_capture_owner_approved_preflight_release_package() ->
) from exc
@router.get(
"/agent-result-capture-owner-approved-release-readiness-readback",
response_model=dict[str, Any],
summary="取得 AI Agent result capture owner-approved release readiness readback",
description=(
"讀取最新已提交的 P2-130 owner-approved release readiness readback"
"此端點只回傳 release readiness readback、owner release readiness check、"
"live apply readiness gate、rollback readiness check、blocked readiness transition 與 operator handoff"
"不批准 owner release、不批准 maintenance window、不釋放 live apply、不套用 writer、不寫 receipt、"
"不寫 result capture、learning、PlayBook trust、reviewer queue、Gateway queue不送 Telegram、"
"不呼叫 Bot API、不讀 secret。"
),
)
async def get_agent_result_capture_owner_approved_release_readiness_readback() -> dict[str, Any]:
"""Return the latest read-only owner-approved release readiness readback."""
try:
payload = await asyncio.to_thread(load_latest_ai_agent_result_capture_owner_approved_release_readiness_readback)
return redact_public_lan_topology(payload)
except FileNotFoundError as exc:
raise HTTPException(
status_code=status.HTTP_404_NOT_FOUND,
detail=str(exc),
) from exc
except (json.JSONDecodeError, ValueError) as exc:
logger.error("ai_agent_result_capture_owner_approved_release_readiness_readback_invalid", error=str(exc))
raise HTTPException(
status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
detail="AI Agent result capture owner-approved release readiness readback 無效",
) from exc
@router.get(
"/agent-owner-approved-fixture-dry-run",
response_model=dict[str, Any],

View File

@@ -0,0 +1,420 @@
"""
AI Agent result capture owner-approved release readiness readback snapshot.
Loads the latest committed P2-130 owner-approved release readiness readback.
This module validates committed evidence only; it never approves owner release,
approves maintenance windows, releases live apply, applies writers, writes
receipts, writes result captures, writes learning records, updates PlayBook
trust, writes reviewer / Gateway queues, sends Telegram messages, reads
secrets, or performs destructive operations.
"""
from __future__ import annotations
import json
from pathlib import Path
from typing import Any
from src.services.snapshot_paths import default_evaluations_dir
_DEFAULT_EVALUATIONS_DIR = default_evaluations_dir(Path(__file__))
_SNAPSHOT_PATTERN = "ai_agent_result_capture_owner_approved_release_readiness_readback_*.json"
_SCHEMA_VERSION = "ai_agent_result_capture_owner_approved_release_readiness_readback_v1"
_RUNTIME_AUTHORITY = "result_capture_owner_approved_release_readiness_readback_only_no_live_write"
def load_latest_ai_agent_result_capture_owner_approved_release_readiness_readback(
evaluations_dir: Path | None = None,
) -> dict[str, Any]:
"""Load the newest committed owner-approved release readiness readback."""
directory = evaluations_dir or _DEFAULT_EVALUATIONS_DIR
candidates = sorted(directory.glob(_SNAPSHOT_PATTERN))
if not candidates:
raise FileNotFoundError(f"no AI Agent result capture owner-approved release readiness readback snapshots found in {directory}")
latest = candidates[-1]
with latest.open(encoding="utf-8") as handle:
payload = json.load(handle)
if not isinstance(payload, dict):
raise ValueError(f"{latest}: expected JSON object")
label = str(latest)
_require_schema(payload, label)
_require_prior(payload, label)
_require_truth(payload, label)
_require_release_readbacks(payload, label)
_require_owner_release_checks(payload, label)
_require_live_apply_readiness_gates(payload, label)
_require_rollback_readiness(payload, label)
_require_blocked_transitions(payload, label)
_require_actions(payload, label)
_require_display_redaction(payload, label)
_require_no_forbidden_display_terms(payload, label)
_require_rollup_consistency(payload, label)
return payload
def _require_schema(payload: dict[str, Any], label: str) -> None:
if payload.get("schema_version") != _SCHEMA_VERSION:
raise ValueError(f"{label}: expected schema_version={_SCHEMA_VERSION}")
status = payload.get("program_status") or {}
expected = {
"current_priority": "P2",
"current_task_id": "P2-130",
"next_task_id": "P2-131",
"read_only_mode": True,
"runtime_authority": _RUNTIME_AUTHORITY,
"overall_completion_percent": 100,
}
mismatches = _mismatches(status, expected)
if mismatches:
raise ValueError(f"{label}: program_status mismatch: {mismatches}")
if not status.get("status_note"):
raise ValueError(f"{label}: program_status.status_note is required")
def _require_prior(payload: dict[str, Any], label: str) -> None:
prior = payload.get("prior_owner_approved_preflight_release_package") or {}
expected = {
"schema_version": "ai_agent_result_capture_owner_approved_preflight_release_package_v1",
"owner_approved_release_package_count": 5,
"release_preflight_check_count": 5,
"live_apply_release_gate_count": 5,
"rollback_release_check_count": 5,
"blocked_release_transition_count": 6,
"operator_action_count": 5,
"approval_required_total": 8,
"blocked_total": 9,
"owner_release_approved_count": 0,
"maintenance_window_approved_count": 0,
"rollback_owner_confirmed_count": 0,
"post_release_verifier_ready_count": 0,
"live_apply_release_pass_count": 0,
"writer_apply_count": 0,
"execution_apply_count": 0,
"receipt_write_count": 0,
"result_capture_write_count": 0,
"learning_write_count": 0,
"playbook_trust_write_count": 0,
"reviewer_queue_write_count": 0,
"gateway_queue_write_count": 0,
"telegram_send_count": 0,
"bot_api_call_count": 0,
"report_receipt_write_count": 0,
}
mismatches = _mismatches(prior, expected)
if mismatches:
raise ValueError(f"{label}: prior_owner_approved_preflight_release_package mismatch: {mismatches}")
if not prior.get("readiness_note"):
raise ValueError(f"{label}: prior_owner_approved_preflight_release_package.readiness_note is required")
def _require_truth(payload: dict[str, Any], label: str) -> None:
truth = payload.get("release_readiness_truth") or {}
required_true = {
"p2_129_release_package_loaded",
"release_readiness_readback_ready",
"owner_release_review_required",
"maintenance_window_review_required",
"live_apply_readiness_hold_active",
"rollback_readiness_required",
"post_release_verifier_required",
"redaction_review_required",
"release_readiness_readback_only",
}
missing = sorted(field for field in required_true if truth.get(field) is not True)
if missing:
raise ValueError(f"{label}: release readiness readback flags must remain true: {missing}")
required_false = {
"owner_release_approved",
"maintenance_window_approved",
"rollback_owner_confirmed",
"post_release_verifier_ready",
"release_readiness_passed",
"live_apply_release_passed",
"writer_apply_enabled",
"execution_apply_enabled",
"receipt_write_enabled",
"reviewer_queue_write_enabled",
"gateway_queue_write_enabled",
"telegram_send_enabled",
"bot_api_call_enabled",
"report_receipt_write_enabled",
"result_capture_write_enabled",
"learning_write_enabled",
"playbook_trust_write_enabled",
"production_write_enabled",
"secret_read_enabled",
"destructive_operation_enabled",
}
unsafe = sorted(field for field in required_false if truth.get(field) is not False)
if unsafe:
raise ValueError(f"{label}: live readiness/send/write flags must remain false: {unsafe}")
zero_counts = {
"owner_release_approved_count",
"maintenance_window_approved_count",
"rollback_owner_confirmed_count",
"post_release_verifier_ready_count",
"release_readiness_pass_count",
"live_apply_release_pass_count",
"writer_apply_count",
"execution_apply_count",
"receipt_write_count",
"reviewer_queue_write_count",
"gateway_queue_write_count",
"telegram_send_count",
"bot_api_call_count",
"report_receipt_write_count",
"result_capture_write_count",
"learning_write_count",
"playbook_trust_write_count",
"production_write_count",
"secret_read_count",
"destructive_operation_count",
}
non_zero = sorted(field for field in zero_counts if truth.get(field) != 0)
if non_zero:
raise ValueError(f"{label}: release readiness live counters must remain zero: {non_zero}")
if not truth.get("truth_note"):
raise ValueError(f"{label}: release_readiness_truth.truth_note is required")
def _require_release_readbacks(payload: dict[str, Any], label: str) -> None:
items = payload.get("release_readiness_readbacks") or []
required = {
"readback_release_readiness_result_capture_writer",
"readback_release_readiness_learning_writer",
"readback_release_readiness_playbook_trust_writer",
"readback_release_readiness_reviewer_queue_writer",
"readback_release_readiness_gateway_queue_writer",
}
ids = {item.get("readback_id") for item in items}
if ids != required:
raise ValueError(f"{label}: release readiness readbacks must match {sorted(required)}")
for item in items:
item_id = item.get("readback_id")
if item.get("readback_mode") != "owner_approved_release_readiness_readback":
raise ValueError(f"{label}: release readiness readback {item_id} mode is invalid")
if item.get("release_readiness_passed") is not False or item.get("owner_release_approved") is not False:
raise ValueError(f"{label}: release readiness readback {item_id} must stay unpassed and unapproved")
if item.get("status") not in {"ready_for_owner_readback", "approval_required", "blocked_by_policy"}:
raise ValueError(f"{label}: release readiness readback {item_id} status is invalid")
if not item.get("readiness_summary") or not _is_redacted_sha256(item.get("evidence_hash")):
raise ValueError(f"{label}: release readiness readback {item_id} must include summary and redacted evidence_hash")
def _require_owner_release_checks(payload: dict[str, Any], label: str) -> None:
items = payload.get("owner_release_readiness_checks") or []
required = {
"owner_release_readiness_result_capture_writer",
"owner_release_readiness_learning_writer",
"owner_release_readiness_playbook_trust_writer",
"owner_release_readiness_reviewer_queue_writer",
"owner_release_readiness_gateway_queue_writer",
}
ids = {item.get("check_id") for item in items}
if ids != required:
raise ValueError(f"{label}: owner release readiness checks must match {sorted(required)}")
for item in items:
item_id = item.get("check_id")
if item.get("check_mode") != "owner_release_readiness_check":
raise ValueError(f"{label}: owner release readiness check {item_id} mode is invalid")
if item.get("owner_release_review_required") is not True or item.get("owner_release_approved") is not False:
raise ValueError(f"{label}: owner release readiness check {item_id} must remain required and unapproved")
if item.get("status") not in {"ready_for_owner_readback", "approval_required", "blocked_by_policy"}:
raise ValueError(f"{label}: owner release readiness check {item_id} status is invalid")
if not item.get("required_before_live_apply"):
raise ValueError(f"{label}: owner release readiness check {item_id} required_before_live_apply is required")
def _require_live_apply_readiness_gates(payload: dict[str, Any], label: str) -> None:
items = payload.get("live_apply_readiness_gates") or []
required = {
"live_apply_readiness_result_capture",
"live_apply_readiness_learning",
"live_apply_readiness_playbook_trust",
"live_apply_readiness_reviewer_queue",
"live_apply_readiness_gateway_queue",
}
ids = {item.get("gate_id") for item in items}
if ids != required:
raise ValueError(f"{label}: live apply readiness gates must match {sorted(required)}")
for item in items:
item_id = item.get("gate_id")
if item.get("gate_mode") != "live_apply_readiness_gate":
raise ValueError(f"{label}: live apply readiness gate {item_id} mode is invalid")
if item.get("release_readiness_passed") is not False or item.get("live_apply_release_enabled") is not False:
raise ValueError(f"{label}: live apply readiness gate {item_id} must stay held and disabled")
if item.get("status") not in {"ready_for_owner_readback", "approval_required", "blocked_by_policy"}:
raise ValueError(f"{label}: live apply readiness gate {item_id} status is invalid")
if not item.get("hold_reason") or not item.get("release_condition"):
raise ValueError(f"{label}: live apply readiness gate {item_id} hold_reason and release_condition are required")
def _require_rollback_readiness(payload: dict[str, Any], label: str) -> None:
items = payload.get("rollback_readiness_checks") or []
required = {
"rollback_readiness_result_capture",
"rollback_readiness_learning",
"rollback_readiness_playbook_trust",
"rollback_readiness_reviewer_queue",
"rollback_readiness_gateway_queue",
}
ids = {item.get("check_id") for item in items}
if ids != required:
raise ValueError(f"{label}: rollback readiness checks must match {sorted(required)}")
for item in items:
item_id = item.get("check_id")
if item.get("rollback_owner_required") is not True or item.get("rollback_readiness_passed") is not False:
raise ValueError(f"{label}: rollback readiness {item_id} must stay required and unpassed")
if item.get("status") not in {"ready_for_owner_readback", "approval_required", "blocked_by_policy"}:
raise ValueError(f"{label}: rollback readiness {item_id} status is invalid")
if not item.get("rollback_scope") or not item.get("hold_reason"):
raise ValueError(f"{label}: rollback readiness {item_id} scope and hold_reason are required")
def _require_blocked_transitions(payload: dict[str, Any], label: str) -> None:
items = payload.get("blocked_readiness_transitions") or []
required = {
"blocked_writer_apply_readiness",
"blocked_execution_apply_readiness",
"blocked_receipt_write_readiness",
"blocked_result_capture_write_readiness",
"blocked_gateway_queue_write_readiness",
"blocked_telegram_send_readiness",
}
ids = {item.get("blocker_id") for item in items}
if ids != required:
raise ValueError(f"{label}: blocked readiness transitions must match {sorted(required)}")
for item in items:
item_id = item.get("blocker_id")
if item.get("status") not in {"approval_required", "blocked_by_policy"}:
raise ValueError(f"{label}: blocker {item_id} status is invalid")
if item.get("severity") not in {"high", "critical"}:
raise ValueError(f"{label}: blocker {item_id} severity is invalid")
if not item.get("blocked_action") or not item.get("blocked_until"):
raise ValueError(f"{label}: blocker {item_id} must include blocked_action and blocked_until")
if not _is_redacted_sha256(item.get("evidence_hash")):
raise ValueError(f"{label}: blocker {item_id} must expose redacted evidence_hash")
def _require_actions(payload: dict[str, Any], label: str) -> None:
actions = payload.get("operator_actions") or []
required = {
"review_release_readiness_readbacks",
"verify_owner_release_readiness_checks",
"verify_live_apply_readiness_hold",
"verify_rollback_readiness",
"prepare_p2_131_owner_release_approval_gate",
}
ids = {action.get("action_id") for action in actions}
if ids != required:
raise ValueError(f"{label}: operator actions must match {sorted(required)}")
for action in actions:
action_id = action.get("action_id")
if action.get("runtime_write_allowed") is not False:
raise ValueError(f"{label}: action {action_id} must not allow runtime write")
if not action.get("operator_instruction"):
raise ValueError(f"{label}: action {action_id} operator_instruction is required")
def _require_display_redaction(payload: dict[str, Any], label: str) -> None:
contract = payload.get("display_redaction_contract") or {}
expected = {
"redaction_required": True,
"raw_prompt_display_allowed": False,
"private_reasoning_display_allowed": False,
"secret_value_display_allowed": False,
"raw_runtime_payload_display_allowed": False,
"internal_collaboration_content_display_allowed": False,
}
mismatches = _mismatches(contract, expected)
if mismatches:
raise ValueError(f"{label}: display_redaction_contract mismatch: {mismatches}")
if not contract.get("frontend_display_policy"):
raise ValueError(f"{label}: display_redaction_contract.frontend_display_policy is required")
def _require_rollup_consistency(payload: dict[str, Any], label: str) -> None:
rollups = payload.get("rollups") or {}
readbacks = payload.get("release_readiness_readbacks") or []
checks = payload.get("owner_release_readiness_checks") or []
gates = payload.get("live_apply_readiness_gates") or []
rollbacks = payload.get("rollback_readiness_checks") or []
blockers = payload.get("blocked_readiness_transitions") or []
actions = payload.get("operator_actions") or []
expected = {
"release_readiness_readback_count": len(readbacks),
"owner_release_readiness_check_count": len(checks),
"live_apply_readiness_gate_count": len(gates),
"rollback_readiness_check_count": len(rollbacks),
"blocked_readiness_transition_count": len(blockers),
"operator_action_count": len(actions),
"approval_required_readback_count": sum(1 for item in readbacks if item.get("status") == "approval_required"),
"blocked_readback_count": sum(1 for item in readbacks if item.get("status") == "blocked_by_policy"),
"approval_required_owner_release_check_count": sum(1 for item in checks if item.get("status") == "approval_required"),
"blocked_owner_release_check_count": sum(1 for item in checks if item.get("status") == "blocked_by_policy"),
"approval_required_readiness_gate_count": sum(1 for item in gates if item.get("status") == "approval_required"),
"blocked_readiness_gate_count": sum(1 for item in gates if item.get("status") == "blocked_by_policy"),
"approval_required_rollback_count": sum(1 for item in rollbacks if item.get("status") == "approval_required"),
"blocked_rollback_count": sum(1 for item in rollbacks if item.get("status") == "blocked_by_policy"),
"critical_blocker_count": sum(1 for item in blockers if item.get("severity") == "critical"),
"owner_release_approved_count": 0,
"maintenance_window_approved_count": 0,
"rollback_owner_confirmed_count": 0,
"post_release_verifier_ready_count": 0,
"release_readiness_pass_count": 0,
"live_apply_release_pass_count": 0,
"writer_apply_count": 0,
"execution_apply_count": 0,
"receipt_write_count": 0,
"reviewer_queue_write_count": 0,
"gateway_queue_write_count": 0,
"telegram_send_count": 0,
"bot_api_call_count": 0,
"report_receipt_write_count": 0,
"result_capture_write_count": 0,
"learning_write_count": 0,
"playbook_trust_write_count": 0,
"production_write_count": 0,
"secret_read_count": 0,
"destructive_operation_count": 0,
}
mismatches = _mismatches(rollups, expected)
if mismatches:
raise ValueError(f"{label}: rollup counts mismatch: {mismatches}")
def _require_no_forbidden_display_terms(payload: dict[str, Any], label: str) -> None:
serialized = json.dumps(payload, ensure_ascii=False)
forbidden = {
"work_window_transcript",
"session_id",
"browser_context",
"authorization_header",
"raw Telegram payload",
"private reasoning",
"raw prompt",
"chain-of-thought",
}
hits = sorted(term for term in forbidden if term in serialized)
if hits:
raise ValueError(f"{label}: forbidden display terms present: {hits}")
def _is_redacted_sha256(value: Any) -> bool:
if not isinstance(value, str) or not value.startswith("sha256:"):
return False
digest = value.removeprefix("sha256:")
return len(digest) == 64 and all(char in "0123456789abcdef" for char in digest)
def _mismatches(payload: dict[str, Any], expected: dict[str, Any]) -> dict[str, dict[str, Any]]:
return {
key: {"expected": value, "actual": payload.get(key)}
for key, value in expected.items()
if payload.get(key) != value
}