255 lines
10 KiB
Python
255 lines
10 KiB
Python
"""
|
|
AI provider route matrix snapshot.
|
|
|
|
Loads the latest committed, read-only AI Router / Ollama / OpenClaw /
|
|
Nemotron / Gemini provider route matrix. This module never switches providers,
|
|
calls paid APIs, probes external providers, reads secrets, changes runtime
|
|
routes, enters shadow/canary, triggers workflows, or executes runtime actions.
|
|
"""
|
|
|
|
from __future__ import annotations
|
|
|
|
import json
|
|
from pathlib import Path
|
|
from typing import Any
|
|
|
|
from src.services.snapshot_paths import default_evaluations_dir
|
|
|
|
_DEFAULT_EVALUATIONS_DIR = default_evaluations_dir(Path(__file__))
|
|
_SNAPSHOT_PATTERN = "ai_provider_route_matrix_*.json"
|
|
_SCHEMA_VERSION = "ai_provider_route_matrix_v1"
|
|
|
|
|
|
def load_latest_ai_provider_route_matrix(
|
|
evaluations_dir: Path | None = None,
|
|
) -> dict[str, Any]:
|
|
"""Load the newest committed AI provider route matrix snapshot."""
|
|
directory = evaluations_dir or _DEFAULT_EVALUATIONS_DIR
|
|
candidates = sorted(directory.glob(_SNAPSHOT_PATTERN))
|
|
if not candidates:
|
|
raise FileNotFoundError(f"no AI provider route matrix snapshots found in {directory}")
|
|
|
|
latest = candidates[-1]
|
|
with latest.open(encoding="utf-8") as handle:
|
|
payload = json.load(handle)
|
|
|
|
if not isinstance(payload, dict):
|
|
raise ValueError(f"{latest}: expected JSON object")
|
|
_require_schema(payload, _SCHEMA_VERSION, str(latest))
|
|
_require_read_only_boundaries(payload, str(latest))
|
|
_require_operation_boundaries(payload, str(latest))
|
|
_require_rollup_consistency(payload, str(latest))
|
|
_require_route_evidence(payload, str(latest))
|
|
_require_candidate_gates(payload, str(latest))
|
|
_require_operator_denials(payload, str(latest))
|
|
_require_no_plaintext_secret_payload_keys(payload, str(latest))
|
|
return payload
|
|
|
|
|
|
def _require_schema(payload: dict[str, Any], expected: str, label: str) -> None:
|
|
actual = payload.get("schema_version")
|
|
if actual != expected:
|
|
raise ValueError(f"{label}: expected schema_version={expected}, got {actual!r}")
|
|
|
|
|
|
def _require_read_only_boundaries(payload: dict[str, Any], label: str) -> None:
|
|
program_status = payload.get("program_status") or {}
|
|
if program_status.get("read_only_mode") is not True:
|
|
raise ValueError(f"{label}: program_status.read_only_mode must be true")
|
|
|
|
approval_boundaries = payload.get("approval_boundaries") or {}
|
|
allowed = sorted(key for key, value in approval_boundaries.items() if value is not False)
|
|
if allowed:
|
|
raise ValueError(f"{label}: approval boundaries must remain false: {allowed}")
|
|
|
|
|
|
def _require_operation_boundaries(payload: dict[str, Any], label: str) -> None:
|
|
boundaries = payload.get("operation_boundaries") or {}
|
|
if boundaries.get("read_only_api_allowed") is not True:
|
|
raise ValueError(f"{label}: read_only_api_allowed must be true")
|
|
|
|
blocked_flags = {
|
|
"provider_switch_allowed",
|
|
"production_routing_change_allowed",
|
|
"use_ai_router_toggle_allowed",
|
|
"fallback_order_change_allowed",
|
|
"ollama_endpoint_change_allowed",
|
|
"paid_api_call_allowed",
|
|
"paid_api_frequency_increase_allowed",
|
|
"external_provider_probe_allowed",
|
|
"live_benchmark_allowed",
|
|
"shadow_or_canary_allowed",
|
|
"openclaw_replacement_allowed",
|
|
"nemotron_shadow_allowed",
|
|
"gemini_direct_call_allowed",
|
|
"secret_read_allowed",
|
|
"secret_plaintext_allowed",
|
|
"notification_send_allowed",
|
|
"workflow_trigger_allowed",
|
|
"deploy_trigger_allowed",
|
|
"reload_trigger_allowed",
|
|
"runtime_execution_allowed",
|
|
}
|
|
allowed = sorted(flag for flag in blocked_flags if boundaries.get(flag) is not False)
|
|
if allowed:
|
|
raise ValueError(f"{label}: operation boundaries must remain false: {allowed}")
|
|
|
|
|
|
def _require_rollup_consistency(payload: dict[str, Any], label: str) -> None:
|
|
routes = payload.get("provider_routes") or []
|
|
gates = payload.get("candidate_gates") or []
|
|
gaps = payload.get("source_gaps") or []
|
|
rollups = payload.get("rollups") or {}
|
|
|
|
if rollups.get("total_routes") != len(routes):
|
|
raise ValueError(f"{label}: rollups.total_routes must match provider_routes")
|
|
if rollups.get("by_kind") != _count_by(routes, "kind"):
|
|
raise ValueError(f"{label}: rollups.by_kind must match provider_routes")
|
|
if rollups.get("by_status") != _count_by(routes, "status"):
|
|
raise ValueError(f"{label}: rollups.by_status must match provider_routes")
|
|
if rollups.get("by_route_gate") != _count_by(routes, "route_gate"):
|
|
raise ValueError(f"{label}: rollups.by_route_gate must match provider_routes")
|
|
|
|
requiring_action = sorted(
|
|
route.get("route_id")
|
|
for route in routes
|
|
if route.get("status") == "action_required"
|
|
)
|
|
if sorted(rollups.get("route_ids_requiring_action") or []) != requiring_action:
|
|
raise ValueError(f"{label}: rollups.route_ids_requiring_action must match routes")
|
|
|
|
approval_gates = sorted(
|
|
gate.get("gate_id")
|
|
for gate in gates
|
|
if gate.get("approval_required") is True
|
|
)
|
|
if sorted(rollups.get("candidate_gate_ids_requiring_approval") or []) != approval_gates:
|
|
raise ValueError(
|
|
f"{label}: rollups.candidate_gate_ids_requiring_approval must match candidate_gates"
|
|
)
|
|
|
|
if sorted(rollups.get("source_gap_ids") or []) != sorted(gap.get("gap_id") for gap in gaps):
|
|
raise ValueError(f"{label}: rollups.source_gap_ids must match source_gaps")
|
|
|
|
zero_count_fields = {
|
|
"provider_switch_allowed_count",
|
|
"paid_api_call_allowed_count",
|
|
"shadow_or_canary_allowed_count",
|
|
"runtime_route_change_allowed_count",
|
|
}
|
|
non_zero = sorted(field for field in zero_count_fields if rollups.get(field) != 0)
|
|
if non_zero:
|
|
raise ValueError(f"{label}: route permission rollup counts must remain 0: {non_zero}")
|
|
|
|
|
|
def _require_route_evidence(payload: dict[str, Any], label: str) -> None:
|
|
routes = payload.get("provider_routes") or []
|
|
missing = sorted(
|
|
route.get("route_id")
|
|
for route in routes
|
|
if not route.get("current_policy")
|
|
or not route.get("provider_order")
|
|
or not route.get("fallback_policy")
|
|
or not route.get("evidence_refs")
|
|
or not route.get("next_action")
|
|
)
|
|
if missing:
|
|
raise ValueError(f"{label}: provider_routes must include policy, order, evidence, next_action: {missing}")
|
|
|
|
required_route_ids = {
|
|
"ai_router_execution_policy",
|
|
"ollama_global_endpoint_order",
|
|
"alert_ai_ollama_first_lane",
|
|
"openclaw_nemo_rca_lane",
|
|
"nemotron_tool_calling_candidate",
|
|
"gemini_final_fallback_policy",
|
|
}
|
|
present = {route.get("route_id") for route in routes}
|
|
missing_required = sorted(required_route_ids - present)
|
|
if missing_required:
|
|
raise ValueError(f"{label}: missing required provider routes: {missing_required}")
|
|
|
|
blocked_candidates = sorted(
|
|
route.get("route_id")
|
|
for route in routes
|
|
if route.get("kind") == "nemotron_candidate" and route.get("status") != "blocked"
|
|
)
|
|
if blocked_candidates:
|
|
raise ValueError(f"{label}: Nemotron candidates must remain blocked: {blocked_candidates}")
|
|
|
|
|
|
def _require_candidate_gates(payload: dict[str, Any], label: str) -> None:
|
|
gates = payload.get("candidate_gates") or []
|
|
required_ids = {
|
|
"provider_switch_gate",
|
|
"nemotron_replay_gate",
|
|
"paid_provider_call_gate",
|
|
}
|
|
present = {gate.get("gate_id") for gate in gates}
|
|
missing = sorted(required_ids - present)
|
|
if missing:
|
|
raise ValueError(f"{label}: missing required candidate gates: {missing}")
|
|
|
|
not_approval_required = sorted(
|
|
gate.get("gate_id")
|
|
for gate in gates
|
|
if gate.get("approval_required") is not True
|
|
)
|
|
if not_approval_required:
|
|
raise ValueError(f"{label}: candidate gates must require approval: {not_approval_required}")
|
|
|
|
|
|
def _require_operator_denials(payload: dict[str, Any], label: str) -> None:
|
|
contract = payload.get("operator_contract") or {}
|
|
must_not_interpret_as = set(contract.get("must_not_interpret_as") or [])
|
|
required_denials = {
|
|
"provider 切換批准",
|
|
"production routing change 批准",
|
|
"Gemini / Claude / NVIDIA 付費呼叫批准",
|
|
"OpenClaw 取代或降級批准",
|
|
"Nemotron 進 shadow / canary 批准",
|
|
"fallback order 修改批准",
|
|
"Ollama endpoint / ConfigMap 修改批准",
|
|
"Secret payload 已讀取或可輸出",
|
|
"外部 live probe 或 benchmark 批准",
|
|
"workflow / deploy / reload 觸發批准",
|
|
"runtime execution 授權",
|
|
}
|
|
if not required_denials.issubset(must_not_interpret_as):
|
|
raise ValueError(f"{label}: operator_contract.must_not_interpret_as is missing required denials")
|
|
|
|
provider_switch_policy = str(contract.get("provider_switch_policy") or "")
|
|
if "P1-004" not in provider_switch_policy or "只能盤點與顯示" not in provider_switch_policy:
|
|
raise ValueError(f"{label}: provider_switch_policy must preserve P1-004 read-only boundary")
|
|
|
|
|
|
def _require_no_plaintext_secret_payload_keys(value: Any, label: str, path: str = "$") -> None:
|
|
if isinstance(value, dict):
|
|
forbidden_key_fragments = {
|
|
"secret_value",
|
|
"token_value",
|
|
"authorization_header",
|
|
"private_key",
|
|
"webhook_secret",
|
|
"runner_token",
|
|
"gemini_api_key_value",
|
|
"nvidia_api_key_value",
|
|
"claude_api_key_value",
|
|
}
|
|
for key, nested in value.items():
|
|
lowered = str(key).lower()
|
|
if any(fragment in lowered for fragment in forbidden_key_fragments):
|
|
raise ValueError(f"{label}: forbidden secret payload key at {path}.{key}")
|
|
_require_no_plaintext_secret_payload_keys(nested, label, f"{path}.{key}")
|
|
elif isinstance(value, list):
|
|
for index, nested in enumerate(value):
|
|
_require_no_plaintext_secret_payload_keys(nested, label, f"{path}[{index}]")
|
|
|
|
|
|
def _count_by(items: list[dict[str, Any]], key: str) -> dict[str, int]:
|
|
counts: dict[str, int] = {}
|
|
for item in items:
|
|
value = item.get(key)
|
|
counts[value] = counts.get(value, 0) + 1
|
|
return counts
|