Files
awoooi/docs/evaluations/examples/agent_nemotron_replay_finalizer_report.sample.json
Your Name cfb866d055
Some checks failed
Ansible Lint / lint (push) Successful in 35s
CD Pipeline / tests (push) Failing after 13s
CD Pipeline / build-and-deploy (push) Has been skipped
CD Pipeline / post-deploy-checks (push) Has been skipped
Code Review / ai-code-review (push) Failing after 11s
feat(governance): add agent market automation surfaces
2026-06-04 21:50:55 +08:00

81 lines
2.1 KiB
JSON

{
"schema_version": "agent_nemotron_replay_finalizer_report_v1",
"candidate_id": "nemo_nemotron_fabric",
"stage": "promotion_gate",
"approved": false,
"decision": "blocked",
"failures": [
"scorecard_not_eligible_for_canary",
"sample_too_small:1<50"
],
"import_report": {
"schema_version": "agent_nemotron_import_report_v1",
"candidate_id": "nemo_nemotron_fabric",
"external_results": 1,
"imported_results": 1,
"requests": 1,
"valid": true,
"failures": [],
"duplicate_results": [],
"missing_results": [],
"unexpected_results": [],
"external_error_records": 0,
"fallback_used_records": 0,
"incomplete_trace_records": 0,
"total_cost_usd": 0,
"avg_latency_ms": 8500,
"p95_latency_ms": 8500,
"model_distribution": {
"nvidia/nemotron-mini-4b-instruct": 1
}
},
"contract_report": {
"schema_version": "agent_replay_contract_report_v1",
"candidate_id": "nemo_nemotron_fabric",
"inputs": 1,
"results": 1,
"valid": true,
"failures": []
},
"pipeline_report": {
"schema_version": "agent_replay_pipeline_report_v1",
"candidate_id": "nemo_nemotron_fabric",
"contract_valid": true,
"input_records": 1,
"result_records": 1,
"normalized_records": 1,
"graded_records": 1,
"baseline_records": 1,
"ignored_nonbaseline_records": 0,
"label_grading_applied": true,
"scorecard_written": true
},
"grading_report": {
"schema_version": "agent_replay_grading_report_v1",
"records": 1,
"graded_records": 1,
"action_match_true": 1,
"action_match_false": 0,
"missing_fixtures": [],
"missing_expected_markers": []
},
"scorecard": null,
"promotion_gate": {
"schema_version": "agent_replay_promotion_gate_v1",
"candidate_id": "nemo_nemotron_fabric",
"target_stage": "shadow",
"approved": false,
"decision": "blocked",
"failures": [
"scorecard_not_eligible_for_canary",
"sample_too_small:1<50"
],
"evidence": {
"import_report": {
"provided": true,
"valid": true
}
}
}
}