81 lines
2.1 KiB
JSON
81 lines
2.1 KiB
JSON
{
|
|
"schema_version": "agent_nemotron_replay_finalizer_report_v1",
|
|
"candidate_id": "nemo_nemotron_fabric",
|
|
"stage": "promotion_gate",
|
|
"approved": false,
|
|
"decision": "blocked",
|
|
"failures": [
|
|
"scorecard_not_eligible_for_canary",
|
|
"sample_too_small:1<50"
|
|
],
|
|
"import_report": {
|
|
"schema_version": "agent_nemotron_import_report_v1",
|
|
"candidate_id": "nemo_nemotron_fabric",
|
|
"external_results": 1,
|
|
"imported_results": 1,
|
|
"requests": 1,
|
|
"valid": true,
|
|
"failures": [],
|
|
"duplicate_results": [],
|
|
"missing_results": [],
|
|
"unexpected_results": [],
|
|
"external_error_records": 0,
|
|
"fallback_used_records": 0,
|
|
"incomplete_trace_records": 0,
|
|
"total_cost_usd": 0,
|
|
"avg_latency_ms": 8500,
|
|
"p95_latency_ms": 8500,
|
|
"model_distribution": {
|
|
"nvidia/nemotron-mini-4b-instruct": 1
|
|
}
|
|
},
|
|
"contract_report": {
|
|
"schema_version": "agent_replay_contract_report_v1",
|
|
"candidate_id": "nemo_nemotron_fabric",
|
|
"inputs": 1,
|
|
"results": 1,
|
|
"valid": true,
|
|
"failures": []
|
|
},
|
|
"pipeline_report": {
|
|
"schema_version": "agent_replay_pipeline_report_v1",
|
|
"candidate_id": "nemo_nemotron_fabric",
|
|
"contract_valid": true,
|
|
"input_records": 1,
|
|
"result_records": 1,
|
|
"normalized_records": 1,
|
|
"graded_records": 1,
|
|
"baseline_records": 1,
|
|
"ignored_nonbaseline_records": 0,
|
|
"label_grading_applied": true,
|
|
"scorecard_written": true
|
|
},
|
|
"grading_report": {
|
|
"schema_version": "agent_replay_grading_report_v1",
|
|
"records": 1,
|
|
"graded_records": 1,
|
|
"action_match_true": 1,
|
|
"action_match_false": 0,
|
|
"missing_fixtures": [],
|
|
"missing_expected_markers": []
|
|
},
|
|
"scorecard": null,
|
|
"promotion_gate": {
|
|
"schema_version": "agent_replay_promotion_gate_v1",
|
|
"candidate_id": "nemo_nemotron_fabric",
|
|
"target_stage": "shadow",
|
|
"approved": false,
|
|
"decision": "blocked",
|
|
"failures": [
|
|
"scorecard_not_eligible_for_canary",
|
|
"sample_too_small:1<50"
|
|
],
|
|
"evidence": {
|
|
"import_report": {
|
|
"provided": true,
|
|
"valid": true
|
|
}
|
|
}
|
|
}
|
|
}
|