Files
awoooi/docs/evaluations/agent_langgraph_replay_pipeline_2026-06-02.json
Your Name cfb866d055
Some checks failed
Ansible Lint / lint (push) Successful in 35s
CD Pipeline / tests (push) Failing after 13s
CD Pipeline / build-and-deploy (push) Has been skipped
CD Pipeline / post-deploy-checks (push) Has been skipped
Code Review / ai-code-review (push) Failing after 11s
feat(governance): add agent market automation surfaces
2026-06-04 21:50:55 +08:00

21 lines
1.1 KiB
JSON

{
"baseline": "/tmp/nemotron-replay-prod-20260602095438-openclaw-incumbent.jsonl",
"candidate_id": "langgraph_incident_kernel",
"contract_report": "/tmp/nemotron-replay-prod-20260602095438-langgraph-contract-report.json",
"contract_valid": true,
"fixtures": "/tmp/nemotron-replay-prod-20260602095438-sanitized-fixtures.jsonl",
"graded_output": "/tmp/nemotron-replay-prod-20260602095438-langgraph-graded.jsonl",
"graded_records": 50,
"grading_report": "/tmp/nemotron-replay-prod-20260602095438-langgraph-grading-report.json",
"input_records": 50,
"inputs": "/tmp/nemotron-replay-prod-20260602095438-sanitized-candidate-inputs.jsonl",
"label_grading_applied": true,
"normalized_output": "/tmp/nemotron-replay-prod-20260602095438-langgraph-normalized.jsonl",
"normalized_records": 50,
"result_records": 50,
"results": "/tmp/nemotron-replay-prod-20260602095438-langgraph-candidate-raw.jsonl",
"schema_version": "agent_replay_pipeline_report_v1",
"scorecard": "docs/evaluations/agent_langgraph_replay_scorecard_2026-06-02.json",
"scorecard_written": true
}