{"name":"viktorbezdek-agent-evaluation-agent-evaluation","owner":{"name":"ClaudePluginHub"},"plugins":[{"name":"viktorbezdek-agent-evaluation-agent-evaluation","source":{"source":"github","repo":"viktorbezdek/skillstack"},"description":"Comprehensive evaluation framework for LLM agent systems. Multi-dimensional rubrics, LLM-as-judge with bias mitigation, pairwise comparison, direct scoring, confidence calibration, and continuous monitoring.","version":"1.0.4","strict":true,"keywords":["claude-code","skill","evaluation","llm-as-judge","bias-mitigation","rubrics","pairwise-comparison"],"category":"utilities"}]}