{"eval":{"version":"openagentskill-skill-eval-v1","slug":"microsoft-responsible-ai-toolbox","name":"Responsible AI Toolbox","generated_at":"2026-07-04T00:16:01.201Z","task_input":"Evaluate Responsible AI Toolbox before installing it in an AI agent workflow","status":"passed","score":91,"risk_level":"low","decision":{"recommendation":"shortlist","reason":"All required eval gates passed for an agent shortlist.","auto_install_allowed":true,"policy":"allow","human_review_required":false},"task_fit":{"score":94,"suited_tasks":["GitHub automation workflows","Claude Code teams","teams that value GitHub adoption signals","Inspect repository metadata","Compare code changes","Write concise engineering summaries","Load tabular data","Calculate trends"],"suited_agents":["TypeScript","Data Analysis","Codex","Claude Code","Cursor","OpenAgentSkill CLI","CLI"]},"install":{"command":"npx skills add microsoft/responsible-ai-toolbox","ready":true,"policy":"allow","safety_label":"Safe to install with normal review","targets":[{"id":"openagentskill-cli","label":"CLI","kind":"command","value":"npx skills add microsoft/responsible-ai-toolbox"},{"id":"codex","label":"Codex","kind":"agent-prompt","value":"Install the \"Responsible AI Toolbox\" agent skill from https://github.com/microsoft/responsible-ai-toolbox. Read its SKILL.md or equivalent instructions first, install only the files needed for this workspace, and summarize any required setup before using it. Skill purpose: Responsible AI Toolbox is a suite of tools providing model and data exploration and assessment user interfaces and libraries that enable a better understanding of AI systems. These interfaces and libraries empower developers and stakeholders of AI systems to develop and monitor AI more responsibly, and take better data-driven actions."},{"id":"claude-code","label":"Claude Code","kind":"agent-prompt","value":"Add \"Responsible AI Toolbox\" as a Claude Code skill from https://github.com/microsoft/responsible-ai-toolbox. Inspect the skill instructions, place the reusable skill files in the appropriate local skills location for this project, and report the activation steps. Skill purpose: Responsible AI Toolbox is a suite of tools providing model and data exploration and assessment user interfaces and libraries that enable a better understanding of AI systems. These interfaces and libraries empower developers and stakeholders of AI systems to develop and monitor AI more responsibly, and take better data-driven actions."},{"id":"cursor","label":"Cursor","kind":"agent-prompt","value":"Turn \"Responsible AI Toolbox\" from https://github.com/microsoft/responsible-ai-toolbox into a reusable Cursor project rule or agent instruction. Preserve the core workflow, adapt paths to this repo, and keep the rule scoped to tasks where it is relevant. Skill purpose: Responsible AI Toolbox is a suite of tools providing model and data exploration and assessment user interfaces and libraries that enable a better understanding of AI systems. These interfaces and libraries empower developers and stakeholders of AI systems to develop and monitor AI more responsibly, and take better data-driven actions."}]},"trust":{"score":90,"label":"Production candidate","version":"trust-score-v4","evidence":{"stars":"1.8K GitHub stars","repoActivity":"1.8K stars, 478 forks","lastPushed":"2mo since push","license":"MIT","repository":"https://github.com/microsoft/responsible-ai-toolbox","install":"npx skills add microsoft/responsible-ai-toolbox","installSafety":"standard package or runtime install path","permissionSurface":"filesystem or document access","documentation":"Strong README/SKILL.md context","agentOutcomes":"No agent outcome data yet"}},"audit":{"score":92,"risk_level":"safe_to_try","risk_label":"Safe to try","warnings":[]},"safety_gate":{"score":84,"tier":"verified","label":"Verified","auto_install_policy":"allow","blocked":false,"permission_hints":[{"id":"network","label":"Network access","reason":"Skill likely fetches remote pages, APIs, repositories, or external services.","severity":"medium"},{"id":"filesystem","label":"Filesystem access","reason":"Skill may read or write project files, documents, generated artifacts, or local workspace state.","severity":"medium"}],"policy_warnings":[]},"checks":[{"id":"task_fit","label":"Task fit","status":"pass","score":94,"required_for_auto_install":true,"detail":"Task wording matches this skill metadata.","evidence":["Evaluate Responsible AI Toolbox before installing it in an AI agent workflow","data-analysis","GitHub automation workflows; Claude Code teams; teams that value GitHub adoption signals"]},{"id":"install_path","label":"Install path","status":"pass","score":92,"required_for_auto_install":true,"detail":"Install handoff is available.","evidence":["npx skills add microsoft/responsible-ai-toolbox"]},{"id":"install_safety","label":"Install command safety","status":"pass","score":92,"required_for_auto_install":true,"detail":"standard package or runtime install path","evidence":["npx skills add microsoft/responsible-ai-toolbox"]},{"id":"trust_score","label":"Trust score","status":"pass","score":90,"required_for_auto_install":true,"detail":"Strong OpenAgentSkill Trust Score across adoption, recent maintenance, license clarity, documentation, dependency/runtime risk, install safety, permission surface, and install availability.","evidence":["Production candidate","1.8K GitHub stars","MIT"]},{"id":"audit_score","label":"Audit score","status":"pass","score":92,"required_for_auto_install":true,"detail":"Safe to try","evidence":["No major audit warning from metadata."]},{"id":"agent_safety_gate","label":"Agent safety gate","status":"pass","score":84,"required_for_auto_install":true,"detail":"Strong metadata, audit, install, and review signals. Suitable for agent shortlists after normal workspace review.","evidence":["Allow agent install in a sandbox or low-risk workspace, then promote after one successful narrow task.","Verified listing"]},{"id":"readme_skillmd_completeness","label":"README/SKILL.md completeness","status":"pass","score":90,"required_for_auto_install":false,"detail":"Metadata includes enough usage and workflow context","evidence":["Strong README/SKILL.md context"]},{"id":"license_clarity","label":"License clarity","status":"pass","score":86,"required_for_auto_install":true,"detail":"MIT","evidence":["MIT"]},{"id":"recent_maintenance","label":"Recent maintenance","status":"pass","score":88,"required_for_auto_install":false,"detail":"2mo since push","evidence":["2mo since push"]},{"id":"permission_surface","label":"Permission surface","status":"pass","score":86,"required_for_auto_install":true,"detail":"filesystem or document access","evidence":["Network access: medium","Filesystem access: medium"]},{"id":"alternatives","label":"Alternatives available","status":"pass","score":82,"required_for_auto_install":false,"detail":"Alternative skills are available for comparison.","evidence":["d3-d3","grafana-grafana","apache-superset","apache-echarts"]}],"blockers":[],"warnings":[],"validation_plan":["Inspect repository, README/SKILL.md, license, and recent commits before production use.","Install in an isolated workspace or sandbox with no production secrets available.","Run the smallest representative task and record files touched, commands run, network access, and outputs.","Compare the selected skill against at least one alternative when the eval status is review or failed.","Promote only after the agent reports a successful verification result and unresolved warnings are accepted."],"do_not_use_when":["teams that need a vendor-supported SLA","high-compliance environments without internal security review","No major risk signals from current metadata","No major trust warnings detected from available metadata","Production credentials, payments, or irreversible account changes without explicit human review","Sensitive private data before reviewing repository code, license, and permission surface"],"alternatives":[{"slug":"d3-d3","name":"D3","url":"https://www.openagentskill.com/skills/d3-d3","stars":113096,"install_command":"npx skills add d3/d3","trust_score":89,"audit_score":91},{"slug":"grafana-grafana","name":"Grafana","url":"https://www.openagentskill.com/skills/grafana-grafana","stars":74422,"install_command":"npx skills add grafana/grafana","trust_score":92,"audit_score":94},{"slug":"apache-superset","name":"Superset","url":"https://www.openagentskill.com/skills/apache-superset","stars":73285,"install_command":"npx skills add apache/superset","trust_score":92,"audit_score":95},{"slug":"apache-echarts","name":"Echarts","url":"https://www.openagentskill.com/skills/apache-echarts","stars":66600,"install_command":"npx skills add apache/echarts","trust_score":91,"audit_score":92}],"machine_metadata":{"version":"openagentskill-agent-metadata-v2","skill":{"slug":"microsoft-responsible-ai-toolbox","name":"Responsible AI Toolbox","description":"Responsible AI Toolbox is a suite of tools providing model and data exploration and assessment user interfaces and libraries that enable a better understanding of AI systems. These interfaces and libraries empower developers and stakeholders of AI systems to develop and monitor AI more responsibly, and take better data-driven actions.","category":"data-analysis","url":"https://www.openagentskill.com/skills/microsoft-responsible-ai-toolbox","repository":"https://github.com/microsoft/responsible-ai-toolbox","github_repo":"microsoft/responsible-ai-toolbox"},"suited_tasks":["GitHub automation workflows","Claude Code teams","teams that value GitHub adoption signals","Inspect repository metadata","Compare code changes","Write concise engineering summaries","Load tabular data","Calculate trends"],"suited_agents":["TypeScript","Data Analysis","Codex","Claude Code","Cursor","OpenAgentSkill CLI","CLI"],"install":{"command":"npx skills add microsoft/responsible-ai-toolbox","ready":true,"targets":[{"id":"openagentskill-cli","label":"CLI","kind":"command","value":"npx skills add microsoft/responsible-ai-toolbox"},{"id":"codex","label":"Codex","kind":"agent-prompt","value":"Install the \"Responsible AI Toolbox\" agent skill from https://github.com/microsoft/responsible-ai-toolbox. Read its SKILL.md or equivalent instructions first, install only the files needed for this workspace, and summarize any required setup before using it. Skill purpose: Responsible AI Toolbox is a suite of tools providing model and data exploration and assessment user interfaces and libraries that enable a better understanding of AI systems. These interfaces and libraries empower developers and stakeholders of AI systems to develop and monitor AI more responsibly, and take better data-driven actions."},{"id":"claude-code","label":"Claude Code","kind":"agent-prompt","value":"Add \"Responsible AI Toolbox\" as a Claude Code skill from https://github.com/microsoft/responsible-ai-toolbox. Inspect the skill instructions, place the reusable skill files in the appropriate local skills location for this project, and report the activation steps. Skill purpose: Responsible AI Toolbox is a suite of tools providing model and data exploration and assessment user interfaces and libraries that enable a better understanding of AI systems. These interfaces and libraries empower developers and stakeholders of AI systems to develop and monitor AI more responsibly, and take better data-driven actions."},{"id":"cursor","label":"Cursor","kind":"agent-prompt","value":"Turn \"Responsible AI Toolbox\" from https://github.com/microsoft/responsible-ai-toolbox into a reusable Cursor project rule or agent instruction. Preserve the core workflow, adapt paths to this repo, and keep the rule scoped to tasks where it is relevant. Skill purpose: Responsible AI Toolbox is a suite of tools providing model and data exploration and assessment user interfaces and libraries that enable a better understanding of AI systems. These interfaces and libraries empower developers and stakeholders of AI systems to develop and monitor AI more responsibly, and take better data-driven actions."}],"handoff_url":"https://www.openagentskill.com/api/skills/microsoft-responsible-ai-toolbox/install","manifest_url":"https://www.openagentskill.com/api/registry/manifest/microsoft-responsible-ai-toolbox"},"trust":{"score":90,"label":"Production candidate","version":"trust-score-v4","install_policy":"agent_install_candidate","evidence":{"stars":"1.8K GitHub stars","repoActivity":"1.8K stars, 478 forks","lastPushed":"2mo since push","license":"MIT","repository":"https://github.com/microsoft/responsible-ai-toolbox","install":"npx skills add microsoft/responsible-ai-toolbox","installSafety":"standard package or runtime install path","permissionSurface":"filesystem or document access","documentation":"Strong README/SKILL.md context","agentOutcomes":"No agent outcome data yet"},"outcome_evidence":{"total":0,"successes":0,"failures":0,"not_relevant":0,"success_rate":null,"recent_success_rate":null,"recent_failure_rate":null,"install_attempts":0,"install_success_rate":null,"risk_blocked":0,"setup_required":0,"avg_output_quality":null,"production_outcomes":0,"last_outcome_at":null,"label":"No agent outcome data yet"},"auto_install":{"allowed":true,"sandbox_required":true,"reason":"Trust Score v4 allows sandbox-first agent installation after normal workspace review."},"best_for":["data-analysis","analytics","data","data-science","data-visualization","error-analysis"],"known_risks":[]},"agent_proven":{"version":"agent-proven-v1","score":0,"tier":"unproven","label":"Needs first agent run","summary":"No agent outcome reports yet. Use Resolve, run one narrow sandbox task, then report the result.","metrics":{"totalOutcomes":0,"successfulOutcomes":0,"failedOutcomes":0,"installAttempts":0,"installSuccessRate":null,"successRate":null,"recentSuccessRate":null,"recentFailureRate":null,"riskBlocked":0,"setupRequired":0,"notRelevant":0,"avgOutputQuality":null,"avgTimeToUsefulMs":null,"productionOutcomes":0,"humanReviewRequired":0,"uniqueAgents":0,"lastOutcomeAt":null},"signals":[],"penalties":["No real agent outcome evidence yet"]},"audit":{"score":92,"risk_level":"safe_to_try","risk_label":"Safe to try","warnings":[]},"safety_gate":{"tier":"verified","label":"Verified","auto_install_policy":"allow","auto_install_allowed":true,"human_review_required":false,"blocked":false,"recommended_action":"Allow agent install in a sandbox or low-risk workspace, then promote after one successful narrow task."},"quality":{"score":98,"label":"Excellent"},"supply":{"track":"Data, BI, and analytics","scenario":"Data analysis","maintenance":"2mo since push","risk":"Safe to try"},"alternative_skills":[{"slug":"d3-d3","name":"D3","url":"https://www.openagentskill.com/skills/d3-d3","stars":113096,"install_command":"npx skills add d3/d3","trust_score":89,"audit_score":91},{"slug":"grafana-grafana","name":"Grafana","url":"https://www.openagentskill.com/skills/grafana-grafana","stars":74422,"install_command":"npx skills add grafana/grafana","trust_score":92,"audit_score":94},{"slug":"apache-superset","name":"Superset","url":"https://www.openagentskill.com/skills/apache-superset","stars":73285,"install_command":"npx skills add apache/superset","trust_score":92,"audit_score":95},{"slug":"apache-echarts","name":"Echarts","url":"https://www.openagentskill.com/skills/apache-echarts","stars":66600,"install_command":"npx skills add apache/echarts","trust_score":91,"audit_score":92}],"do_not_use_when":["teams that need a vendor-supported SLA","high-compliance environments without internal security review","No major risk signals from current metadata","No major trust warnings detected from available metadata","Production credentials, payments, or irreversible account changes without explicit human review","Sensitive private data before reviewing repository code, license, and permission surface"],"agent_contract":{"task_input":"Evaluate Responsible AI Toolbox before installing it in an AI agent workflow","recommended_action":"Allow agent install in a sandbox or low-risk workspace, then promote after one successful narrow task.","install_policy":"allow","minimum_review_before_use":["Trust: 90/100 Production candidate","Audit: 92/100 Safe to try","Safety: 84/100 Safe to install with normal review","Review repository, license, install command, and permission surface before production use."],"expected_agent_output":{"selected_skill":"microsoft-responsible-ai-toolbox (Responsible AI Toolbox)","install_command":"npx skills add microsoft/responsible-ai-toolbox","risk_summary":"Safe to try; Verified; Low metadata risk","verification_result":"Report the smallest successful task, files touched, warnings, and any missing setup."}},"outcome_feedback":{"endpoint":"https://www.openagentskill.com/api/agent/outcome","method":"POST","requires_resolve_event_id":true,"event_id_source":"Use install_receipt.outcome_feedback.event_id or feedback.event_id returned by /api/agent/resolve for the current task.","expected_outcomes":["success","failed","not_relevant","blocked_by_risk","setup_required"],"payload_template":{"event_id":"<install_receipt.outcome_feedback.event_id or feedback.event_id from /api/agent/resolve>","skill_slug":"microsoft-responsible-ai-toolbox","task":"Evaluate Responsible AI Toolbox before installing it in an AI agent workflow","agent":"codex","outcome":"success","install_used":true,"risk_blocked":false,"setup_required":false,"task_success":true,"output_quality":4,"error_type":null,"human_review_required":false,"workspace":"sandbox","time_to_useful_ms":120000,"notes":"Report the smallest successful task, setup friction, files touched, and risk notes."}},"endpoints":{"web":"https://www.openagentskill.com/skills/microsoft-responsible-ai-toolbox","api":"https://www.openagentskill.com/api/agent/skills/microsoft-responsible-ai-toolbox","audit":"https://www.openagentskill.com/skills/microsoft-responsible-ai-toolbox/audit","eval":"https://www.openagentskill.com/api/agent/evals?slug=microsoft-responsible-ai-toolbox&task=Evaluate%20Responsible%20AI%20Toolbox%20before%20installing%20it%20in%20an%20AI%20agent%20workflow&max_risk=medium","resolve":"https://www.openagentskill.com/api/agent/resolve?task=Evaluate%20Responsible%20AI%20Toolbox%20before%20installing%20it%20in%20an%20AI%20agent%20workflow&agent=codex&max_risk=medium","receipt":"https://www.openagentskill.com/api/agent/receipt?task=Evaluate%20Responsible%20AI%20Toolbox%20before%20installing%20it%20in%20an%20AI%20agent%20workflow&agent=codex&max_risk=medium&format=text","install":"https://www.openagentskill.com/api/skills/microsoft-responsible-ai-toolbox/install","manifest":"https://www.openagentskill.com/api/registry/manifest/microsoft-responsible-ai-toolbox"}},"endpoints":{"web":"https://www.openagentskill.com/skills/microsoft-responsible-ai-toolbox","api":"https://www.openagentskill.com/api/agent/skills/microsoft-responsible-ai-toolbox","eval":"https://www.openagentskill.com/api/agent/evals?slug=microsoft-responsible-ai-toolbox","audit":"https://www.openagentskill.com/skills/microsoft-responsible-ai-toolbox/audit","resolve":"https://www.openagentskill.com/api/agent/resolve?task=Evaluate%20Responsible%20AI%20Toolbox%20before%20installing%20it%20in%20an%20AI%20agent%20workflow&agent=codex&max_risk=medium"}},"meta":{"endpoint":"/api/agent/evals","mode":"skill_eval","purpose":"Pre-install eval contract for a single skill. Agents should read this before installing a reusable skill.","generated_at":"2026-07-04T00:16:01.201Z"}}