{"eval":{"version":"openagentskill-skill-eval-v1","slug":"devtoys-app-devtoys","name":"DevToys","generated_at":"2026-07-04T04:45:08.817Z","task_input":"Evaluate DevToys before installing it in an AI agent workflow","status":"passed","score":89,"risk_level":"low","decision":{"recommendation":"shortlist","reason":"All required eval gates passed for an agent shortlist.","auto_install_allowed":true,"policy":"allow","human_review_required":false},"task_fit":{"score":84,"suited_tasks":["Coding agents workflows","Claude Code teams","teams that value GitHub adoption signals","Inspect source files","Explain architecture","Patch bugs and verify changes","Navigate local resources","Run repeatable desktop actions"],"suited_agents":["C#","Developer Tools","Codex","Claude Code","Cursor","OpenAgentSkill CLI","CLI"]},"install":{"command":"npx skills add DevToys-app/DevToys","ready":true,"policy":"allow","safety_label":"Safe to install with normal review","targets":[{"id":"openagentskill-cli","label":"CLI","kind":"command","value":"npx skills add DevToys-app/DevToys"},{"id":"codex","label":"Codex","kind":"agent-prompt","value":"Install the \"DevToys\" agent skill from https://github.com/DevToys-app/DevToys. Read its SKILL.md or equivalent instructions first, install only the files needed for this workspace, and summarize any required setup before using it. Skill purpose: A Swiss Army knife for developers."},{"id":"claude-code","label":"Claude Code","kind":"agent-prompt","value":"Add \"DevToys\" as a Claude Code skill from https://github.com/DevToys-app/DevToys. Inspect the skill instructions, place the reusable skill files in the appropriate local skills location for this project, and report the activation steps. Skill purpose: A Swiss Army knife for developers."},{"id":"cursor","label":"Cursor","kind":"agent-prompt","value":"Turn \"DevToys\" from https://github.com/DevToys-app/DevToys into a reusable Cursor project rule or agent instruction. Preserve the core workflow, adapt paths to this repo, and keep the rule scoped to tasks where it is relevant. Skill purpose: A Swiss Army knife for developers."}]},"trust":{"score":89,"label":"Production candidate","version":"trust-score-v4","evidence":{"stars":"32K GitHub stars","repoActivity":"32K stars, 1.8K forks","lastPushed":"4mo since push","license":"MIT","repository":"https://github.com/DevToys-app/DevToys","install":"npx skills add DevToys-app/DevToys","installSafety":"standard package or runtime install path","permissionSurface":"filesystem or document access","documentation":"Usable metadata, review docs","agentOutcomes":"No agent outcome data yet"}},"audit":{"score":90,"risk_level":"safe_to_try","risk_label":"Safe to try","warnings":[]},"safety_gate":{"score":82,"tier":"verified","label":"Verified","auto_install_policy":"allow","blocked":false,"permission_hints":[{"id":"network","label":"Network access","reason":"Skill likely fetches remote pages, APIs, repositories, or external services.","severity":"medium"},{"id":"filesystem","label":"Filesystem access","reason":"Skill may read or write project files, documents, generated artifacts, or local workspace state.","severity":"medium"}],"policy_warnings":[]},"checks":[{"id":"task_fit","label":"Task fit","status":"pass","score":84,"required_for_auto_install":true,"detail":"Task wording matches this skill metadata.","evidence":["Evaluate DevToys before installing it in an AI agent workflow","coding-agents","Coding agents workflows; Claude Code teams; teams that value GitHub adoption signals"]},{"id":"install_path","label":"Install path","status":"pass","score":92,"required_for_auto_install":true,"detail":"Install handoff is available.","evidence":["npx skills add DevToys-app/DevToys"]},{"id":"install_safety","label":"Install command safety","status":"pass","score":92,"required_for_auto_install":true,"detail":"standard package or runtime install path","evidence":["npx skills add DevToys-app/DevToys"]},{"id":"trust_score","label":"Trust score","status":"pass","score":89,"required_for_auto_install":true,"detail":"Strong OpenAgentSkill Trust Score across adoption, recent maintenance, license clarity, documentation, dependency/runtime risk, install safety, permission surface, and install availability.","evidence":["Production candidate","32K GitHub stars","MIT"]},{"id":"audit_score","label":"Audit score","status":"pass","score":90,"required_for_auto_install":true,"detail":"Safe to try","evidence":["No major audit warning from metadata."]},{"id":"agent_safety_gate","label":"Agent safety gate","status":"pass","score":82,"required_for_auto_install":true,"detail":"Strong metadata, audit, install, and review signals. Suitable for agent shortlists after normal workspace review.","evidence":["Allow agent install in a sandbox or low-risk workspace, then promote after one successful narrow task.","Verified listing"]},{"id":"readme_skillmd_completeness","label":"README/SKILL.md completeness","status":"warn","score":74,"required_for_auto_install":false,"detail":"Public metadata needs stronger README/SKILL.md context","evidence":["Usable metadata, review docs"]},{"id":"license_clarity","label":"License clarity","status":"pass","score":86,"required_for_auto_install":true,"detail":"MIT","evidence":["MIT"]},{"id":"recent_maintenance","label":"Recent maintenance","status":"warn","score":76,"required_for_auto_install":false,"detail":"4mo since push","evidence":["4mo since push"]},{"id":"permission_surface","label":"Permission surface","status":"pass","score":86,"required_for_auto_install":true,"detail":"filesystem or document access","evidence":["Network access: medium","Filesystem access: medium"]},{"id":"alternatives","label":"Alternatives available","status":"pass","score":82,"required_for_auto_install":false,"detail":"Alternative skills are available for comparison.","evidence":["anomalyco-opencode","puppeteer-puppeteer","openai-codex","hoppscotch-hoppscotch"]}],"blockers":[],"warnings":["README/SKILL.md completeness: Public metadata needs stronger README/SKILL.md context","Recent maintenance: 4mo since push"],"validation_plan":["Inspect repository, README/SKILL.md, license, and recent commits before production use.","Install in an isolated workspace or sandbox with no production secrets available.","Run the smallest representative task and record files touched, commands run, network access, and outputs.","Compare the selected skill against at least one alternative when the eval status is review or failed.","Promote only after the agent reports a successful verification result and unresolved warnings are accepted."],"do_not_use_when":["teams that need a vendor-supported SLA","high-compliance environments without internal security review","No major risk signals from current metadata","No major trust warnings detected from available metadata","Production credentials, payments, or irreversible account changes without explicit human review","Sensitive private data before reviewing repository code, license, and permission surface"],"alternatives":[{"slug":"anomalyco-opencode","name":"Opencode","url":"https://www.openagentskill.com/skills/anomalyco-opencode","stars":175041,"install_command":"npx skills add anomalyco/opencode","trust_score":92,"audit_score":95},{"slug":"puppeteer-puppeteer","name":"Puppeteer","url":"https://www.openagentskill.com/skills/puppeteer-puppeteer","stars":94783,"install_command":"npx skills add puppeteer/puppeteer","trust_score":90,"audit_score":94},{"slug":"openai-codex","name":"Codex","url":"https://www.openagentskill.com/skills/openai-codex","stars":91367,"install_command":"npx skills add openai/codex","trust_score":88,"audit_score":92},{"slug":"hoppscotch-hoppscotch","name":"Hoppscotch","url":"https://www.openagentskill.com/skills/hoppscotch-hoppscotch","stars":79567,"install_command":"npx skills add hoppscotch/hoppscotch","trust_score":89,"audit_score":93}],"machine_metadata":{"version":"openagentskill-agent-metadata-v2","skill":{"slug":"devtoys-app-devtoys","name":"DevToys","description":"A Swiss Army knife for developers.","category":"coding-agents","url":"https://www.openagentskill.com/skills/devtoys-app-devtoys","repository":"https://github.com/DevToys-app/DevToys","github_repo":"DevToys-app/DevToys"},"suited_tasks":["Coding agents workflows","Claude Code teams","teams that value GitHub adoption signals","Inspect source files","Explain architecture","Patch bugs and verify changes","Navigate local resources","Run repeatable desktop actions"],"suited_agents":["C#","Developer Tools","Codex","Claude Code","Cursor","OpenAgentSkill CLI","CLI"],"install":{"command":"npx skills add DevToys-app/DevToys","ready":true,"targets":[{"id":"openagentskill-cli","label":"CLI","kind":"command","value":"npx skills add DevToys-app/DevToys"},{"id":"codex","label":"Codex","kind":"agent-prompt","value":"Install the \"DevToys\" agent skill from https://github.com/DevToys-app/DevToys. Read its SKILL.md or equivalent instructions first, install only the files needed for this workspace, and summarize any required setup before using it. Skill purpose: A Swiss Army knife for developers."},{"id":"claude-code","label":"Claude Code","kind":"agent-prompt","value":"Add \"DevToys\" as a Claude Code skill from https://github.com/DevToys-app/DevToys. Inspect the skill instructions, place the reusable skill files in the appropriate local skills location for this project, and report the activation steps. Skill purpose: A Swiss Army knife for developers."},{"id":"cursor","label":"Cursor","kind":"agent-prompt","value":"Turn \"DevToys\" from https://github.com/DevToys-app/DevToys into a reusable Cursor project rule or agent instruction. Preserve the core workflow, adapt paths to this repo, and keep the rule scoped to tasks where it is relevant. Skill purpose: A Swiss Army knife for developers."}],"handoff_url":"https://www.openagentskill.com/api/skills/devtoys-app-devtoys/install","manifest_url":"https://www.openagentskill.com/api/registry/manifest/devtoys-app-devtoys"},"trust":{"score":89,"label":"Production candidate","version":"trust-score-v4","install_policy":"agent_install_candidate","evidence":{"stars":"32K GitHub stars","repoActivity":"32K stars, 1.8K forks","lastPushed":"4mo since push","license":"MIT","repository":"https://github.com/DevToys-app/DevToys","install":"npx skills add DevToys-app/DevToys","installSafety":"standard package or runtime install path","permissionSurface":"filesystem or document access","documentation":"Usable metadata, review docs","agentOutcomes":"No agent outcome data yet"},"outcome_evidence":{"total":0,"successes":0,"failures":0,"not_relevant":0,"success_rate":null,"recent_success_rate":null,"recent_failure_rate":null,"install_attempts":0,"install_success_rate":null,"risk_blocked":0,"setup_required":0,"avg_output_quality":null,"production_outcomes":0,"last_outcome_at":null,"label":"No agent outcome data yet"},"auto_install":{"allowed":true,"sandbox_required":true,"reason":"Trust Score v4 allows sandbox-first agent installation after normal workspace review."},"best_for":["coding-agents","developer-tools","automation","coding","blazor","cross-platform"],"known_risks":[]},"agent_proven":{"version":"agent-proven-v1","score":0,"tier":"unproven","label":"Needs first agent run","summary":"No agent outcome reports yet. Use Resolve, run one narrow sandbox task, then report the result.","metrics":{"totalOutcomes":0,"successfulOutcomes":0,"failedOutcomes":0,"installAttempts":0,"installSuccessRate":null,"successRate":null,"recentSuccessRate":null,"recentFailureRate":null,"riskBlocked":0,"setupRequired":0,"notRelevant":0,"avgOutputQuality":null,"avgTimeToUsefulMs":null,"productionOutcomes":0,"humanReviewRequired":0,"uniqueAgents":0,"lastOutcomeAt":null},"signals":[],"penalties":["No real agent outcome evidence yet"]},"audit":{"score":90,"risk_level":"safe_to_try","risk_label":"Safe to try","warnings":[]},"safety_gate":{"tier":"verified","label":"Verified","auto_install_policy":"allow","auto_install_allowed":true,"human_review_required":false,"blocked":false,"recommended_action":"Allow agent install in a sandbox or low-risk workspace, then promote after one successful narrow task."},"quality":{"score":100,"label":"Excellent"},"supply":{"track":"Coding and developer agents","scenario":"Coding agents","maintenance":"4mo since push","risk":"Safe to try"},"alternative_skills":[{"slug":"anomalyco-opencode","name":"Opencode","url":"https://www.openagentskill.com/skills/anomalyco-opencode","stars":175041,"install_command":"npx skills add anomalyco/opencode","trust_score":92,"audit_score":95},{"slug":"puppeteer-puppeteer","name":"Puppeteer","url":"https://www.openagentskill.com/skills/puppeteer-puppeteer","stars":94783,"install_command":"npx skills add puppeteer/puppeteer","trust_score":90,"audit_score":94},{"slug":"openai-codex","name":"Codex","url":"https://www.openagentskill.com/skills/openai-codex","stars":91367,"install_command":"npx skills add openai/codex","trust_score":88,"audit_score":92},{"slug":"hoppscotch-hoppscotch","name":"Hoppscotch","url":"https://www.openagentskill.com/skills/hoppscotch-hoppscotch","stars":79567,"install_command":"npx skills add hoppscotch/hoppscotch","trust_score":89,"audit_score":93}],"do_not_use_when":["teams that need a vendor-supported SLA","high-compliance environments without internal security review","No major risk signals from current metadata","No major trust warnings detected from available metadata","Production credentials, payments, or irreversible account changes without explicit human review","Sensitive private data before reviewing repository code, license, and permission surface"],"agent_contract":{"task_input":"Evaluate DevToys before installing it in an AI agent workflow","recommended_action":"Allow agent install in a sandbox or low-risk workspace, then promote after one successful narrow task.","install_policy":"allow","minimum_review_before_use":["Trust: 89/100 Production candidate","Audit: 90/100 Safe to try","Safety: 82/100 Safe to install with normal review","Review repository, license, install command, and permission surface before production use."],"expected_agent_output":{"selected_skill":"devtoys-app-devtoys (DevToys)","install_command":"npx skills add DevToys-app/DevToys","risk_summary":"Safe to try; Verified; Low metadata risk","verification_result":"Report the smallest successful task, files touched, warnings, and any missing setup."}},"outcome_feedback":{"endpoint":"https://www.openagentskill.com/api/agent/outcome","method":"POST","requires_resolve_event_id":true,"event_id_source":"Use install_receipt.outcome_feedback.event_id or feedback.event_id returned by /api/agent/resolve for the current task.","expected_outcomes":["success","failed","not_relevant","blocked_by_risk","setup_required"],"payload_template":{"event_id":"<install_receipt.outcome_feedback.event_id or feedback.event_id from /api/agent/resolve>","skill_slug":"devtoys-app-devtoys","task":"Evaluate DevToys before installing it in an AI agent workflow","agent":"codex","outcome":"success","install_used":true,"risk_blocked":false,"setup_required":false,"task_success":true,"output_quality":4,"error_type":null,"human_review_required":false,"workspace":"sandbox","time_to_useful_ms":120000,"notes":"Report the smallest successful task, setup friction, files touched, and risk notes."}},"endpoints":{"web":"https://www.openagentskill.com/skills/devtoys-app-devtoys","api":"https://www.openagentskill.com/api/agent/skills/devtoys-app-devtoys","audit":"https://www.openagentskill.com/skills/devtoys-app-devtoys/audit","eval":"https://www.openagentskill.com/api/agent/evals?slug=devtoys-app-devtoys&task=Evaluate%20DevToys%20before%20installing%20it%20in%20an%20AI%20agent%20workflow&max_risk=medium","resolve":"https://www.openagentskill.com/api/agent/resolve?task=Evaluate%20DevToys%20before%20installing%20it%20in%20an%20AI%20agent%20workflow&agent=codex&max_risk=medium","receipt":"https://www.openagentskill.com/api/agent/receipt?task=Evaluate%20DevToys%20before%20installing%20it%20in%20an%20AI%20agent%20workflow&agent=codex&max_risk=medium&format=text","install":"https://www.openagentskill.com/api/skills/devtoys-app-devtoys/install","manifest":"https://www.openagentskill.com/api/registry/manifest/devtoys-app-devtoys"}},"endpoints":{"web":"https://www.openagentskill.com/skills/devtoys-app-devtoys","api":"https://www.openagentskill.com/api/agent/skills/devtoys-app-devtoys","eval":"https://www.openagentskill.com/api/agent/evals?slug=devtoys-app-devtoys","audit":"https://www.openagentskill.com/skills/devtoys-app-devtoys/audit","resolve":"https://www.openagentskill.com/api/agent/resolve?task=Evaluate%20DevToys%20before%20installing%20it%20in%20an%20AI%20agent%20workflow&agent=codex&max_risk=medium"}},"meta":{"endpoint":"/api/agent/evals","mode":"skill_eval","purpose":"Pre-install eval contract for a single skill. Agents should read this before installing a reusable skill.","generated_at":"2026-07-04T04:45:08.817Z"}}