{"eval":{"version":"openagentskill-skill-eval-v1","slug":"rtk-ai-rtk","name":"Rtk","generated_at":"2026-07-03T21:47:49.280Z","task_input":"Evaluate Rtk before installing it in an AI agent workflow","status":"failed","score":83,"risk_level":"high","decision":{"recommendation":"do_not_auto_install","reason":"Permission surface: secrets or environment access, shell or command execution","auto_install_allowed":false,"policy":"block","human_review_required":true},"task_fit":{"score":84,"suited_tasks":["Coding agents workflows","Claude Code teams","teams that value GitHub adoption signals","Inspect source files","Explain architecture","Patch bugs and verify changes","Inspect repository metadata","Compare code changes"],"suited_agents":["Rust","Developer Tools","Codex","Claude Code","Cursor","OpenAgentSkill CLI","CLI"]},"install":{"command":"npx skills add rtk-ai/rtk","ready":true,"policy":"review","safety_label":"Avoid automatic install","targets":[{"id":"openagentskill-cli","label":"CLI","kind":"command","value":"npx skills add rtk-ai/rtk"},{"id":"codex","label":"Codex","kind":"agent-prompt","value":"Install the \"Rtk\" agent skill from https://github.com/rtk-ai/rtk. Read its SKILL.md or equivalent instructions first, install only the files needed for this workspace, and summarize any required setup before using it. Skill purpose: CLI proxy that reduces LLM token consumption by 60-90% on common dev commands. Single Rust binary, zero dependencies"},{"id":"claude-code","label":"Claude Code","kind":"agent-prompt","value":"Add \"Rtk\" as a Claude Code skill from https://github.com/rtk-ai/rtk. Inspect the skill instructions, place the reusable skill files in the appropriate local skills location for this project, and report the activation steps. Skill purpose: CLI proxy that reduces LLM token consumption by 60-90% on common dev commands. Single Rust binary, zero dependencies"},{"id":"cursor","label":"Cursor","kind":"agent-prompt","value":"Turn \"Rtk\" from https://github.com/rtk-ai/rtk into a reusable Cursor project rule or agent instruction. Preserve the core workflow, adapt paths to this repo, and keep the rule scoped to tasks where it is relevant. Skill purpose: CLI proxy that reduces LLM token consumption by 60-90% on common dev commands. Single Rust binary, zero dependencies"}]},"trust":{"score":87,"label":"Production candidate","version":"trust-score-v4","evidence":{"stars":"64K GitHub stars","repoActivity":"64K stars, 3.9K forks","lastPushed":"14d since push","license":"Apache-2.0","repository":"https://github.com/rtk-ai/rtk","install":"npx skills add rtk-ai/rtk","installSafety":"standard package or runtime install path","permissionSurface":"secrets or environment access, shell or command execution","documentation":"Strong README/SKILL.md context","agentOutcomes":"No agent outcome data yet"}},"audit":{"score":92,"risk_level":"needs_review","risk_label":"Needs review","warnings":["Dependency or permission surface needs review","Permission surface may require sandboxing","Permission surface needs review: secrets or environment access, shell or command execution","Dependency/runtime risk: command execution surface, credential or environment access","Permission surface: secrets or environment access, shell or command execution"]},"safety_gate":{"score":52,"tier":"experimental","label":"Experimental","auto_install_policy":"review","blocked":false,"permission_hints":[{"id":"shell","label":"Shell or command execution","reason":"Skill metadata references terminal, CLI, shell, subprocess, or command execution workflows.","severity":"high"},{"id":"network","label":"Network access","reason":"Skill likely fetches remote pages, APIs, repositories, or external services.","severity":"medium"},{"id":"filesystem","label":"Filesystem access","reason":"Skill may read or write project files, documents, generated artifacts, or local workspace state.","severity":"medium"},{"id":"secrets","label":"Secrets or environment access","reason":"Skill metadata references credentials, tokens, environment variables, or secret-bearing workflows.","severity":"high"}],"policy_warnings":["High-risk permission hints: Shell or command execution, Secrets or environment access","Dependency or permission surface needs review"]},"checks":[{"id":"task_fit","label":"Task fit","status":"pass","score":84,"required_for_auto_install":true,"detail":"Task wording matches this skill metadata.","evidence":["Evaluate Rtk before installing it in an AI agent workflow","coding-agents","Coding agents workflows; Claude Code teams; teams that value GitHub adoption signals"]},{"id":"install_path","label":"Install path","status":"pass","score":92,"required_for_auto_install":true,"detail":"Install handoff is available.","evidence":["npx skills add rtk-ai/rtk"]},{"id":"install_safety","label":"Install command safety","status":"pass","score":92,"required_for_auto_install":true,"detail":"standard package or runtime install path","evidence":["npx skills add rtk-ai/rtk"]},{"id":"trust_score","label":"Trust score","status":"pass","score":87,"required_for_auto_install":true,"detail":"Strong OpenAgentSkill Trust Score across adoption, recent maintenance, license clarity, documentation, dependency/runtime risk, install safety, permission surface, and install availability.","evidence":["Production candidate","64K GitHub stars","Apache-2.0"]},{"id":"audit_score","label":"Audit score","status":"warn","score":92,"required_for_auto_install":true,"detail":"Needs review","evidence":["Dependency or permission surface needs review"]},{"id":"agent_safety_gate","label":"Agent safety gate","status":"warn","score":52,"required_for_auto_install":true,"detail":"Sparse or mixed signals. Useful for discovery, but not for autonomous installation.","evidence":["Test manually in an isolated workspace and compare against safer alternatives.","Metadata combines secrets access with shell or command execution"]},{"id":"readme_skillmd_completeness","label":"README/SKILL.md completeness","status":"pass","score":90,"required_for_auto_install":false,"detail":"Metadata includes enough usage and workflow context","evidence":["Strong README/SKILL.md context"]},{"id":"license_clarity","label":"License clarity","status":"pass","score":86,"required_for_auto_install":true,"detail":"Apache-2.0","evidence":["Apache-2.0"]},{"id":"recent_maintenance","label":"Recent maintenance","status":"pass","score":100,"required_for_auto_install":false,"detail":"14d since push","evidence":["14d since push"]},{"id":"permission_surface","label":"Permission surface","status":"fail","score":36,"required_for_auto_install":true,"detail":"secrets or environment access, shell or command execution","evidence":["Shell or command execution: high","Network access: medium","Filesystem access: medium"]},{"id":"alternatives","label":"Alternatives available","status":"pass","score":82,"required_for_auto_install":false,"detail":"Alternative skills are available for comparison.","evidence":["anomalyco-opencode","puppeteer-puppeteer","openai-codex","hoppscotch-hoppscotch"]}],"blockers":["Permission surface: secrets or environment access, shell or command execution"],"warnings":["Audit score: Needs review","Agent safety gate: Sparse or mixed signals. Useful for discovery, but not for autonomous installation.","High-risk permission hints: Shell or command execution, Secrets or environment access","Dependency or permission surface needs review","Permission surface may require sandboxing","Permission surface needs review: secrets or environment access, shell or command execution","Dependency/runtime risk: command execution surface, credential or environment access","Permission surface: secrets or environment access, shell or command execution"],"validation_plan":["Inspect repository, README/SKILL.md, license, and recent commits before production use.","Install in an isolated workspace or sandbox with no production secrets available.","Run the smallest representative task and record files touched, commands run, network access, and outputs.","Compare the selected skill against at least one alternative when the eval status is review or failed.","Promote only after the agent reports a successful verification result and unresolved warnings are accepted."],"do_not_use_when":["teams that need a vendor-supported SLA","high-compliance environments without internal security review","No major risk signals from current metadata","High-risk permission hints: Shell or command execution, Secrets or environment access","Dependency or permission surface needs review","Permission surface may require sandboxing","Permission surface needs review: secrets or environment access, shell or command execution","Dependency/runtime risk: command execution surface, credential or environment access"],"alternatives":[{"slug":"anomalyco-opencode","name":"Opencode","url":"https://www.openagentskill.com/skills/anomalyco-opencode","stars":175041,"install_command":"npx skills add anomalyco/opencode","trust_score":92,"audit_score":95},{"slug":"puppeteer-puppeteer","name":"Puppeteer","url":"https://www.openagentskill.com/skills/puppeteer-puppeteer","stars":94783,"install_command":"npx skills add puppeteer/puppeteer","trust_score":90,"audit_score":94},{"slug":"openai-codex","name":"Codex","url":"https://www.openagentskill.com/skills/openai-codex","stars":91367,"install_command":"npx skills add openai/codex","trust_score":88,"audit_score":92},{"slug":"hoppscotch-hoppscotch","name":"Hoppscotch","url":"https://www.openagentskill.com/skills/hoppscotch-hoppscotch","stars":79567,"install_command":"npx skills add hoppscotch/hoppscotch","trust_score":89,"audit_score":93}],"machine_metadata":{"version":"openagentskill-agent-metadata-v2","skill":{"slug":"rtk-ai-rtk","name":"Rtk","description":"CLI proxy that reduces LLM token consumption by 60-90% on common dev commands. Single Rust binary, zero dependencies","category":"coding-agents","url":"https://www.openagentskill.com/skills/rtk-ai-rtk","repository":"https://github.com/rtk-ai/rtk","github_repo":"rtk-ai/rtk"},"suited_tasks":["Coding agents workflows","Claude Code teams","teams that value GitHub adoption signals","Inspect source files","Explain architecture","Patch bugs and verify changes","Inspect repository metadata","Compare code changes"],"suited_agents":["Rust","Developer Tools","Codex","Claude Code","Cursor","OpenAgentSkill CLI","CLI"],"install":{"command":"npx skills add rtk-ai/rtk","ready":true,"targets":[{"id":"openagentskill-cli","label":"CLI","kind":"command","value":"npx skills add rtk-ai/rtk"},{"id":"codex","label":"Codex","kind":"agent-prompt","value":"Install the \"Rtk\" agent skill from https://github.com/rtk-ai/rtk. Read its SKILL.md or equivalent instructions first, install only the files needed for this workspace, and summarize any required setup before using it. Skill purpose: CLI proxy that reduces LLM token consumption by 60-90% on common dev commands. Single Rust binary, zero dependencies"},{"id":"claude-code","label":"Claude Code","kind":"agent-prompt","value":"Add \"Rtk\" as a Claude Code skill from https://github.com/rtk-ai/rtk. Inspect the skill instructions, place the reusable skill files in the appropriate local skills location for this project, and report the activation steps. Skill purpose: CLI proxy that reduces LLM token consumption by 60-90% on common dev commands. Single Rust binary, zero dependencies"},{"id":"cursor","label":"Cursor","kind":"agent-prompt","value":"Turn \"Rtk\" from https://github.com/rtk-ai/rtk into a reusable Cursor project rule or agent instruction. Preserve the core workflow, adapt paths to this repo, and keep the rule scoped to tasks where it is relevant. Skill purpose: CLI proxy that reduces LLM token consumption by 60-90% on common dev commands. Single Rust binary, zero dependencies"}],"handoff_url":"https://www.openagentskill.com/api/skills/rtk-ai-rtk/install","manifest_url":"https://www.openagentskill.com/api/registry/manifest/rtk-ai-rtk"},"trust":{"score":87,"label":"Production candidate","version":"trust-score-v4","install_policy":"agent_install_candidate","evidence":{"stars":"64K GitHub stars","repoActivity":"64K stars, 3.9K forks","lastPushed":"14d since push","license":"Apache-2.0","repository":"https://github.com/rtk-ai/rtk","install":"npx skills add rtk-ai/rtk","installSafety":"standard package or runtime install path","permissionSurface":"secrets or environment access, shell or command execution","documentation":"Strong README/SKILL.md context","agentOutcomes":"No agent outcome data yet"},"outcome_evidence":{"total":0,"successes":0,"failures":0,"not_relevant":0,"success_rate":null,"recent_success_rate":null,"recent_failure_rate":null,"install_attempts":0,"install_success_rate":null,"risk_blocked":0,"setup_required":0,"avg_output_quality":null,"production_outcomes":0,"last_outcome_at":null,"label":"No agent outcome data yet"},"auto_install":{"allowed":true,"sandbox_required":true,"reason":"Trust Score v4 allows sandbox-first agent installation after normal workspace review."},"best_for":["coding-agents","developer-tools","automation","coding","agentic-coding","ai-coding"],"known_risks":["Permission surface needs review: secrets or environment access, shell or command execution","Dependency/runtime risk: command execution surface, credential or environment access","Permission surface: secrets or environment access, shell or command execution"]},"agent_proven":{"version":"agent-proven-v1","score":0,"tier":"unproven","label":"Needs first agent run","summary":"No agent outcome reports yet. Use Resolve, run one narrow sandbox task, then report the result.","metrics":{"totalOutcomes":0,"successfulOutcomes":0,"failedOutcomes":0,"installAttempts":0,"installSuccessRate":null,"successRate":null,"recentSuccessRate":null,"recentFailureRate":null,"riskBlocked":0,"setupRequired":0,"notRelevant":0,"avgOutputQuality":null,"avgTimeToUsefulMs":null,"productionOutcomes":0,"humanReviewRequired":0,"uniqueAgents":0,"lastOutcomeAt":null},"signals":[],"penalties":["No real agent outcome evidence yet"]},"audit":{"score":92,"risk_level":"needs_review","risk_label":"Needs review","warnings":["Dependency or permission surface needs review","Permission surface may require sandboxing","Permission surface needs review: secrets or environment access, shell or command execution","Dependency/runtime risk: command execution surface, credential or environment access","Permission surface: secrets or environment access, shell or command execution"]},"safety_gate":{"tier":"experimental","label":"Experimental","auto_install_policy":"review","auto_install_allowed":false,"human_review_required":true,"blocked":false,"recommended_action":"Test manually in an isolated workspace and compare against safer alternatives."},"quality":{"score":100,"label":"Excellent"},"supply":{"track":"Coding and developer agents","scenario":"Coding agents","maintenance":"14d since push","risk":"Needs review"},"alternative_skills":[{"slug":"anomalyco-opencode","name":"Opencode","url":"https://www.openagentskill.com/skills/anomalyco-opencode","stars":175041,"install_command":"npx skills add anomalyco/opencode","trust_score":92,"audit_score":95},{"slug":"puppeteer-puppeteer","name":"Puppeteer","url":"https://www.openagentskill.com/skills/puppeteer-puppeteer","stars":94783,"install_command":"npx skills add puppeteer/puppeteer","trust_score":90,"audit_score":94},{"slug":"openai-codex","name":"Codex","url":"https://www.openagentskill.com/skills/openai-codex","stars":91367,"install_command":"npx skills add openai/codex","trust_score":88,"audit_score":92},{"slug":"hoppscotch-hoppscotch","name":"Hoppscotch","url":"https://www.openagentskill.com/skills/hoppscotch-hoppscotch","stars":79567,"install_command":"npx skills add hoppscotch/hoppscotch","trust_score":89,"audit_score":93}],"do_not_use_when":["teams that need a vendor-supported SLA","high-compliance environments without internal security review","No major risk signals from current metadata","High-risk permission hints: Shell or command execution, Secrets or environment access","Dependency or permission surface needs review","Permission surface may require sandboxing","Permission surface needs review: secrets or environment access, shell or command execution","Dependency/runtime risk: command execution surface, credential or environment access"],"agent_contract":{"task_input":"Evaluate Rtk before installing it in an AI agent workflow","recommended_action":"Test manually in an isolated workspace and compare against safer alternatives.","install_policy":"review","minimum_review_before_use":["Trust: 87/100 Production candidate","Audit: 92/100 Needs review","Safety: 52/100 Avoid automatic install","Review repository, license, install command, and permission surface before production use."],"expected_agent_output":{"selected_skill":"rtk-ai-rtk (Rtk)","install_command":"npx skills add rtk-ai/rtk","risk_summary":"Needs review; Experimental; Review before production","verification_result":"Report the smallest successful task, files touched, warnings, and any missing setup."}},"outcome_feedback":{"endpoint":"https://www.openagentskill.com/api/agent/outcome","method":"POST","requires_resolve_event_id":true,"event_id_source":"Use install_receipt.outcome_feedback.event_id or feedback.event_id returned by /api/agent/resolve for the current task.","expected_outcomes":["success","failed","not_relevant","blocked_by_risk","setup_required"],"payload_template":{"event_id":"<install_receipt.outcome_feedback.event_id or feedback.event_id from /api/agent/resolve>","skill_slug":"rtk-ai-rtk","task":"Evaluate Rtk before installing it in an AI agent workflow","agent":"codex","outcome":"success","install_used":true,"risk_blocked":false,"setup_required":false,"task_success":true,"output_quality":4,"error_type":null,"human_review_required":false,"workspace":"sandbox","time_to_useful_ms":120000,"notes":"Report the smallest successful task, setup friction, files touched, and risk notes."}},"endpoints":{"web":"https://www.openagentskill.com/skills/rtk-ai-rtk","api":"https://www.openagentskill.com/api/agent/skills/rtk-ai-rtk","audit":"https://www.openagentskill.com/skills/rtk-ai-rtk/audit","eval":"https://www.openagentskill.com/api/agent/evals?slug=rtk-ai-rtk&task=Evaluate%20Rtk%20before%20installing%20it%20in%20an%20AI%20agent%20workflow&max_risk=medium","resolve":"https://www.openagentskill.com/api/agent/resolve?task=Evaluate%20Rtk%20before%20installing%20it%20in%20an%20AI%20agent%20workflow&agent=codex&max_risk=medium","receipt":"https://www.openagentskill.com/api/agent/receipt?task=Evaluate%20Rtk%20before%20installing%20it%20in%20an%20AI%20agent%20workflow&agent=codex&max_risk=medium&format=text","install":"https://www.openagentskill.com/api/skills/rtk-ai-rtk/install","manifest":"https://www.openagentskill.com/api/registry/manifest/rtk-ai-rtk"}},"endpoints":{"web":"https://www.openagentskill.com/skills/rtk-ai-rtk","api":"https://www.openagentskill.com/api/agent/skills/rtk-ai-rtk","eval":"https://www.openagentskill.com/api/agent/evals?slug=rtk-ai-rtk","audit":"https://www.openagentskill.com/skills/rtk-ai-rtk/audit","resolve":"https://www.openagentskill.com/api/agent/resolve?task=Evaluate%20Rtk%20before%20installing%20it%20in%20an%20AI%20agent%20workflow&agent=codex&max_risk=medium"}},"meta":{"endpoint":"/api/agent/evals","mode":"skill_eval","purpose":"Pre-install eval contract for a single skill. Agents should read this before installing a reusable skill.","generated_at":"2026-07-03T21:47:49.281Z"}}