{"eval":{"version":"openagentskill-skill-eval-v1","slug":"coasty-ai-open-computer-use","name":"Open Computer Use","generated_at":"2026-07-03T23:14:13.525Z","task_input":"Evaluate Open Computer Use before installing it in an AI agent workflow","status":"failed","score":79,"risk_level":"high","decision":{"recommendation":"do_not_auto_install","reason":"Permission surface: secrets or environment access, filesystem or document access","auto_install_allowed":false,"policy":"block","human_review_required":true},"task_fit":{"score":94,"suited_tasks":["Local desktop workflows","Claude Code teams","teams that value GitHub adoption signals","Navigate local resources","Run repeatable desktop actions","Verify file outputs","Inspect source files","Explain architecture"],"suited_agents":["TypeScript","Computer Use","Codex","Claude Code","Cursor","OpenAgentSkill CLI","CLI"]},"install":{"command":"npx skills add coasty-ai/open-computer-use","ready":true,"policy":"review","safety_label":"Review before install","targets":[{"id":"openagentskill-cli","label":"CLI","kind":"command","value":"npx skills add coasty-ai/open-computer-use"},{"id":"codex","label":"Codex","kind":"agent-prompt","value":"Install the \"Open Computer Use\" agent skill from https://github.com/coasty-ai/open-computer-use. Read its SKILL.md or equivalent instructions first, install only the files needed for this workspace, and summarize any required setup before using it. Skill purpose: State of the Art 82% OSWorld Computer Using Agent, production-ready. Remote and Local! Setup using one API Key"},{"id":"claude-code","label":"Claude Code","kind":"agent-prompt","value":"Add \"Open Computer Use\" as a Claude Code skill from https://github.com/coasty-ai/open-computer-use. Inspect the skill instructions, place the reusable skill files in the appropriate local skills location for this project, and report the activation steps. Skill purpose: State of the Art 82% OSWorld Computer Using Agent, production-ready. Remote and Local! Setup using one API Key"},{"id":"cursor","label":"Cursor","kind":"agent-prompt","value":"Turn \"Open Computer Use\" from https://github.com/coasty-ai/open-computer-use into a reusable Cursor project rule or agent instruction. Preserve the core workflow, adapt paths to this repo, and keep the rule scoped to tasks where it is relevant. Skill purpose: State of the Art 82% OSWorld Computer Using Agent, production-ready. Remote and Local! Setup using one API Key"}]},"trust":{"score":79,"label":"Strong shortlist","version":"trust-score-v4","evidence":{"stars":"762 GitHub stars","repoActivity":"762 stars, 94 forks","lastPushed":"19d since push","license":"Apache-2.0","repository":"https://github.com/coasty-ai/open-computer-use","install":"npx skills add coasty-ai/open-computer-use","installSafety":"standard package or runtime install path","permissionSurface":"secrets or environment access, filesystem or document access","documentation":"Strong README/SKILL.md context","agentOutcomes":"No agent outcome data yet"}},"audit":{"score":86,"risk_level":"needs_review","risk_label":"Needs review","warnings":["Permission surface may require sandboxing","Quality score needs review","Permission surface needs review: secrets or environment access, filesystem or document access","Permission surface: secrets or environment access, filesystem or document access"]},"safety_gate":{"score":58,"tier":"reviewed","label":"Reviewed with permission notes","auto_install_policy":"review","blocked":false,"permission_hints":[{"id":"network","label":"Network access","reason":"Skill likely fetches remote pages, APIs, repositories, or external services.","severity":"medium"},{"id":"filesystem","label":"Filesystem access","reason":"Skill may read or write project files, documents, generated artifacts, or local workspace state.","severity":"medium"},{"id":"secrets","label":"Secrets or environment access","reason":"Skill metadata references credentials, tokens, environment variables, or secret-bearing workflows.","severity":"high"}],"policy_warnings":["High-risk permission hints: Secrets or environment access","Permission surface may require sandboxing"]},"checks":[{"id":"task_fit","label":"Task fit","status":"pass","score":94,"required_for_auto_install":true,"detail":"Task wording matches this skill metadata.","evidence":["Evaluate Open Computer Use before installing it in an AI agent workflow","automation","Local desktop workflows; Claude Code teams; teams that value GitHub adoption signals"]},{"id":"install_path","label":"Install path","status":"pass","score":92,"required_for_auto_install":true,"detail":"Install handoff is available.","evidence":["npx skills add coasty-ai/open-computer-use"]},{"id":"install_safety","label":"Install command safety","status":"pass","score":92,"required_for_auto_install":true,"detail":"standard package or runtime install path","evidence":["npx skills add coasty-ai/open-computer-use"]},{"id":"trust_score","label":"Trust score","status":"warn","score":79,"required_for_auto_install":true,"detail":"Good trust signals with a few areas worth checking before rollout.","evidence":["Strong shortlist","762 GitHub stars","Apache-2.0"]},{"id":"audit_score","label":"Audit score","status":"warn","score":86,"required_for_auto_install":true,"detail":"Needs review","evidence":["Permission surface may require sandboxing"]},{"id":"agent_safety_gate","label":"Agent safety gate","status":"warn","score":58,"required_for_auto_install":true,"detail":"Usable candidate, but the agent should surface permission and audit notes before installation.","evidence":["Require human approval before installing into a real workspace.","High-risk permission hints: Secrets or environment access"]},{"id":"readme_skillmd_completeness","label":"README/SKILL.md completeness","status":"pass","score":90,"required_for_auto_install":false,"detail":"Metadata includes enough usage and workflow context","evidence":["Strong README/SKILL.md context"]},{"id":"license_clarity","label":"License clarity","status":"pass","score":86,"required_for_auto_install":true,"detail":"Apache-2.0","evidence":["Apache-2.0"]},{"id":"recent_maintenance","label":"Recent maintenance","status":"pass","score":100,"required_for_auto_install":false,"detail":"19d since push","evidence":["19d since push"]},{"id":"permission_surface","label":"Permission surface","status":"fail","score":46,"required_for_auto_install":true,"detail":"secrets or environment access, filesystem or document access","evidence":["Network access: medium","Filesystem access: medium","Secrets or environment access: high"]},{"id":"alternatives","label":"Alternatives available","status":"pass","score":82,"required_for_auto_install":false,"detail":"Alternative skills are available for comparison.","evidence":["harry0703-moneyprinterturbo","huginn-huginn","fastlane-fastlane"]}],"blockers":["Permission surface: secrets or environment access, filesystem or document access"],"warnings":["Trust score: Good trust signals with a few areas worth checking before rollout.","Audit score: Needs review","Agent safety gate: Usable candidate, but the agent should surface permission and audit notes before installation.","High-risk permission hints: Secrets or environment access","Permission surface may require sandboxing","Quality score needs review","Permission surface needs review: secrets or environment access, filesystem or document access","Permission surface: secrets or environment access, filesystem or document access"],"validation_plan":["Inspect repository, README/SKILL.md, license, and recent commits before production use.","Install in an isolated workspace or sandbox with no production secrets available.","Run the smallest representative task and record files touched, commands run, network access, and outputs.","Compare the selected skill against at least one alternative when the eval status is review or failed.","Promote only after the agent reports a successful verification result and unresolved warnings are accepted."],"do_not_use_when":["teams that need a vendor-supported SLA","high-compliance environments without internal security review","No major risk signals from current metadata","High-risk permission hints: Secrets or environment access","Permission surface may require sandboxing","Quality score needs review","Permission surface needs review: secrets or environment access, filesystem or document access","Permission surface: secrets or environment access, filesystem or document access"],"alternatives":[{"slug":"harry0703-moneyprinterturbo","name":"MoneyPrinterTurbo","url":"https://www.openagentskill.com/skills/harry0703-moneyprinterturbo","stars":88538,"install_command":"npx skills add harry0703/MoneyPrinterTurbo","trust_score":92,"audit_score":95},{"slug":"huginn-huginn","name":"Huginn","url":"https://www.openagentskill.com/skills/huginn-huginn","stars":49478,"install_command":"npx skills add huginn/huginn","trust_score":93,"audit_score":95},{"slug":"fastlane-fastlane","name":"Fastlane","url":"https://www.openagentskill.com/skills/fastlane-fastlane","stars":41664,"install_command":"npx skills add fastlane/fastlane","trust_score":92,"audit_score":95}],"machine_metadata":{"version":"openagentskill-agent-metadata-v2","skill":{"slug":"coasty-ai-open-computer-use","name":"Open Computer Use","description":"State of the Art 82% OSWorld Computer Using Agent, production-ready. Remote and Local! Setup using one API Key","category":"automation","url":"https://www.openagentskill.com/skills/coasty-ai-open-computer-use","repository":"https://github.com/coasty-ai/open-computer-use","github_repo":"coasty-ai/open-computer-use"},"suited_tasks":["Local desktop workflows","Claude Code teams","teams that value GitHub adoption signals","Navigate local resources","Run repeatable desktop actions","Verify file outputs","Inspect source files","Explain architecture"],"suited_agents":["TypeScript","Computer Use","Codex","Claude Code","Cursor","OpenAgentSkill CLI","CLI"],"install":{"command":"npx skills add coasty-ai/open-computer-use","ready":true,"targets":[{"id":"openagentskill-cli","label":"CLI","kind":"command","value":"npx skills add coasty-ai/open-computer-use"},{"id":"codex","label":"Codex","kind":"agent-prompt","value":"Install the \"Open Computer Use\" agent skill from https://github.com/coasty-ai/open-computer-use. Read its SKILL.md or equivalent instructions first, install only the files needed for this workspace, and summarize any required setup before using it. Skill purpose: State of the Art 82% OSWorld Computer Using Agent, production-ready. Remote and Local! Setup using one API Key"},{"id":"claude-code","label":"Claude Code","kind":"agent-prompt","value":"Add \"Open Computer Use\" as a Claude Code skill from https://github.com/coasty-ai/open-computer-use. Inspect the skill instructions, place the reusable skill files in the appropriate local skills location for this project, and report the activation steps. Skill purpose: State of the Art 82% OSWorld Computer Using Agent, production-ready. Remote and Local! Setup using one API Key"},{"id":"cursor","label":"Cursor","kind":"agent-prompt","value":"Turn \"Open Computer Use\" from https://github.com/coasty-ai/open-computer-use into a reusable Cursor project rule or agent instruction. Preserve the core workflow, adapt paths to this repo, and keep the rule scoped to tasks where it is relevant. Skill purpose: State of the Art 82% OSWorld Computer Using Agent, production-ready. Remote and Local! Setup using one API Key"}],"handoff_url":"https://www.openagentskill.com/api/skills/coasty-ai-open-computer-use/install","manifest_url":"https://www.openagentskill.com/api/registry/manifest/coasty-ai-open-computer-use"},"trust":{"score":79,"label":"Strong shortlist","version":"trust-score-v4","install_policy":"human_review_before_install","evidence":{"stars":"762 GitHub stars","repoActivity":"762 stars, 94 forks","lastPushed":"19d since push","license":"Apache-2.0","repository":"https://github.com/coasty-ai/open-computer-use","install":"npx skills add coasty-ai/open-computer-use","installSafety":"standard package or runtime install path","permissionSurface":"secrets or environment access, filesystem or document access","documentation":"Strong README/SKILL.md context","agentOutcomes":"No agent outcome data yet"},"outcome_evidence":{"total":0,"successes":0,"failures":0,"not_relevant":0,"success_rate":null,"recent_success_rate":null,"recent_failure_rate":null,"install_attempts":0,"install_success_rate":null,"risk_blocked":0,"setup_required":0,"avg_output_quality":null,"production_outcomes":0,"last_outcome_at":null,"label":"No agent outcome data yet"},"auto_install":{"allowed":false,"sandbox_required":true,"reason":"Human review or sandbox validation is required before automatic installation."},"best_for":["automation","computer-use","desktop-agent","agent","agentic-framework","ai"],"known_risks":["Quality score needs review","Permission surface needs review: secrets or environment access, filesystem or document access","Permission surface: secrets or environment access, filesystem or document access"]},"agent_proven":{"version":"agent-proven-v1","score":0,"tier":"unproven","label":"Needs first agent run","summary":"No agent outcome reports yet. Use Resolve, run one narrow sandbox task, then report the result.","metrics":{"totalOutcomes":0,"successfulOutcomes":0,"failedOutcomes":0,"installAttempts":0,"installSuccessRate":null,"successRate":null,"recentSuccessRate":null,"recentFailureRate":null,"riskBlocked":0,"setupRequired":0,"notRelevant":0,"avgOutputQuality":null,"avgTimeToUsefulMs":null,"productionOutcomes":0,"humanReviewRequired":0,"uniqueAgents":0,"lastOutcomeAt":null},"signals":[],"penalties":["No real agent outcome evidence yet"]},"audit":{"score":86,"risk_level":"needs_review","risk_label":"Needs review","warnings":["Permission surface may require sandboxing","Quality score needs review","Permission surface needs review: secrets or environment access, filesystem or document access","Permission surface: secrets or environment access, filesystem or document access"]},"safety_gate":{"tier":"reviewed","label":"Reviewed with permission notes","auto_install_policy":"review","auto_install_allowed":false,"human_review_required":true,"blocked":false,"recommended_action":"Require human approval before installing into a real workspace."},"quality":{"score":86,"label":"Excellent"},"supply":{"track":"Coding and developer agents","scenario":"Coding agents","maintenance":"19d since push","risk":"Needs review"},"alternative_skills":[{"slug":"harry0703-moneyprinterturbo","name":"MoneyPrinterTurbo","url":"https://www.openagentskill.com/skills/harry0703-moneyprinterturbo","stars":88538,"install_command":"npx skills add harry0703/MoneyPrinterTurbo","trust_score":92,"audit_score":95},{"slug":"huginn-huginn","name":"Huginn","url":"https://www.openagentskill.com/skills/huginn-huginn","stars":49478,"install_command":"npx skills add huginn/huginn","trust_score":93,"audit_score":95},{"slug":"fastlane-fastlane","name":"Fastlane","url":"https://www.openagentskill.com/skills/fastlane-fastlane","stars":41664,"install_command":"npx skills add fastlane/fastlane","trust_score":92,"audit_score":95}],"do_not_use_when":["teams that need a vendor-supported SLA","high-compliance environments without internal security review","No major risk signals from current metadata","High-risk permission hints: Secrets or environment access","Permission surface may require sandboxing","Quality score needs review","Permission surface needs review: secrets or environment access, filesystem or document access","Permission surface: secrets or environment access, filesystem or document access"],"agent_contract":{"task_input":"Evaluate Open Computer Use before installing it in an AI agent workflow","recommended_action":"Require human approval before installing into a real workspace.","install_policy":"review","minimum_review_before_use":["Trust: 79/100 Strong shortlist","Audit: 86/100 Needs review","Safety: 58/100 Review before install","Review repository, license, install command, and permission surface before production use."],"expected_agent_output":{"selected_skill":"coasty-ai-open-computer-use (Open Computer Use)","install_command":"npx skills add coasty-ai/open-computer-use","risk_summary":"Needs review; Reviewed with permission notes; Review before production","verification_result":"Report the smallest successful task, files touched, warnings, and any missing setup."}},"outcome_feedback":{"endpoint":"https://www.openagentskill.com/api/agent/outcome","method":"POST","requires_resolve_event_id":true,"event_id_source":"Use install_receipt.outcome_feedback.event_id or feedback.event_id returned by /api/agent/resolve for the current task.","expected_outcomes":["success","failed","not_relevant","blocked_by_risk","setup_required"],"payload_template":{"event_id":"<install_receipt.outcome_feedback.event_id or feedback.event_id from /api/agent/resolve>","skill_slug":"coasty-ai-open-computer-use","task":"Evaluate Open Computer Use before installing it in an AI agent workflow","agent":"codex","outcome":"success","install_used":true,"risk_blocked":false,"setup_required":false,"task_success":true,"output_quality":4,"error_type":null,"human_review_required":false,"workspace":"sandbox","time_to_useful_ms":120000,"notes":"Report the smallest successful task, setup friction, files touched, and risk notes."}},"endpoints":{"web":"https://www.openagentskill.com/skills/coasty-ai-open-computer-use","api":"https://www.openagentskill.com/api/agent/skills/coasty-ai-open-computer-use","audit":"https://www.openagentskill.com/skills/coasty-ai-open-computer-use/audit","eval":"https://www.openagentskill.com/api/agent/evals?slug=coasty-ai-open-computer-use&task=Evaluate%20Open%20Computer%20Use%20before%20installing%20it%20in%20an%20AI%20agent%20workflow&max_risk=medium","resolve":"https://www.openagentskill.com/api/agent/resolve?task=Evaluate%20Open%20Computer%20Use%20before%20installing%20it%20in%20an%20AI%20agent%20workflow&agent=codex&max_risk=medium","receipt":"https://www.openagentskill.com/api/agent/receipt?task=Evaluate%20Open%20Computer%20Use%20before%20installing%20it%20in%20an%20AI%20agent%20workflow&agent=codex&max_risk=medium&format=text","install":"https://www.openagentskill.com/api/skills/coasty-ai-open-computer-use/install","manifest":"https://www.openagentskill.com/api/registry/manifest/coasty-ai-open-computer-use"}},"endpoints":{"web":"https://www.openagentskill.com/skills/coasty-ai-open-computer-use","api":"https://www.openagentskill.com/api/agent/skills/coasty-ai-open-computer-use","eval":"https://www.openagentskill.com/api/agent/evals?slug=coasty-ai-open-computer-use","audit":"https://www.openagentskill.com/skills/coasty-ai-open-computer-use/audit","resolve":"https://www.openagentskill.com/api/agent/resolve?task=Evaluate%20Open%20Computer%20Use%20before%20installing%20it%20in%20an%20AI%20agent%20workflow&agent=codex&max_risk=medium"}},"meta":{"endpoint":"/api/agent/evals","mode":"skill_eval","purpose":"Pre-install eval contract for a single skill. Agents should read this before installing a reusable skill.","generated_at":"2026-07-03T23:14:13.525Z"}}