{"eval":{"version":"openagentskill-skill-eval-v1","slug":"e2b-dev-e2b","name":"E2B","generated_at":"2026-07-03T22:11:56.217Z","task_input":"Evaluate E2B before installing it in an AI agent workflow","status":"review","score":87,"risk_level":"medium","decision":{"recommendation":"manual_review","reason":"Require human approval before installing into a real workspace.","auto_install_allowed":false,"policy":"review","human_review_required":true},"task_fit":{"score":70,"suited_tasks":["Coding agents workflows","Claude Code teams","teams that value GitHub adoption signals","Inspect source files","Explain architecture","Patch bugs and verify changes","Inspect repository metadata","Compare code changes"],"suited_agents":["Python","Sandbox","Code Interpreter","Codex","Claude Code","Cursor","CLI"]},"install":{"command":"npx skills add e2b-dev/E2B","ready":true,"policy":"review","safety_label":"Review before install","targets":[{"id":"openagentskill-cli","label":"CLI","kind":"command","value":"npx skills add e2b-dev/E2B"},{"id":"codex","label":"Codex","kind":"agent-prompt","value":"Install the \"E2B\" agent skill from https://github.com/e2b-dev/E2B. Read its SKILL.md or equivalent instructions first, install only the files needed for this workspace, and summarize any required setup before using it. Skill purpose: Run agent code safely in cloud sandboxes"},{"id":"claude-code","label":"Claude Code","kind":"agent-prompt","value":"Add \"E2B\" as a Claude Code skill from https://github.com/e2b-dev/E2B. Inspect the skill instructions, place the reusable skill files in the appropriate local skills location for this project, and report the activation steps. Skill purpose: Run agent code safely in cloud sandboxes"},{"id":"cursor","label":"Cursor","kind":"agent-prompt","value":"Turn \"E2B\" from https://github.com/e2b-dev/E2B into a reusable Cursor project rule or agent instruction. Preserve the core workflow, adapt paths to this repo, and keep the rule scoped to tasks where it is relevant. Skill purpose: Run agent code safely in cloud sandboxes"}]},"trust":{"score":86,"label":"Production candidate","version":"trust-score-v4","evidence":{"stars":"13K GitHub stars","repoActivity":"13K stars, 957 forks","lastPushed":"1d since push","license":"Unknown","repository":"https://github.com/e2b-dev/E2B","install":"npx skills add e2b-dev/E2B","installSafety":"standard package or runtime install path","permissionSurface":"no high-risk permission surface in public metadata","documentation":"Thin public metadata","agentOutcomes":"No agent outcome data yet"}},"audit":{"score":91,"risk_level":"needs_review","risk_label":"Needs review","warnings":["License is unclear","Documentation summary is thin","License clarity: Unknown","README/SKILL.md completeness: Public metadata needs stronger README/SKILL.md context"]},"safety_gate":{"score":79,"tier":"reviewed","label":"Reviewed with permission notes","auto_install_policy":"review","blocked":false,"permission_hints":[{"id":"network","label":"Network access","reason":"Skill likely fetches remote pages, APIs, repositories, or external services.","severity":"medium"}],"policy_warnings":["License is unclear"]},"checks":[{"id":"task_fit","label":"Task fit","status":"warn","score":70,"required_for_auto_install":true,"detail":"Task fit is weak; compare alternatives before selecting.","evidence":["Evaluate E2B before installing it in an AI agent workflow","development","Coding agents workflows; Claude Code teams; teams that value GitHub adoption signals"]},{"id":"install_path","label":"Install path","status":"pass","score":92,"required_for_auto_install":true,"detail":"Install handoff is available.","evidence":["npx skills add e2b-dev/E2B"]},{"id":"install_safety","label":"Install command safety","status":"pass","score":92,"required_for_auto_install":true,"detail":"standard package or runtime install path","evidence":["npx skills add e2b-dev/E2B"]},{"id":"trust_score","label":"Trust score","status":"pass","score":86,"required_for_auto_install":true,"detail":"Strong OpenAgentSkill Trust Score across adoption, recent maintenance, license clarity, documentation, dependency/runtime risk, install safety, permission surface, and install availability.","evidence":["Production candidate","13K GitHub stars","Unknown"]},{"id":"audit_score","label":"Audit score","status":"warn","score":91,"required_for_auto_install":true,"detail":"Needs review","evidence":["License is unclear"]},{"id":"agent_safety_gate","label":"Agent safety gate","status":"warn","score":79,"required_for_auto_install":true,"detail":"Usable candidate, but the agent should surface permission and audit notes before installation.","evidence":["Require human approval before installing into a real workspace.","License is unclear"]},{"id":"readme_skillmd_completeness","label":"README/SKILL.md completeness","status":"fail","score":50,"required_for_auto_install":false,"detail":"Public metadata needs stronger README/SKILL.md context","evidence":["Thin public metadata"]},{"id":"license_clarity","label":"License clarity","status":"warn","score":42,"required_for_auto_install":true,"detail":"Unknown","evidence":["Unknown"]},{"id":"recent_maintenance","label":"Recent maintenance","status":"pass","score":100,"required_for_auto_install":false,"detail":"1d since push","evidence":["1d since push"]},{"id":"permission_surface","label":"Permission surface","status":"pass","score":100,"required_for_auto_install":true,"detail":"no high-risk permission surface in public metadata","evidence":["Network access: medium"]},{"id":"alternatives","label":"Alternatives available","status":"pass","score":82,"required_for_auto_install":false,"detail":"Alternative skills are available for comparison.","evidence":["google-gemini-gemini-cli","x1xhlol-system-prompts-and-models-of-ai-tools","juliusbrussee-caveman","sickn33-antigravity-awesome-skills"]}],"blockers":[],"warnings":["Task fit: Task fit is weak; compare alternatives before selecting.","Audit score: Needs review","Agent safety gate: Usable candidate, but the agent should surface permission and audit notes before installation.","License clarity: Unknown","License is unclear","Documentation summary is thin","README/SKILL.md completeness: Public metadata needs stronger README/SKILL.md context"],"validation_plan":["Inspect repository, README/SKILL.md, license, and recent commits before production use.","Install in an isolated workspace or sandbox with no production secrets available.","Run the smallest representative task and record files touched, commands run, network access, and outputs.","Compare the selected skill against at least one alternative when the eval status is review or failed.","Promote only after the agent reports a successful verification result and unresolved warnings are accepted."],"do_not_use_when":["teams that need a vendor-supported SLA","high-compliance environments without internal security review","No major risk signals from current metadata","License is unclear","Documentation summary is thin","License clarity: Unknown","README/SKILL.md completeness: Public metadata needs stronger README/SKILL.md context","Production credentials, payments, or irreversible account changes without explicit human review"],"alternatives":[{"slug":"google-gemini-gemini-cli","name":"Gemini CLI","url":"https://www.openagentskill.com/skills/google-gemini-gemini-cli","stars":105720,"install_command":"npx skills add google-gemini/gemini-cli","trust_score":83,"audit_score":89},{"slug":"x1xhlol-system-prompts-and-models-of-ai-tools","name":"System Prompts And Models Of AI Tools","url":"https://www.openagentskill.com/skills/x1xhlol-system-prompts-and-models-of-ai-tools","stars":141169,"install_command":"npx skills add x1xhlol/system-prompts-and-models-of-ai-tools","trust_score":94,"audit_score":96},{"slug":"juliusbrussee-caveman","name":"Caveman","url":"https://www.openagentskill.com/skills/juliusbrussee-caveman","stars":82837,"install_command":"npx skills add JuliusBrussee/caveman","trust_score":90,"audit_score":93},{"slug":"sickn33-antigravity-awesome-skills","name":"Antigravity Awesome Skills","url":"https://www.openagentskill.com/skills/sickn33-antigravity-awesome-skills","stars":42248,"install_command":"npx skills add sickn33/antigravity-awesome-skills","trust_score":88,"audit_score":91}],"machine_metadata":{"version":"openagentskill-agent-metadata-v2","skill":{"slug":"e2b-dev-e2b","name":"E2B","description":"Run agent code safely in cloud sandboxes","category":"development","url":"https://www.openagentskill.com/skills/e2b-dev-e2b","repository":"https://github.com/e2b-dev/E2B","github_repo":"e2b-dev/E2B"},"suited_tasks":["Coding agents workflows","Claude Code teams","teams that value GitHub adoption signals","Inspect source files","Explain architecture","Patch bugs and verify changes","Inspect repository metadata","Compare code changes"],"suited_agents":["Python","Sandbox","Code Interpreter","Codex","Claude Code","Cursor","CLI"],"install":{"command":"npx skills add e2b-dev/E2B","ready":true,"targets":[{"id":"openagentskill-cli","label":"CLI","kind":"command","value":"npx skills add e2b-dev/E2B"},{"id":"codex","label":"Codex","kind":"agent-prompt","value":"Install the \"E2B\" agent skill from https://github.com/e2b-dev/E2B. Read its SKILL.md or equivalent instructions first, install only the files needed for this workspace, and summarize any required setup before using it. Skill purpose: Run agent code safely in cloud sandboxes"},{"id":"claude-code","label":"Claude Code","kind":"agent-prompt","value":"Add \"E2B\" as a Claude Code skill from https://github.com/e2b-dev/E2B. Inspect the skill instructions, place the reusable skill files in the appropriate local skills location for this project, and report the activation steps. Skill purpose: Run agent code safely in cloud sandboxes"},{"id":"cursor","label":"Cursor","kind":"agent-prompt","value":"Turn \"E2B\" from https://github.com/e2b-dev/E2B into a reusable Cursor project rule or agent instruction. Preserve the core workflow, adapt paths to this repo, and keep the rule scoped to tasks where it is relevant. Skill purpose: Run agent code safely in cloud sandboxes"}],"handoff_url":"https://www.openagentskill.com/api/skills/e2b-dev-e2b/install","manifest_url":"https://www.openagentskill.com/api/registry/manifest/e2b-dev-e2b"},"trust":{"score":86,"label":"Production candidate","version":"trust-score-v4","install_policy":"human_review_before_install","evidence":{"stars":"13K GitHub stars","repoActivity":"13K stars, 957 forks","lastPushed":"1d since push","license":"Unknown","repository":"https://github.com/e2b-dev/E2B","install":"npx skills add e2b-dev/E2B","installSafety":"standard package or runtime install path","permissionSurface":"no high-risk permission surface in public metadata","documentation":"Thin public metadata","agentOutcomes":"No agent outcome data yet"},"outcome_evidence":{"total":0,"successes":0,"failures":0,"not_relevant":0,"success_rate":null,"recent_success_rate":null,"recent_failure_rate":null,"install_attempts":0,"install_success_rate":null,"risk_blocked":0,"setup_required":0,"avg_output_quality":null,"production_outcomes":0,"last_outcome_at":null,"label":"No agent outcome data yet"},"auto_install":{"allowed":false,"sandbox_required":true,"reason":"Human review or sandbox validation is required before automatic installation."},"best_for":["development","sandbox","code-execution","agents","Python","Code Interpreter"],"known_risks":["License is unclear","Documentation summary is thin","License clarity: Unknown","README/SKILL.md completeness: Public metadata needs stronger README/SKILL.md context"]},"agent_proven":{"version":"agent-proven-v1","score":0,"tier":"unproven","label":"Needs first agent run","summary":"No agent outcome reports yet. Use Resolve, run one narrow sandbox task, then report the result.","metrics":{"totalOutcomes":0,"successfulOutcomes":0,"failedOutcomes":0,"installAttempts":0,"installSuccessRate":null,"successRate":null,"recentSuccessRate":null,"recentFailureRate":null,"riskBlocked":0,"setupRequired":0,"notRelevant":0,"avgOutputQuality":null,"avgTimeToUsefulMs":null,"productionOutcomes":0,"humanReviewRequired":0,"uniqueAgents":0,"lastOutcomeAt":null},"signals":[],"penalties":["No real agent outcome evidence yet"]},"audit":{"score":91,"risk_level":"needs_review","risk_label":"Needs review","warnings":["License is unclear","Documentation summary is thin","License clarity: Unknown","README/SKILL.md completeness: Public metadata needs stronger README/SKILL.md context"]},"safety_gate":{"tier":"reviewed","label":"Reviewed with permission notes","auto_install_policy":"review","auto_install_allowed":false,"human_review_required":true,"blocked":false,"recommended_action":"Require human approval before installing into a real workspace."},"quality":{"score":100,"label":"Excellent"},"supply":{"track":"Coding and developer agents","scenario":"Coding agents","maintenance":"1d since push","risk":"Needs review"},"alternative_skills":[{"slug":"google-gemini-gemini-cli","name":"Gemini CLI","url":"https://www.openagentskill.com/skills/google-gemini-gemini-cli","stars":105720,"install_command":"npx skills add google-gemini/gemini-cli","trust_score":83,"audit_score":89},{"slug":"x1xhlol-system-prompts-and-models-of-ai-tools","name":"System Prompts And Models Of AI Tools","url":"https://www.openagentskill.com/skills/x1xhlol-system-prompts-and-models-of-ai-tools","stars":141169,"install_command":"npx skills add x1xhlol/system-prompts-and-models-of-ai-tools","trust_score":94,"audit_score":96},{"slug":"juliusbrussee-caveman","name":"Caveman","url":"https://www.openagentskill.com/skills/juliusbrussee-caveman","stars":82837,"install_command":"npx skills add JuliusBrussee/caveman","trust_score":90,"audit_score":93},{"slug":"sickn33-antigravity-awesome-skills","name":"Antigravity Awesome Skills","url":"https://www.openagentskill.com/skills/sickn33-antigravity-awesome-skills","stars":42248,"install_command":"npx skills add sickn33/antigravity-awesome-skills","trust_score":88,"audit_score":91}],"do_not_use_when":["teams that need a vendor-supported SLA","high-compliance environments without internal security review","No major risk signals from current metadata","License is unclear","Documentation summary is thin","License clarity: Unknown","README/SKILL.md completeness: Public metadata needs stronger README/SKILL.md context","Production credentials, payments, or irreversible account changes without explicit human review"],"agent_contract":{"task_input":"Evaluate E2B before installing it in an AI agent workflow","recommended_action":"Require human approval before installing into a real workspace.","install_policy":"review","minimum_review_before_use":["Trust: 86/100 Production candidate","Audit: 91/100 Needs review","Safety: 79/100 Review before install","Review repository, license, install command, and permission surface before production use."],"expected_agent_output":{"selected_skill":"e2b-dev-e2b (E2B)","install_command":"npx skills add e2b-dev/E2B","risk_summary":"Needs review; Reviewed with permission notes; Review before production","verification_result":"Report the smallest successful task, files touched, warnings, and any missing setup."}},"outcome_feedback":{"endpoint":"https://www.openagentskill.com/api/agent/outcome","method":"POST","requires_resolve_event_id":true,"event_id_source":"Use install_receipt.outcome_feedback.event_id or feedback.event_id returned by /api/agent/resolve for the current task.","expected_outcomes":["success","failed","not_relevant","blocked_by_risk","setup_required"],"payload_template":{"event_id":"<install_receipt.outcome_feedback.event_id or feedback.event_id from /api/agent/resolve>","skill_slug":"e2b-dev-e2b","task":"Evaluate E2B before installing it in an AI agent workflow","agent":"codex","outcome":"success","install_used":true,"risk_blocked":false,"setup_required":false,"task_success":true,"output_quality":4,"error_type":null,"human_review_required":false,"workspace":"sandbox","time_to_useful_ms":120000,"notes":"Report the smallest successful task, setup friction, files touched, and risk notes."}},"endpoints":{"web":"https://www.openagentskill.com/skills/e2b-dev-e2b","api":"https://www.openagentskill.com/api/agent/skills/e2b-dev-e2b","audit":"https://www.openagentskill.com/skills/e2b-dev-e2b/audit","eval":"https://www.openagentskill.com/api/agent/evals?slug=e2b-dev-e2b&task=Evaluate%20E2B%20before%20installing%20it%20in%20an%20AI%20agent%20workflow&max_risk=medium","resolve":"https://www.openagentskill.com/api/agent/resolve?task=Evaluate%20E2B%20before%20installing%20it%20in%20an%20AI%20agent%20workflow&agent=codex&max_risk=medium","receipt":"https://www.openagentskill.com/api/agent/receipt?task=Evaluate%20E2B%20before%20installing%20it%20in%20an%20AI%20agent%20workflow&agent=codex&max_risk=medium&format=text","install":"https://www.openagentskill.com/api/skills/e2b-dev-e2b/install","manifest":"https://www.openagentskill.com/api/registry/manifest/e2b-dev-e2b"}},"endpoints":{"web":"https://www.openagentskill.com/skills/e2b-dev-e2b","api":"https://www.openagentskill.com/api/agent/skills/e2b-dev-e2b","eval":"https://www.openagentskill.com/api/agent/evals?slug=e2b-dev-e2b","audit":"https://www.openagentskill.com/skills/e2b-dev-e2b/audit","resolve":"https://www.openagentskill.com/api/agent/resolve?task=Evaluate%20E2B%20before%20installing%20it%20in%20an%20AI%20agent%20workflow&agent=codex&max_risk=medium"}},"meta":{"endpoint":"/api/agent/evals","mode":"skill_eval","purpose":"Pre-install eval contract for a single skill. Agents should read this before installing a reusable skill.","generated_at":"2026-07-03T22:11:56.217Z"}}