{"eval":{"version":"openagentskill-skill-eval-v1","slug":"composio","name":"Composio","generated_at":"2026-07-04T03:14:08.582Z","task_input":"Evaluate Composio before installing it in an AI agent workflow","status":"review","score":88,"risk_level":"medium","decision":{"recommendation":"manual_review","reason":"Review the audit page, then allow agent install in a sandboxed workflow.","auto_install_allowed":false,"policy":"review","human_review_required":true},"task_fit":{"score":70,"suited_tasks":["Browser automation workflows","Claude Code teams","teams that value GitHub adoption signals","Navigate pages","Click and type safely","Check visual and DOM state","Move data between tools","Transform files"],"suited_agents":["Claude","GPT-4","LangChain","CrewAI","AutoGPT","OpenClaw","Claude Code","OpenAI Agents"]},"install":{"command":"npx skills add ComposioHQ/composio","ready":true,"policy":"review","safety_label":"Review before install","targets":[{"id":"openagentskill-cli","label":"CLI","kind":"command","value":"npx skills add ComposioHQ/composio"},{"id":"codex","label":"Codex","kind":"agent-prompt","value":"Install the \"Composio\" agent skill from https://github.com/ComposioHQ/composio. Read its SKILL.md or equivalent instructions first, install only the files needed for this workspace, and summarize any required setup before using it. Skill purpose: Integration platform for AI agents with 250+ app connectors"},{"id":"claude-code","label":"Claude Code","kind":"agent-prompt","value":"Add \"Composio\" as a Claude Code skill from https://github.com/ComposioHQ/composio. Inspect the skill instructions, place the reusable skill files in the appropriate local skills location for this project, and report the activation steps. Skill purpose: Integration platform for AI agents with 250+ app connectors"},{"id":"cursor","label":"Cursor","kind":"agent-prompt","value":"Turn \"Composio\" from https://github.com/ComposioHQ/composio into a reusable Cursor project rule or agent instruction. Preserve the core workflow, adapt paths to this repo, and keep the rule scoped to tasks where it is relevant. Skill purpose: Integration platform for AI agents with 250+ app connectors"}]},"trust":{"score":88,"label":"Production candidate","version":"trust-score-v4","evidence":{"stars":"29K GitHub stars","repoActivity":"29K stars, 4.6K forks","lastPushed":"Pushed today","license":"MIT","repository":"https://github.com/ComposioHQ/composio","install":"npx skills add ComposioHQ/composio","installSafety":"standard package or runtime install path","permissionSurface":"network or browser access","documentation":"Thin public metadata","agentOutcomes":"No agent outcome data yet"}},"audit":{"score":93,"risk_level":"safe_to_try","risk_label":"Safe to try","warnings":["Documentation summary is thin","README/SKILL.md completeness: Public metadata needs stronger README/SKILL.md context"]},"safety_gate":{"score":81,"tier":"reviewed","label":"Reviewed","auto_install_policy":"review","blocked":false,"permission_hints":[{"id":"network","label":"Network access","reason":"Skill likely fetches remote pages, APIs, repositories, or external services.","severity":"medium"}],"policy_warnings":["Documentation summary is thin"]},"checks":[{"id":"task_fit","label":"Task fit","status":"warn","score":70,"required_for_auto_install":true,"detail":"Task fit is weak; compare alternatives before selecting.","evidence":["Evaluate Composio before installing it in an AI agent workflow","integrations","Browser automation workflows; Claude Code teams; teams that value GitHub adoption signals"]},{"id":"install_path","label":"Install path","status":"pass","score":92,"required_for_auto_install":true,"detail":"Install handoff is available.","evidence":["npx skills add ComposioHQ/composio"]},{"id":"install_safety","label":"Install command safety","status":"pass","score":92,"required_for_auto_install":true,"detail":"standard package or runtime install path","evidence":["npx skills add ComposioHQ/composio"]},{"id":"trust_score","label":"Trust score","status":"pass","score":88,"required_for_auto_install":true,"detail":"Strong OpenAgentSkill Trust Score across adoption, recent maintenance, license clarity, documentation, dependency/runtime risk, install safety, permission surface, and install availability.","evidence":["Production candidate","29K GitHub stars","MIT"]},{"id":"audit_score","label":"Audit score","status":"pass","score":93,"required_for_auto_install":true,"detail":"Safe to try","evidence":["Documentation summary is thin"]},{"id":"agent_safety_gate","label":"Agent safety gate","status":"warn","score":81,"required_for_auto_install":true,"detail":"Good audit and safety signals with no high-risk permission hints in public metadata.","evidence":["Review the audit page, then allow agent install in a sandboxed workflow.","Safe-to-try audit"]},{"id":"readme_skillmd_completeness","label":"README/SKILL.md completeness","status":"fail","score":50,"required_for_auto_install":false,"detail":"Public metadata needs stronger README/SKILL.md context","evidence":["Thin public metadata"]},{"id":"license_clarity","label":"License clarity","status":"pass","score":86,"required_for_auto_install":true,"detail":"MIT","evidence":["MIT"]},{"id":"recent_maintenance","label":"Recent maintenance","status":"pass","score":100,"required_for_auto_install":false,"detail":"Pushed today","evidence":["Pushed today"]},{"id":"permission_surface","label":"Permission surface","status":"pass","score":86,"required_for_auto_install":true,"detail":"network or browser access","evidence":["Network access: medium"]},{"id":"alternatives","label":"Alternatives available","status":"pass","score":82,"required_for_auto_install":false,"detail":"Alternative skills are available for comparison.","evidence":["josstorer-rwkv-runner","vmware-vsphere-automation-sdk-python"]}],"blockers":[],"warnings":["Task fit: Task fit is weak; compare alternatives before selecting.","Agent safety gate: Good audit and safety signals with no high-risk permission hints in public metadata.","Documentation summary is thin","README/SKILL.md completeness: Public metadata needs stronger README/SKILL.md context"],"validation_plan":["Inspect repository, README/SKILL.md, license, and recent commits before production use.","Install in an isolated workspace or sandbox with no production secrets available.","Run the smallest representative task and record files touched, commands run, network access, and outputs.","Compare the selected skill against at least one alternative when the eval status is review or failed.","Promote only after the agent reports a successful verification result and unresolved warnings are accepted."],"do_not_use_when":["teams that need a vendor-supported SLA","high-compliance environments without internal security review","No major risk signals from current metadata","Documentation summary is thin","README/SKILL.md completeness: Public metadata needs stronger README/SKILL.md context","Production credentials, payments, or irreversible account changes without explicit human review","Sensitive private data before reviewing repository code, license, and permission surface"],"alternatives":[{"slug":"josstorer-rwkv-runner","name":"RWKV Runner","url":"https://www.openagentskill.com/skills/josstorer-rwkv-runner","stars":6394,"install_command":"npx skills add josStorer/RWKV-Runner","trust_score":89,"audit_score":92},{"slug":"vmware-vsphere-automation-sdk-python","name":"Vsphere Automation Sdk Python","url":"https://www.openagentskill.com/skills/vmware-vsphere-automation-sdk-python","stars":798,"install_command":"npx skills add vmware/vsphere-automation-sdk-python","trust_score":81,"audit_score":84}],"machine_metadata":{"version":"openagentskill-agent-metadata-v2","skill":{"slug":"composio","name":"Composio","description":"Integration platform for AI agents with 250+ app connectors","category":"integrations","url":"https://www.openagentskill.com/skills/composio","repository":"https://github.com/ComposioHQ/composio","github_repo":"ComposioHQ/composio"},"suited_tasks":["Browser automation workflows","Claude Code teams","teams that value GitHub adoption signals","Navigate pages","Click and type safely","Check visual and DOM state","Move data between tools","Transform files"],"suited_agents":["Claude","GPT-4","LangChain","CrewAI","AutoGPT","OpenClaw","Claude Code","OpenAI Agents"],"install":{"command":"npx skills add ComposioHQ/composio","ready":true,"targets":[{"id":"openagentskill-cli","label":"CLI","kind":"command","value":"npx skills add ComposioHQ/composio"},{"id":"codex","label":"Codex","kind":"agent-prompt","value":"Install the \"Composio\" agent skill from https://github.com/ComposioHQ/composio. Read its SKILL.md or equivalent instructions first, install only the files needed for this workspace, and summarize any required setup before using it. Skill purpose: Integration platform for AI agents with 250+ app connectors"},{"id":"claude-code","label":"Claude Code","kind":"agent-prompt","value":"Add \"Composio\" as a Claude Code skill from https://github.com/ComposioHQ/composio. Inspect the skill instructions, place the reusable skill files in the appropriate local skills location for this project, and report the activation steps. Skill purpose: Integration platform for AI agents with 250+ app connectors"},{"id":"cursor","label":"Cursor","kind":"agent-prompt","value":"Turn \"Composio\" from https://github.com/ComposioHQ/composio into a reusable Cursor project rule or agent instruction. Preserve the core workflow, adapt paths to this repo, and keep the rule scoped to tasks where it is relevant. Skill purpose: Integration platform for AI agents with 250+ app connectors"}],"handoff_url":"https://www.openagentskill.com/api/skills/composio/install","manifest_url":"https://www.openagentskill.com/api/registry/manifest/composio"},"trust":{"score":88,"label":"Production candidate","version":"trust-score-v4","install_policy":"agent_install_candidate","evidence":{"stars":"29K GitHub stars","repoActivity":"29K stars, 4.6K forks","lastPushed":"Pushed today","license":"MIT","repository":"https://github.com/ComposioHQ/composio","install":"npx skills add ComposioHQ/composio","installSafety":"standard package or runtime install path","permissionSurface":"network or browser access","documentation":"Thin public metadata","agentOutcomes":"No agent outcome data yet"},"outcome_evidence":{"total":0,"successes":0,"failures":0,"not_relevant":0,"success_rate":null,"recent_success_rate":null,"recent_failure_rate":null,"install_attempts":0,"install_success_rate":null,"risk_blocked":0,"setup_required":0,"avg_output_quality":null,"production_outcomes":0,"last_outcome_at":null,"label":"No agent outcome data yet"},"auto_install":{"allowed":true,"sandbox_required":true,"reason":"Trust Score v4 allows sandbox-first agent installation after normal workspace review."},"best_for":["integrations","api","connectors","automation","Claude","GPT-4"],"known_risks":["Documentation summary is thin","README/SKILL.md completeness: Public metadata needs stronger README/SKILL.md context"]},"agent_proven":{"version":"agent-proven-v1","score":0,"tier":"unproven","label":"Needs first agent run","summary":"No agent outcome reports yet. Use Resolve, run one narrow sandbox task, then report the result.","metrics":{"totalOutcomes":0,"successfulOutcomes":0,"failedOutcomes":0,"installAttempts":0,"installSuccessRate":null,"successRate":null,"recentSuccessRate":null,"recentFailureRate":null,"riskBlocked":0,"setupRequired":0,"notRelevant":0,"avgOutputQuality":null,"avgTimeToUsefulMs":null,"productionOutcomes":0,"humanReviewRequired":0,"uniqueAgents":0,"lastOutcomeAt":null},"signals":[],"penalties":["No real agent outcome evidence yet"]},"audit":{"score":93,"risk_level":"safe_to_try","risk_label":"Safe to try","warnings":["Documentation summary is thin","README/SKILL.md completeness: Public metadata needs stronger README/SKILL.md context"]},"safety_gate":{"tier":"reviewed","label":"Reviewed","auto_install_policy":"review","auto_install_allowed":false,"human_review_required":true,"blocked":false,"recommended_action":"Review the audit page, then allow agent install in a sandboxed workflow."},"quality":{"score":100,"label":"Excellent"},"supply":{"track":"Coding and developer agents","scenario":"GitHub automation","maintenance":"Pushed today","risk":"Safe to try"},"alternative_skills":[{"slug":"josstorer-rwkv-runner","name":"RWKV Runner","url":"https://www.openagentskill.com/skills/josstorer-rwkv-runner","stars":6394,"install_command":"npx skills add josStorer/RWKV-Runner","trust_score":89,"audit_score":92},{"slug":"vmware-vsphere-automation-sdk-python","name":"Vsphere Automation Sdk Python","url":"https://www.openagentskill.com/skills/vmware-vsphere-automation-sdk-python","stars":798,"install_command":"npx skills add vmware/vsphere-automation-sdk-python","trust_score":81,"audit_score":84}],"do_not_use_when":["teams that need a vendor-supported SLA","high-compliance environments without internal security review","No major risk signals from current metadata","Documentation summary is thin","README/SKILL.md completeness: Public metadata needs stronger README/SKILL.md context","Production credentials, payments, or irreversible account changes without explicit human review","Sensitive private data before reviewing repository code, license, and permission surface"],"agent_contract":{"task_input":"Evaluate Composio before installing it in an AI agent workflow","recommended_action":"Review the audit page, then allow agent install in a sandboxed workflow.","install_policy":"review","minimum_review_before_use":["Trust: 88/100 Production candidate","Audit: 93/100 Safe to try","Safety: 81/100 Review before install","Review repository, license, install command, and permission surface before production use."],"expected_agent_output":{"selected_skill":"composio (Composio)","install_command":"npx skills add ComposioHQ/composio","risk_summary":"Safe to try; Reviewed; Review before production","verification_result":"Report the smallest successful task, files touched, warnings, and any missing setup."}},"outcome_feedback":{"endpoint":"https://www.openagentskill.com/api/agent/outcome","method":"POST","requires_resolve_event_id":true,"event_id_source":"Use install_receipt.outcome_feedback.event_id or feedback.event_id returned by /api/agent/resolve for the current task.","expected_outcomes":["success","failed","not_relevant","blocked_by_risk","setup_required"],"payload_template":{"event_id":"<install_receipt.outcome_feedback.event_id or feedback.event_id from /api/agent/resolve>","skill_slug":"composio","task":"Evaluate Composio before installing it in an AI agent workflow","agent":"codex","outcome":"success","install_used":true,"risk_blocked":false,"setup_required":false,"task_success":true,"output_quality":4,"error_type":null,"human_review_required":false,"workspace":"sandbox","time_to_useful_ms":120000,"notes":"Report the smallest successful task, setup friction, files touched, and risk notes."}},"endpoints":{"web":"https://www.openagentskill.com/skills/composio","api":"https://www.openagentskill.com/api/agent/skills/composio","audit":"https://www.openagentskill.com/skills/composio/audit","eval":"https://www.openagentskill.com/api/agent/evals?slug=composio&task=Evaluate%20Composio%20before%20installing%20it%20in%20an%20AI%20agent%20workflow&max_risk=medium","resolve":"https://www.openagentskill.com/api/agent/resolve?task=Evaluate%20Composio%20before%20installing%20it%20in%20an%20AI%20agent%20workflow&agent=codex&max_risk=medium","receipt":"https://www.openagentskill.com/api/agent/receipt?task=Evaluate%20Composio%20before%20installing%20it%20in%20an%20AI%20agent%20workflow&agent=codex&max_risk=medium&format=text","install":"https://www.openagentskill.com/api/skills/composio/install","manifest":"https://www.openagentskill.com/api/registry/manifest/composio"}},"endpoints":{"web":"https://www.openagentskill.com/skills/composio","api":"https://www.openagentskill.com/api/agent/skills/composio","eval":"https://www.openagentskill.com/api/agent/evals?slug=composio","audit":"https://www.openagentskill.com/skills/composio/audit","resolve":"https://www.openagentskill.com/api/agent/resolve?task=Evaluate%20Composio%20before%20installing%20it%20in%20an%20AI%20agent%20workflow&agent=codex&max_risk=medium"}},"meta":{"endpoint":"/api/agent/evals","mode":"skill_eval","purpose":"Pre-install eval contract for a single skill. Agents should read this before installing a reusable skill.","generated_at":"2026-07-04T03:14:08.582Z"}}